aboutsummaryrefslogtreecommitdiff
path: root/src/reader/parser/inside_opening_tag.rs
blob: b7f185acf213a55fa104bd09ca6d0c4aca81dec3 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
use crate::reader::error::SyntaxError;
use crate::common::is_name_start_char;
use crate::namespace;
use crate::{attribute::OwnedAttribute, common::is_whitespace_char};

use crate::reader::lexer::Token;

use super::{OpeningTagSubstate, PullParser, QualifiedNameTarget, Result, State};

impl PullParser {
    /// Processes one lexer token while the parser is inside an opening tag.
    ///
    /// `s` selects which part of the tag is currently being read:
    ///
    /// * `InsideName` – the element name is being accumulated via `read_qualified_name`.
    /// * `InsideTag` – between attributes: whitespace is skipped, a name-start
    ///   character begins an attribute name, `TagEnd`/`EmptyTagEnd` finish the tag.
    /// * `InsideAttributeName` – an attribute name is being accumulated.
    /// * `AfterAttributeName` – whitespace after an attribute name, waiting for `=`.
    /// * `InsideAttributeValue` – the attribute value is being read; once complete it
    ///   is recorded as a namespace declaration or as a regular attribute.
    /// * `AfterAttributeValue` – right after a value: whitespace or the end of the tag.
    ///
    /// Returns `None` directly when whitespace is skipped; every other path returns
    /// whatever the invoked helper (`emit_start_element`, `into_state_continue`,
    /// `read_qualified_name`, `read_attribute_value`) produces, or `Some(self.error(..))`
    /// for a token that is not allowed in the current substate.
    pub fn inside_opening_tag(&mut self, t: Token, s: OpeningTagSubstate) -> Option<Result> {
        match s {
            OpeningTagSubstate::InsideName => self.read_qualified_name(t, QualifiedNameTarget::OpeningTagNameTarget, |this, token, name| {
                match name.prefix_ref() {
                    // element names must not use the reserved `NS_XML_PREFIX`/`NS_XMLNS_PREFIX` prefixes
                    Some(prefix) if prefix == namespace::NS_XML_PREFIX ||
                                    prefix == namespace::NS_XMLNS_PREFIX =>
                        Some(this.error(SyntaxError::InvalidNamePrefix(prefix.into()))),
                    _ => {
                        // the callback owns `name` and does not use it again, so it is moved, not cloned
                        this.data.element_name = Some(name);
                        match token {
                            Token::TagEnd => this.emit_start_element(false),
                            Token::EmptyTagEnd => this.emit_start_element(true),
                            Token::Character(c) if is_whitespace_char(c) => this.into_state_continue(State::InsideOpeningTag(OpeningTagSubstate::InsideTag)),
                            // presumably `read_qualified_name` only invokes the callback on the
                            // delimiters handled above -- verify against its implementation
                            _ => unreachable!()
                        }
                    }
                }
            }),

            OpeningTagSubstate::InsideTag => match t {
                Token::TagEnd => self.emit_start_element(false),
                Token::EmptyTagEnd => self.emit_start_element(true),
                Token::Character(c) if is_whitespace_char(c) => None,  // skip whitespace
                Token::Character(c) if is_name_start_char(c) => {
                    // first character of an attribute name; the rest is read in `InsideAttributeName`
                    self.buf.push(c);
                    self.into_state_continue(State::InsideOpeningTag(OpeningTagSubstate::InsideAttributeName))
                }
                _ => Some(self.error(SyntaxError::UnexpectedTokenInOpeningTag(t)))
            },

            OpeningTagSubstate::InsideAttributeName => self.read_qualified_name(t, QualifiedNameTarget::AttributeNameTarget, |this, token, name| {
                // remember the name until its value has been read
                this.data.attr_name = Some(name);
                match token {
                    Token::EqualsSign => this.into_state_continue(State::InsideOpeningTag(OpeningTagSubstate::InsideAttributeValue)),
                    Token::Character(c) if is_whitespace_char(c) => this.into_state_continue(State::InsideOpeningTag(OpeningTagSubstate::AfterAttributeName)),
                    // presumably the callback is only invoked on `=` or whitespace -- verify
                    // against `read_qualified_name`
                    _ => unreachable!()
                }
            }),

            OpeningTagSubstate::AfterAttributeName => match t {
                Token::EqualsSign => self.into_state_continue(State::InsideOpeningTag(OpeningTagSubstate::InsideAttributeValue)),
                Token::Character(c) if is_whitespace_char(c) => None,  // skip whitespace before `=`
                _ => Some(self.error(SyntaxError::UnexpectedTokenInOpeningTag(t)))
            },

            OpeningTagSubstate::InsideAttributeValue => self.read_attribute_value(t, |this, value| {
                // the name was stored by the `InsideAttributeName` substate, so this will always succeed here
                let name = this.data.take_attr_name()?;

                // check that no attribute with such name is already present
                // if there is one, XML is not well-formed
                // NOTE(review): only `this.data.attributes` is consulted; namespace declarations
                // are stored in `this.nst` instead, so a repeated `xmlns`/`xmlns:*` declaration
                // is not caught by this check -- confirm whether it is rejected elsewhere.
                if this.data.attributes.iter().any(|a| a.name == name) {  // TODO: looks bad
                    // TODO: ideally this error should point to the beginning of the attribute,
                    // TODO: not the end of its value
                    return Some(this.error(SyntaxError::RedefinedAttribute(name.to_string().into())));
                }

                match name.prefix_ref() {
                    // declaring a new prefix; it is sufficient to check prefix only
                    // because "xmlns" prefix is reserved
                    Some(namespace::NS_XMLNS_PREFIX) => {
                        let ln = &*name.local_name;
                        if ln == namespace::NS_XMLNS_PREFIX {
                            Some(this.error(SyntaxError::CannotRedefineXmlnsPrefix))
                        } else if ln == namespace::NS_XML_PREFIX && &*value != namespace::NS_XML_URI {
                            Some(this.error(SyntaxError::CannotRedefineXmlPrefix))
                        } else if value.is_empty() {
                            Some(this.error(SyntaxError::CannotUndefinePrefix(ln.into())))
                        } else {
                            // `name` is still borrowed through `ln` above, hence the clone of the local part
                            this.nst.put(name.local_name.clone(), value);
                            this.into_state_continue(State::InsideOpeningTag(OpeningTagSubstate::AfterAttributeValue))
                        }
                    }

                    // declaring default namespace
                    None if &*name.local_name == namespace::NS_XMLNS_PREFIX =>
                        match &*value {
                            // the reserved prefixes and URIs are rejected as a default namespace
                            namespace::NS_XMLNS_PREFIX | namespace::NS_XML_PREFIX | namespace::NS_XML_URI | namespace::NS_XMLNS_URI =>
                                Some(this.error(SyntaxError::InvalidDefaultNamespace(value.into()))),
                            _ => {
                                // `value` is not used after this point, so it is moved, not cloned
                                this.nst.put(namespace::NS_NO_PREFIX, value);
                                this.into_state_continue(State::InsideOpeningTag(OpeningTagSubstate::AfterAttributeValue))
                            }
                        },

                    // regular attribute
                    _ => {
                        // both `name` and `value` are consumed here; no clone is needed
                        this.data.attributes.push(OwnedAttribute { name, value });
                        this.into_state_continue(State::InsideOpeningTag(OpeningTagSubstate::AfterAttributeValue))
                    }
                }
            }),

            OpeningTagSubstate::AfterAttributeValue => match t {
                // whitespace is required before the next attribute can start
                Token::Character(c) if is_whitespace_char(c) => self.into_state_continue(State::InsideOpeningTag(OpeningTagSubstate::InsideTag)),
                Token::TagEnd => self.emit_start_element(false),
                Token::EmptyTagEnd => self.emit_start_element(true),
                _ => Some(self.error(SyntaxError::UnexpectedTokenInOpeningTag(t)))
            },
        }
    }
}