script/dom/servoparser/
xml.rs

1/* This Source Code Form is subject to the terms of the Mozilla Public
2 * License, v. 2.0. If a copy of the MPL was not distributed with this
3 * file, You can obtain one at https://mozilla.org/MPL/2.0/. */
4
5#![cfg_attr(crown, allow(crown::unrooted_must_root))]
6
7use std::cell::Cell;
8
9use markup5ever::TokenizerResult;
10use script_bindings::trace::CustomTraceable;
11use servo_url::ServoUrl;
12use xml5ever::buffer_queue::BufferQueue;
13use xml5ever::tokenizer::XmlTokenizer;
14use xml5ever::tree_builder::XmlTreeBuilder;
15
16use crate::dom::bindings::inheritance::Castable;
17use crate::dom::bindings::root::{Dom, DomRoot};
18use crate::dom::document::Document;
19use crate::dom::html::htmlscriptelement::HTMLScriptElement;
20use crate::dom::node::Node;
21use crate::dom::servoparser::{ParsingAlgorithm, Sink};
22
23#[derive(JSTraceable, MallocSizeOf)]
24#[cfg_attr(crown, crown::unrooted_must_root_lint::must_root)]
25pub(crate) struct Tokenizer {
26    #[ignore_malloc_size_of = "Defined in xml5ever"]
27    inner: XmlTokenizer<XmlTreeBuilder<Dom<Node>, Sink>>,
28}
29
30impl Tokenizer {
31    pub(crate) fn new(document: &Document, url: ServoUrl) -> Self {
32        let sink = Sink {
33            base_url: url,
34            document: Dom::from_ref(document),
35            current_line: Cell::new(1),
36            script: Default::default(),
37            parsing_algorithm: ParsingAlgorithm::Normal,
38            custom_element_reaction_stack: document.custom_element_reaction_stack(),
39        };
40
41        let tb = XmlTreeBuilder::new(sink, Default::default());
42        let tok = XmlTokenizer::new(tb, Default::default());
43
44        Tokenizer { inner: tok }
45    }
46
47    pub(crate) fn feed(&self, input: &BufferQueue) -> TokenizerResult<DomRoot<HTMLScriptElement>> {
48        loop {
49            match self.inner.run(input) {
50                TokenizerResult::Done => return TokenizerResult::Done,
51                TokenizerResult::Script(handle) => {
52                    // Apparently the parser can sometimes create <script> elements without a namespace, resulting
53                    // in them not being HTMLScriptElements.
54                    if let Some(script) = handle.downcast::<HTMLScriptElement>() {
55                        return TokenizerResult::Script(DomRoot::from_ref(script));
56                    }
57                },
58            }
59        }
60    }
61
62    pub(crate) fn end(&self) {
63        self.inner.end()
64    }
65
66    pub(crate) fn url(&self) -> &ServoUrl {
67        &self.inner.sink.sink.base_url
68    }
69}