1use std::borrow::Cow;
6use std::cell::{Cell, RefCell};
7use std::mem;
8use std::rc::Rc;
9
10use base64::Engine as _;
11use base64::engine::general_purpose;
12use content_security_policy::sandboxing_directive::SandboxingFlagSet;
13use devtools_traits::ScriptToDevtoolsControlMsg;
14use dom_struct::dom_struct;
15use embedder_traits::resources::{self, Resource};
16use encoding_rs::{Encoding, UTF_8};
17use html5ever::buffer_queue::BufferQueue;
18use html5ever::tendril::StrTendril;
19use html5ever::tree_builder::{ElementFlags, NodeOrText, QuirksMode, TreeSink};
20use html5ever::{Attribute, ExpandedName, LocalName, QualName, local_name, ns};
21use hyper_serde::Serde;
22use js::context::JSContext;
23use markup5ever::TokenizerResult;
24use mime::{self, Mime};
25use net_traits::mime_classifier::{ApacheBugFlag, MediaType, MimeClassifier, NoSniffFlag};
26use net_traits::policy_container::PolicyContainer;
27use net_traits::request::RequestId;
28use net_traits::{
29 FetchMetadata, LoadContext, Metadata, NetworkError, ReferrerPolicy, ResourceFetchTiming,
30};
31use profile_traits::time::{
32 ProfilerCategory, ProfilerChan, TimerMetadata, TimerMetadataFrameType, TimerMetadataReflowType,
33};
34use profile_traits::time_profile;
35use script_bindings::cell::DomRefCell;
36use script_bindings::reflector::{Reflector, reflect_dom_object};
37use script_bindings::script_runtime::temp_cx;
38use script_traits::DocumentActivity;
39use servo_base::id::{PipelineId, WebViewId};
40use servo_config::pref;
41use servo_constellation_traits::{LoadOrigin, TargetSnapshotParams};
42use servo_url::{MutableOrigin, ServoUrl};
43use style::context::QuirksMode as ServoQuirksMode;
44use tendril::stream::LossyDecoder;
45use tendril::{ByteTendril, TendrilSink};
46
47use crate::document_loader::{DocumentLoader, LoadType};
48use crate::dom::bindings::codegen::Bindings::DocumentBinding::{
49 DocumentMethods, DocumentReadyState,
50};
51use crate::dom::bindings::codegen::Bindings::HTMLImageElementBinding::HTMLImageElementMethods;
52use crate::dom::bindings::codegen::Bindings::HTMLMediaElementBinding::HTMLMediaElementMethods;
53use crate::dom::bindings::codegen::Bindings::HTMLTemplateElementBinding::HTMLTemplateElementMethods;
54use crate::dom::bindings::codegen::Bindings::NodeBinding::NodeMethods;
55use crate::dom::bindings::codegen::Bindings::ShadowRootBinding::{
56 ShadowRootMode, SlotAssignmentMode,
57};
58use crate::dom::bindings::inheritance::Castable;
59use crate::dom::bindings::refcounted::Trusted;
60use crate::dom::bindings::reflector::DomGlobal;
61use crate::dom::bindings::root::{Dom, DomRoot, MutNullableDom};
62use crate::dom::bindings::settings_stack::is_execution_stack_empty;
63use crate::dom::bindings::str::{DOMString, USVString};
64use crate::dom::characterdata::CharacterData;
65use crate::dom::comment::Comment;
66use crate::dom::csp::{Violation, parse_csp_list_from_metadata};
67use crate::dom::customelementregistry::CustomElementReactionStack;
68use crate::dom::document::{Document, DocumentSource, HasBrowsingContext, IsHTMLDocument};
69use crate::dom::documentfragment::DocumentFragment;
70use crate::dom::documenttype::DocumentType;
71use crate::dom::element::{CustomElementCreationMode, Element, ElementCreator};
72use crate::dom::globalscope::GlobalScope;
73use crate::dom::html::htmlformelement::{FormControlElementHelpers, HTMLFormElement};
74use crate::dom::html::htmlimageelement::HTMLImageElement;
75use crate::dom::html::htmlscriptelement::{HTMLScriptElement, ScriptResult};
76use crate::dom::html::htmltemplateelement::HTMLTemplateElement;
77use crate::dom::iterators::ShadowIncluding;
78use crate::dom::node::Node;
79use crate::dom::performance::performanceentry::PerformanceEntry;
80use crate::dom::performance::performancenavigationtiming::PerformanceNavigationTiming;
81use crate::dom::processinginstruction::ProcessingInstruction;
82use crate::dom::processingoptions::{
83 LinkHeader, LinkProcessingPhase, extract_links_from_headers, process_link_headers,
84};
85use crate::dom::reporting::reportingendpoint::ReportingEndpoint;
86use crate::dom::security::csp::CspReporting;
87use crate::dom::security::xframeoptions::check_a_navigation_response_adherence_to_x_frame_options;
88use crate::dom::shadowroot::IsUserAgentWidget;
89use crate::dom::text::Text;
90use crate::dom::types::{HTMLElement, HTMLMediaElement, HTMLOptionElement};
91use crate::dom::virtualmethods::vtable_for;
92use crate::navigation::determine_the_origin;
93use crate::network_listener::FetchResponseListener;
94use crate::realms::{enter_auto_realm, enter_realm};
95use crate::script_runtime::{CanGc, IntroductionType};
96use crate::script_thread::ScriptThread;
97
98mod async_html;
99pub(crate) mod encoding;
100pub(crate) mod html;
101mod prefetch;
102mod xml;
103
104use encoding::{NetworkDecoderState, NetworkSink};
105pub(crate) use html::serialize_html_fragment;
106
107#[dom_struct]
108pub(crate) struct ServoParser {
121 reflector: Reflector,
122 document: Dom<Document>,
124 network_decoder: DomRefCell<NetworkDecoderState>,
126 #[ignore_malloc_size_of = "Defined in html5ever"]
128 #[no_trace]
129 network_input: BufferQueue,
130 #[ignore_malloc_size_of = "Defined in html5ever"]
132 #[no_trace]
133 script_input: BufferQueue,
134 tokenizer: Tokenizer,
136 last_chunk_received: Cell<bool>,
138 suspended: Cell<bool>,
140 script_nesting_level: Cell<usize>,
142 aborted: Cell<bool>,
144 stopped: Cell<bool>,
146 script_created_parser: bool,
148 #[no_trace]
153 prefetch_decoder: RefCell<LossyDecoder<NetworkSink>>,
154 prefetch_tokenizer: prefetch::Tokenizer,
158 #[ignore_malloc_size_of = "Defined in html5ever"]
159 #[no_trace]
160 prefetch_input: BufferQueue,
161 content_for_devtools: Option<DomRefCell<String>>,
164}
165
166pub(crate) struct ElementAttribute {
167 name: QualName,
168 value: DOMString,
169}
170
171#[derive(Clone, Copy, JSTraceable, MallocSizeOf, PartialEq)]
172pub(crate) enum ParsingAlgorithm {
173 Normal,
174 Fragment,
175}
176
177impl ElementAttribute {
178 pub(crate) fn new(name: QualName, value: DOMString) -> ElementAttribute {
179 ElementAttribute { name, value }
180 }
181}
182
183impl ServoParser {
184 pub(crate) fn parser_is_not_active(&self) -> bool {
185 self.can_write()
186 }
187
188 pub(crate) fn parse_html_document(
190 cx: &mut JSContext,
191 document: &Document,
192 input: Option<DOMString>,
193 url: ServoUrl,
194 encoding_hint_from_content_type: Option<&'static Encoding>,
195 encoding_of_container_document: Option<&'static Encoding>,
196 ) {
197 assert!(document.is_html_document());
201
202 let parser = ServoParser::new(
204 document,
205 if pref!(dom_servoparser_async_html_tokenizer_enabled) {
206 Tokenizer::AsyncHtml(self::async_html::Tokenizer::new(document, url, None))
207 } else {
208 Tokenizer::Html(self::html::Tokenizer::new(
209 document,
210 url,
211 None,
212 ParsingAlgorithm::Normal,
213 ))
214 },
215 ParserKind::Normal,
216 encoding_hint_from_content_type,
217 encoding_of_container_document,
218 CanGc::from_cx(cx),
219 );
220
221 if let Some(input) = input {
227 parser.parse_complete_string_chunk(cx, String::from(input));
228 } else {
229 parser.document.set_current_parser(Some(&parser));
230 }
231 }
232
233 pub(crate) fn parse_html_fragment<'el>(
235 cx: &mut JSContext,
236 context: &'el Element,
237 input: DOMString,
238 allow_declarative_shadow_roots: bool,
239 ) -> impl Iterator<Item = DomRoot<Node>> + use<'el> {
240 let context_node = context.upcast::<Node>();
241 let context_document = context_node.owner_doc();
242 let window = context_document.window();
243 let url = context_document.url();
244
245 let loader = DocumentLoader::new_with_threads(
247 context_document.loader().resource_threads().clone(),
248 Some(url.clone()),
249 );
250 let document = Document::new(
251 window,
252 HasBrowsingContext::No,
253 Some(url.clone()),
254 context_document.about_base_url(),
255 context_document.origin().clone(),
256 IsHTMLDocument::HTMLDocument,
257 None,
258 None,
259 DocumentActivity::Inactive,
260 DocumentSource::FromParser,
261 loader,
262 None,
263 None,
264 Default::default(),
265 false,
266 allow_declarative_shadow_roots,
267 Some(context_document.insecure_requests_policy()),
268 context_document.has_trustworthy_ancestor_or_current_origin(),
269 context_document.custom_element_reaction_stack(),
270 context_document.creation_sandboxing_flag_set(),
271 CanGc::from_cx(cx),
272 );
273
274 document.set_quirks_mode(context_document.quirks_mode());
278
279 let form = context_node
286 .inclusive_ancestors(ShadowIncluding::No)
287 .find(|element| element.is::<HTMLFormElement>());
288
289 let fragment_context = FragmentContext {
290 context_elem: context_node,
291 form_elem: form.as_deref(),
292 context_element_allows_scripting: context_document.scripting_enabled(),
293 };
294
295 let parser = ServoParser::new(
296 &document,
297 Tokenizer::Html(self::html::Tokenizer::new(
298 &document,
299 url,
300 Some(fragment_context),
301 ParsingAlgorithm::Fragment,
302 )),
303 ParserKind::Normal,
304 None,
305 None,
306 CanGc::from_cx(cx),
307 );
308 parser.parse_complete_string_chunk(cx, String::from(input));
309
310 let root_element = document.GetDocumentElement().expect("no document element");
312 FragmentParsingResult {
313 inner: root_element.upcast::<Node>().children(),
314 }
315 }
316
317 pub(crate) fn parse_html_script_input(document: &Document, url: ServoUrl) {
318 let parser = ServoParser::new(
319 document,
320 if pref!(dom_servoparser_async_html_tokenizer_enabled) {
321 Tokenizer::AsyncHtml(self::async_html::Tokenizer::new(document, url, None))
322 } else {
323 Tokenizer::Html(self::html::Tokenizer::new(
324 document,
325 url,
326 None,
327 ParsingAlgorithm::Normal,
328 ))
329 },
330 ParserKind::ScriptCreated,
331 None,
332 None,
333 CanGc::deprecated_note(),
334 );
335 document.set_current_parser(Some(&parser));
336 }
337
338 pub(crate) fn parse_xml_document(
339 cx: &mut JSContext,
340 document: &Document,
341 input: Option<DOMString>,
342 url: ServoUrl,
343 encoding_hint_from_content_type: Option<&'static Encoding>,
344 ) {
345 let parser = ServoParser::new(
346 document,
347 Tokenizer::Xml(self::xml::Tokenizer::new(document, url)),
348 ParserKind::Normal,
349 encoding_hint_from_content_type,
350 None,
351 CanGc::from_cx(cx),
352 );
353
354 if let Some(input) = input {
356 parser.parse_complete_string_chunk(cx, String::from(input));
357 } else {
358 parser.document.set_current_parser(Some(&parser));
359 }
360 }
361
362 pub(crate) fn script_nesting_level(&self) -> usize {
363 self.script_nesting_level.get()
364 }
365
366 pub(crate) fn is_script_created(&self) -> bool {
367 self.script_created_parser
368 }
369
370 pub(crate) fn resume_with_pending_parsing_blocking_script(
385 &self,
386 cx: &mut JSContext,
387 script: &HTMLScriptElement,
388 result: ScriptResult,
389 ) {
390 assert!(self.suspended.get());
391 self.suspended.set(false);
392
393 self.script_input.swap_with(&self.network_input);
394 while let Some(chunk) = self.script_input.pop_front() {
395 self.network_input.push_back(chunk);
396 }
397
398 let script_nesting_level = self.script_nesting_level.get();
399 assert_eq!(script_nesting_level, 0);
400
401 self.script_nesting_level.set(script_nesting_level + 1);
402 script.execute(cx, result);
403 self.script_nesting_level.set(script_nesting_level);
404
405 if !self.suspended.get() && !self.aborted.get() {
406 self.parse_sync(cx);
407 }
408 }
409
410 pub(crate) fn can_write(&self) -> bool {
411 self.script_created_parser || self.script_nesting_level.get() > 0
412 }
413
414 pub(crate) fn write(&self, cx: &mut JSContext, text: DOMString) {
416 assert!(self.can_write());
417
418 if self.document.has_pending_parsing_blocking_script() {
419 self.script_input.push_back(String::from(text).into());
423 return;
424 }
425
426 assert!(self.script_input.is_empty());
430
431 let input = BufferQueue::default();
432 input.push_back(String::from(text).into());
433
434 let profiler_chan = self
435 .document
436 .window()
437 .as_global_scope()
438 .time_profiler_chan()
439 .clone();
440 let profiler_metadata = TimerMetadata {
441 url: self.document.url().as_str().into(),
442 iframe: TimerMetadataFrameType::RootWindow,
443 incremental: TimerMetadataReflowType::FirstReflow,
444 };
445 self.tokenize(cx, |cx, tokenizer| {
446 tokenizer.feed(cx, &input, profiler_chan.clone(), profiler_metadata.clone())
447 });
448
449 if self.suspended.get() {
450 while let Some(chunk) = input.pop_front() {
454 self.script_input.push_back(chunk);
455 }
456 return;
457 }
458
459 assert!(input.is_empty());
460 }
461
462 pub(crate) fn close(&self, cx: &mut JSContext) {
464 assert!(self.script_created_parser);
465
466 self.last_chunk_received.set(true);
468
469 if self.suspended.get() {
471 return;
472 }
473
474 self.parse_sync(cx);
477 }
478
479 pub(crate) fn abort(&self, cx: &mut JSContext) {
481 assert!(!self.aborted.get());
482 self.aborted.set(true);
483
484 self.script_input.replace_with(BufferQueue::default());
486 self.network_input.replace_with(BufferQueue::default());
487
488 self.document
490 .set_ready_state(cx, DocumentReadyState::Interactive);
491
492 self.tokenizer.end(cx);
494 self.document.set_current_parser(None);
495
496 self.document
498 .set_ready_state(cx, DocumentReadyState::Complete);
499 }
500
501 pub(crate) fn get_current_line(&self) -> u32 {
502 self.tokenizer.get_current_line()
503 }
504
505 #[cfg_attr(crown, expect(crown::unrooted_must_root))]
506 fn new_inherited(
507 document: &Document,
508 tokenizer: Tokenizer,
509 kind: ParserKind,
510 encoding_hint_from_content_type: Option<&'static Encoding>,
511 encoding_of_container_document: Option<&'static Encoding>,
512 ) -> Self {
513 let content_for_devtools = (document.global().devtools_chan().is_some() &&
517 document.has_browsing_context())
518 .then_some(DomRefCell::new(String::new()));
519
520 ServoParser {
521 reflector: Reflector::new(),
522 document: Dom::from_ref(document),
523 network_decoder: DomRefCell::new(NetworkDecoderState::new(
524 encoding_hint_from_content_type,
525 encoding_of_container_document,
526 )),
527 network_input: BufferQueue::default(),
528 script_input: BufferQueue::default(),
529 tokenizer,
530 last_chunk_received: Cell::new(false),
531 suspended: Default::default(),
532 script_nesting_level: Default::default(),
533 aborted: Default::default(),
534 stopped: Default::default(),
535 script_created_parser: kind == ParserKind::ScriptCreated,
536 prefetch_decoder: RefCell::new(LossyDecoder::new_encoding_rs(
537 encoding_hint_from_content_type.unwrap_or(UTF_8),
538 Default::default(),
539 )),
540 prefetch_tokenizer: prefetch::Tokenizer::new(document),
541 prefetch_input: BufferQueue::default(),
542 content_for_devtools,
543 }
544 }
545
546 #[cfg_attr(crown, expect(crown::unrooted_must_root))]
547 fn new(
548 document: &Document,
549 tokenizer: Tokenizer,
550 kind: ParserKind,
551 encoding_hint_from_content_type: Option<&'static Encoding>,
552 encoding_of_container_document: Option<&'static Encoding>,
553 can_gc: CanGc,
554 ) -> DomRoot<Self> {
555 reflect_dom_object(
556 Box::new(ServoParser::new_inherited(
557 document,
558 tokenizer,
559 kind,
560 encoding_hint_from_content_type,
561 encoding_of_container_document,
562 )),
563 document.window(),
564 can_gc,
565 )
566 }
567
568 fn push_tendril_input_chunk(&self, chunk: StrTendril) {
569 if let Some(mut content_for_devtools) = self
570 .content_for_devtools
571 .as_ref()
572 .map(|content| content.borrow_mut())
573 {
574 content_for_devtools.push_str(chunk.as_ref());
576 }
577
578 if chunk.is_empty() {
579 return;
580 }
581
582 self.network_input.push_back(chunk);
585 }
586
587 fn push_bytes_input_chunk(&self, chunk: Vec<u8>) {
588 if let Some(decoded_chunk) = self
590 .network_decoder
591 .borrow_mut()
592 .push(&chunk, &self.document)
593 {
594 self.push_tendril_input_chunk(decoded_chunk);
595 }
596
597 if self.should_prefetch() {
598 let mut prefetch_decoder = self.prefetch_decoder.borrow_mut();
604 prefetch_decoder.process(ByteTendril::from(&*chunk));
605
606 self.prefetch_input
607 .push_back(mem::take(&mut prefetch_decoder.inner_sink_mut().output));
608 self.prefetch_tokenizer.feed(&self.prefetch_input);
609 }
610 }
611
612 fn should_prefetch(&self) -> bool {
613 self.document.browsing_context().is_some()
621 }
622
623 fn push_string_input_chunk(&self, chunk: String) {
624 let chunk = StrTendril::from(chunk);
627 self.push_tendril_input_chunk(chunk);
628 }
629
630 fn parse_sync(&self, cx: &mut JSContext) {
631 assert!(self.script_input.is_empty());
632
633 if self.last_chunk_received.get() {
637 let chunk = self.network_decoder.borrow_mut().finish(&self.document);
638 if !chunk.is_empty() {
639 self.push_tendril_input_chunk(chunk);
640 }
641 }
642
643 if self.aborted.get() {
644 return;
645 }
646
647 let profiler_chan = self
648 .document
649 .window()
650 .as_global_scope()
651 .time_profiler_chan()
652 .clone();
653 let profiler_metadata = TimerMetadata {
654 url: self.document.url().as_str().into(),
655 iframe: TimerMetadataFrameType::RootWindow,
656 incremental: TimerMetadataReflowType::FirstReflow,
657 };
658 self.tokenize(cx, |cx, tokenizer| {
659 tokenizer.feed(
660 cx,
661 &self.network_input,
662 profiler_chan.clone(),
663 profiler_metadata.clone(),
664 )
665 });
666
667 if self.suspended.get() {
668 return;
669 }
670
671 assert!(self.network_input.is_empty());
672
673 if self.last_chunk_received.get() {
674 self.finish(cx);
675 }
676 }
677
678 fn parse_complete_string_chunk(&self, cx: &mut JSContext, input: String) {
679 self.document.set_current_parser(Some(self));
680 self.push_string_input_chunk(input);
681 self.last_chunk_received.set(true);
682 if !self.suspended.get() {
683 self.parse_sync(cx);
684 }
685 }
686
687 fn parse_bytes_chunk(&self, cx: &mut JSContext, input: Vec<u8>) {
688 let _realm = enter_realm(&*self.document);
689 self.document.set_current_parser(Some(self));
690 self.push_bytes_input_chunk(input);
691 if !self.suspended.get() {
692 self.parse_sync(cx);
693 }
694 }
695
696 fn tokenize<F>(&self, cx: &mut JSContext, feed: F)
697 where
698 F: Fn(&mut JSContext, &Tokenizer) -> TokenizerResult<DomRoot<HTMLScriptElement>>,
699 {
700 loop {
701 assert!(!self.suspended.get());
702 assert!(!self.aborted.get());
703
704 self.document.window().reflow_if_reflow_timer_expired(cx);
705 let script = match feed(cx, &self.tokenizer) {
706 TokenizerResult::Done => return,
707 TokenizerResult::EncodingIndicator(_) => continue,
708 TokenizerResult::Script(script) => script,
709 };
710
711 if is_execution_stack_empty() {
718 self.document.window().perform_a_microtask_checkpoint(cx);
719 }
720
721 let script_nesting_level = self.script_nesting_level.get();
722
723 self.script_nesting_level.set(script_nesting_level + 1);
724 script.set_initial_script_text();
725 let introduction_type_override =
726 (script_nesting_level > 0).then_some(IntroductionType::INJECTED_SCRIPT);
727 script.prepare(cx, introduction_type_override);
728 self.script_nesting_level.set(script_nesting_level);
729
730 if self.document.has_pending_parsing_blocking_script() {
731 self.suspended.set(true);
732 return;
733 }
734 if self.aborted.get() {
735 return;
736 }
737 }
738 }
739
740 pub(crate) fn has_aborted(&self) -> bool {
742 self.aborted.get()
743 }
744
745 pub(crate) fn has_stopped(&self) -> bool {
747 self.stopped.get()
748 }
749
750 fn finish(&self, cx: &mut JSContext) {
752 assert!(!self.suspended.get());
753 assert!(self.last_chunk_received.get());
754 assert!(self.script_input.is_empty());
755 assert!(self.network_input.is_empty());
756 assert!(self.network_decoder.borrow().is_finished());
757
758 self.stopped.set(true);
759
760 self.document.set_current_parser(None);
766
767 self.document
769 .set_ready_state(cx, DocumentReadyState::Interactive);
770
771 self.tokenizer.end(cx);
773
774 let url = self.tokenizer.url().clone();
776 self.document.finish_load(LoadType::PageSource(url), cx);
777
778 if let Some(content_for_devtools) = self
780 .content_for_devtools
781 .as_ref()
782 .map(|content| content.take())
783 {
784 let global = self.document.global();
785 let chan = global.devtools_chan().expect("Guaranteed by new");
786 let pipeline_id = self.document.global().pipeline_id();
787 let _ = chan.send(ScriptToDevtoolsControlMsg::UpdateSourceContent(
788 pipeline_id,
789 content_for_devtools,
790 ));
791 }
792 }
793}
794
795struct FragmentParsingResult<I>
796where
797 I: Iterator<Item = DomRoot<Node>>,
798{
799 inner: I,
800}
801
802impl<I> Iterator for FragmentParsingResult<I>
803where
804 I: Iterator<Item = DomRoot<Node>>,
805{
806 type Item = DomRoot<Node>;
807
808 #[expect(unsafe_code)]
809 fn next(&mut self) -> Option<DomRoot<Node>> {
810 let mut cx = unsafe { script_bindings::script_runtime::temp_cx() };
811 let cx = &mut cx;
812
813 let next = self.inner.next()?;
814 next.remove_self(cx);
815 Some(next)
816 }
817
818 fn size_hint(&self) -> (usize, Option<usize>) {
819 self.inner.size_hint()
820 }
821}
822
823#[derive(JSTraceable, MallocSizeOf, PartialEq)]
824enum ParserKind {
825 Normal,
826 ScriptCreated,
827}
828
829#[derive(JSTraceable, MallocSizeOf)]
830#[cfg_attr(crown, crown::unrooted_must_root_lint::must_root)]
831enum Tokenizer {
832 Html(self::html::Tokenizer),
833 AsyncHtml(self::async_html::Tokenizer),
834 Xml(self::xml::Tokenizer),
835}
836
837impl Tokenizer {
838 fn feed(
839 &self,
840 cx: &mut JSContext,
841 input: &BufferQueue,
842 profiler_chan: ProfilerChan,
843 profiler_metadata: TimerMetadata,
844 ) -> TokenizerResult<DomRoot<HTMLScriptElement>> {
845 match *self {
846 Tokenizer::Html(ref tokenizer) => time_profile!(
847 ProfilerCategory::ScriptParseHTML,
848 Some(profiler_metadata),
849 profiler_chan,
850 || tokenizer.feed(input),
851 ),
852 Tokenizer::AsyncHtml(ref tokenizer) => time_profile!(
853 ProfilerCategory::ScriptParseHTML,
854 Some(profiler_metadata),
855 profiler_chan,
856 || tokenizer.feed(input, cx),
857 ),
858 Tokenizer::Xml(ref tokenizer) => time_profile!(
859 ProfilerCategory::ScriptParseXML,
860 Some(profiler_metadata),
861 profiler_chan,
862 || tokenizer.feed(input),
863 ),
864 }
865 }
866
867 fn end(&self, cx: &mut JSContext) {
868 match *self {
869 Tokenizer::Html(ref tokenizer) => tokenizer.end(),
870 Tokenizer::AsyncHtml(ref tokenizer) => tokenizer.end(cx),
871 Tokenizer::Xml(ref tokenizer) => tokenizer.end(),
872 }
873 }
874
875 fn url(&self) -> &ServoUrl {
876 match *self {
877 Tokenizer::Html(ref tokenizer) => tokenizer.url(),
878 Tokenizer::AsyncHtml(ref tokenizer) => tokenizer.url(),
879 Tokenizer::Xml(ref tokenizer) => tokenizer.url(),
880 }
881 }
882
883 fn set_plaintext_state(&self) {
884 match *self {
885 Tokenizer::Html(ref tokenizer) => tokenizer.set_plaintext_state(),
886 Tokenizer::AsyncHtml(ref tokenizer) => tokenizer.set_plaintext_state(),
887 Tokenizer::Xml(_) => unimplemented!(),
888 }
889 }
890
891 fn get_current_line(&self) -> u32 {
892 match *self {
893 Tokenizer::Html(ref tokenizer) => tokenizer.get_current_line(),
894 Tokenizer::AsyncHtml(ref tokenizer) => tokenizer.get_current_line(),
895 Tokenizer::Xml(ref tokenizer) => tokenizer.get_current_line(),
896 }
897 }
898}
899
900struct NavigationParams {
904 policy_container: PolicyContainer,
906 content_type: Option<Mime>,
908 link_headers: Vec<LinkHeader>,
910 final_sandboxing_flag_set: SandboxingFlagSet,
912 resource_header: Vec<u8>,
914 about_base_url: Option<ServoUrl>,
916}
917
918pub(crate) struct ParserContext {
921 parser: Option<Trusted<ServoParser>>,
923 is_synthesized_document: bool,
925 has_loaded_document: bool,
927 webview_id: WebViewId,
929 pipeline_id: PipelineId,
931 url: ServoUrl,
933 pushed_entry_index: Option<usize>,
935 navigation_params: NavigationParams,
937 parent_info: Option<PipelineId>,
939 target_snapshot_params: TargetSnapshotParams,
940 load_origin: LoadOrigin,
941}
942
943impl ParserContext {
944 pub(crate) fn new(
945 webview_id: WebViewId,
946 pipeline_id: PipelineId,
947 url: ServoUrl,
948 creation_sandboxing_flag_set: SandboxingFlagSet,
949 parent_info: Option<PipelineId>,
950 target_snapshot_params: TargetSnapshotParams,
951 load_origin: LoadOrigin,
952 ) -> ParserContext {
953 ParserContext {
954 parser: None,
955 is_synthesized_document: false,
956 has_loaded_document: false,
957 webview_id,
958 pipeline_id,
959 url,
960 parent_info,
961 pushed_entry_index: None,
962 navigation_params: NavigationParams {
963 policy_container: Default::default(),
964 content_type: None,
965 link_headers: vec![],
966 final_sandboxing_flag_set: creation_sandboxing_flag_set,
967 resource_header: vec![],
968 about_base_url: Default::default(),
969 },
970 target_snapshot_params,
971 load_origin,
972 }
973 }
974
975 pub(crate) fn set_policy_container(&mut self, policy_container: Option<&PolicyContainer>) {
976 let Some(policy_container) = policy_container else {
977 return;
978 };
979 self.navigation_params.policy_container = policy_container.clone();
980 }
981
982 pub(crate) fn set_about_base_url(&mut self, about_base_url: Option<ServoUrl>) {
983 self.navigation_params.about_base_url = about_base_url;
984 }
985
986 pub(crate) fn get_document(&self) -> Option<DomRoot<Document>> {
987 self.parser
988 .as_ref()
989 .map(|parser| parser.root().document.as_rooted())
990 }
991
992 pub(crate) fn parent_info(&self) -> Option<PipelineId> {
993 self.parent_info
994 }
995
996 fn create_policy_container_from_fetch_response(metadata: &Metadata) -> PolicyContainer {
998 PolicyContainer {
1005 csp_list: parse_csp_list_from_metadata(&metadata.headers),
1007 embedder_policy: Default::default(),
1011 referrer_policy: ReferrerPolicy::parse_header_for_response(&metadata.headers),
1013 }
1014 }
1015
1016 fn initialize_document_object(&self, document: &Document) {
1018 document.set_policy_container(self.navigation_params.policy_container.clone());
1020 document.set_active_sandboxing_flag_set(self.navigation_params.final_sandboxing_flag_set);
1021 document.set_about_base_url(self.navigation_params.about_base_url.clone());
1022 process_link_headers(
1024 &self.navigation_params.link_headers,
1025 document,
1026 LinkProcessingPhase::PreMedia,
1027 );
1028 }
1029
1030 fn process_link_headers_in_media_phase_with_task(&mut self, document: &Document) {
1032 let link_headers = std::mem::take(&mut self.navigation_params.link_headers);
1036 if !link_headers.is_empty() {
1037 let window = document.window();
1038 let document = Trusted::new(document);
1039 window
1040 .upcast::<GlobalScope>()
1041 .task_manager()
1042 .networking_task_source()
1043 .queue(task!(process_link_headers_task: move || {
1044 process_link_headers(&link_headers, &document.root(), LinkProcessingPhase::Media);
1045 }));
1046 }
1047 }
1048
1049 fn load_document(&mut self, cx: &mut JSContext) {
1051 assert!(!self.has_loaded_document);
1052 self.has_loaded_document = true;
1053 let Some(ref parser) = self.parser.as_ref().map(|p| p.root()) else {
1054 return;
1055 };
1056 let content_type = &self.navigation_params.content_type;
1058 let mime_type = MimeClassifier::default().classify(
1059 LoadContext::Browsing,
1060 NoSniffFlag::Off,
1061 ApacheBugFlag::from_content_type(content_type.as_ref()),
1062 content_type,
1063 &self.navigation_params.resource_header,
1064 );
1065 let Some(media_type) = MimeClassifier::get_media_type(&mime_type) else {
1069 let page = format!(
1070 "<html><body><p>Unknown content type ({}).</p></body></html>",
1071 &mime_type,
1072 );
1073 self.load_inline_unknown_content(cx, parser, page);
1074 return;
1075 };
1076 match media_type {
1077 MediaType::Html => self.load_html_document(parser),
1079 MediaType::Xml => self.load_xml_document(parser),
1081 MediaType::JavaScript | MediaType::Text | MediaType::Css => {
1083 self.load_text_document(cx, parser)
1084 },
1085 MediaType::Json => self.load_json_document(cx, parser),
1087 MediaType::Image | MediaType::AudioVideo => {
1089 self.load_media_document(cx, parser, media_type, &mime_type);
1090 return;
1091 },
1092 MediaType::Font => {
1093 let page = format!(
1094 "<html><body><p>Unable to load font with content type ({}).</p></body></html>",
1095 &mime_type,
1096 );
1097 self.load_inline_unknown_content(cx, parser, page);
1098 return;
1099 },
1100 };
1101
1102 parser.parse_bytes_chunk(
1103 cx,
1104 std::mem::take(&mut self.navigation_params.resource_header),
1105 );
1106 }
1107
1108 fn load_html_document(&mut self, parser: &ServoParser) {
1110 self.initialize_document_object(&parser.document);
1113 self.process_link_headers_in_media_phase_with_task(&parser.document);
1117 }
1118
1119 fn load_xml_document(&mut self, parser: &ServoParser) {
1121 self.initialize_document_object(&parser.document);
1127 self.process_link_headers_in_media_phase_with_task(&parser.document);
1131 }
1132
1133 fn load_text_document(&mut self, cx: &mut JSContext, parser: &ServoParser) {
1135 self.initialize_document_object(&parser.document);
1138 let page = "<pre>\n".into();
1145 parser.push_string_input_chunk(page);
1146 parser.parse_sync(cx);
1147 parser.tokenizer.set_plaintext_state();
1148 self.process_link_headers_in_media_phase_with_task(&parser.document);
1152 }
1153
1154 fn load_media_document(
1156 &mut self,
1157 cx: &mut JSContext,
1158 parser: &ServoParser,
1159 media_type: MediaType,
1160 mime_type: &Mime,
1161 ) {
1162 self.initialize_document_object(&parser.document);
1165 self.is_synthesized_document = true;
1167 parser.last_chunk_received.set(true);
1168 let page = "<html><body></body></html>".into();
1170 parser.push_string_input_chunk(page);
1171 parser.parse_sync(cx);
1172
1173 let doc = &parser.document;
1174 let node = if media_type == MediaType::Image {
1177 let img = Element::create(
1178 cx,
1179 QualName::new(None, ns!(html), local_name!("img")),
1180 None,
1181 doc,
1182 ElementCreator::ParserCreated(1),
1183 CustomElementCreationMode::Asynchronous,
1184 None,
1185 );
1186 let img = DomRoot::downcast::<HTMLImageElement>(img).unwrap();
1187 img.SetSrc(cx, USVString(self.url.to_string()));
1188 DomRoot::upcast::<Node>(img)
1189 } else if mime_type.type_() == mime::AUDIO {
1190 let audio = Element::create(
1191 cx,
1192 QualName::new(None, ns!(html), local_name!("audio")),
1193 None,
1194 doc,
1195 ElementCreator::ParserCreated(1),
1196 CustomElementCreationMode::Asynchronous,
1197 None,
1198 );
1199 let audio = DomRoot::downcast::<HTMLMediaElement>(audio).unwrap();
1200 audio.SetControls(cx, true);
1201 audio.SetSrc(cx, USVString(self.url.to_string()));
1202 DomRoot::upcast::<Node>(audio)
1203 } else {
1204 let video = Element::create(
1205 cx,
1206 QualName::new(None, ns!(html), local_name!("video")),
1207 None,
1208 doc,
1209 ElementCreator::ParserCreated(1),
1210 CustomElementCreationMode::Asynchronous,
1211 None,
1212 );
1213 let video = DomRoot::downcast::<HTMLMediaElement>(video).unwrap();
1214 video.SetControls(cx, true);
1215 video.SetSrc(cx, USVString(self.url.to_string()));
1216 DomRoot::upcast::<Node>(video)
1217 };
1218 let doc_body = DomRoot::upcast::<Node>(doc.GetBody().unwrap());
1220 doc_body.AppendChild(cx, &node).expect("Appending failed");
1221 let link_headers = std::mem::take(&mut self.navigation_params.link_headers);
1223 process_link_headers(&link_headers, doc, LinkProcessingPhase::Media);
1224 }
1225
1226 fn load_json_document(&mut self, cx: &mut JSContext, parser: &ServoParser) {
1228 self.initialize_document_object(&parser.document);
1229 parser.push_string_input_chunk(resources::read_string(Resource::JsonViewerHTML));
1230 parser.parse_sync(cx);
1231 parser.tokenizer.set_plaintext_state();
1232 self.process_link_headers_in_media_phase_with_task(&parser.document);
1233 }
1234
1235 fn load_inline_unknown_content(
1237 &mut self,
1238 cx: &mut JSContext,
1239 parser: &ServoParser,
1240 page: String,
1241 ) {
1242 self.is_synthesized_document = true;
1243 parser.document.mark_as_internal();
1244 parser.push_string_input_chunk(page);
1245 parser.last_chunk_received.set(true);
1247 parser.parse_sync(cx);
1248 }
1249
1250 fn submit_resource_timing(&mut self) {
1252 let Some(parser) = self.parser.as_ref() else {
1253 return;
1254 };
1255 let parser = parser.root();
1256 if parser.aborted.get() {
1257 return;
1258 }
1259
1260 let document = &parser.document;
1261
1262 let performance_entry = PerformanceNavigationTiming::new(
1263 &document.global(),
1264 document,
1265 CanGc::deprecated_note(),
1266 );
1267 self.pushed_entry_index = document
1268 .global()
1269 .performance()
1270 .queue_entry(performance_entry.upcast::<PerformanceEntry>());
1271 }
1272}
1273
1274impl FetchResponseListener for ParserContext {
1275 fn process_request_body(&mut self, _: RequestId) {}
1276
1277 fn process_response(
1280 &mut self,
1281 cx: &mut JSContext,
1282 _: RequestId,
1283 meta_result: Result<FetchMetadata, NetworkError>,
1284 ) {
1285 let (metadata, mut error) = match meta_result {
1286 Ok(meta) => (
1287 Some(match meta {
1288 FetchMetadata::Unfiltered(m) => m,
1289 FetchMetadata::Filtered { unsafe_, .. } => unsafe_,
1290 }),
1291 None,
1292 ),
1293 Err(error) => (
1294 match &error {
1296 NetworkError::LoadCancelled => {
1297 return;
1298 },
1299 _ => {
1300 let mut meta = Metadata::default(self.url.clone());
1301 let mime: Option<Mime> = "text/html".parse().ok();
1302 meta.set_content_type(mime.as_ref());
1303 Some(meta)
1304 },
1305 },
1306 Some(error),
1307 ),
1308 };
1309 let content_type: Option<Mime> = metadata
1310 .clone()
1311 .and_then(|meta| meta.content_type)
1312 .map(Serde::into_inner)
1313 .map(Into::into);
1314
1315 let (policy_container, endpoints_list, link_headers) = match metadata.as_ref() {
1320 None => (PolicyContainer::default(), None, vec![]),
1321 Some(metadata) => (
1322 Self::create_policy_container_from_fetch_response(metadata),
1323 ReportingEndpoint::parse_reporting_endpoints_header(
1324 &self.url.clone(),
1325 &metadata.headers,
1326 ),
1327 extract_links_from_headers(&metadata.headers),
1328 ),
1329 };
1330
1331 let final_sandboxing_flag_set = policy_container
1335 .csp_list
1336 .as_ref()
1337 .and_then(|csp| csp.get_sandboxing_flag_set_for_document())
1338 .unwrap_or(SandboxingFlagSet::empty())
1339 .union(self.target_snapshot_params.sandboxing_flags);
1340
1341 let source_origin = match self.load_origin {
1345 LoadOrigin::Script(ref snapshot) => {
1346 Some(MutableOrigin::from_snapshot(snapshot.clone()))
1347 },
1348 _ => None,
1349 };
1350 let origin = determine_the_origin(
1351 metadata.as_ref().map(|metadata| &metadata.final_url),
1352 final_sandboxing_flag_set,
1353 source_origin,
1354 );
1355
1356 let parser = match ScriptThread::page_headers_available(
1357 self.webview_id,
1358 self.pipeline_id,
1359 metadata.as_ref(),
1360 origin.clone(),
1361 cx,
1362 ) {
1363 Some(parser) => parser,
1364 None => return,
1365 };
1366 if parser.aborted.get() {
1367 return;
1368 }
1369
1370 let mut realm = enter_auto_realm(cx, &*parser.document);
1371 let cx = &mut realm;
1372 let document = &parser.document;
1373 let window = document.window();
1374
1375 if
1378 policy_container.csp_list.should_navigation_response_to_navigation_request_be_blocked(
1385 window,
1386 self.url.clone().into_url(),
1387 &origin.immutable().clone().into_url_origin(),
1388 )
1389 || !check_a_navigation_response_adherence_to_x_frame_options(
1397 window,
1398 policy_container.csp_list.as_ref(),
1399 &origin,
1400 metadata
1401 .as_ref()
1402 .and_then(|metadata| metadata.headers.as_ref()),
1403 ) {
1404 error = Some(NetworkError::ContentSecurityPolicy);
1408 document.make_document_unsalvageable();
1410 }
1415
1416 if let Some(endpoints) = endpoints_list {
1417 window.set_endpoints_list(endpoints);
1418 }
1419 self.parser = Some(Trusted::new(&*parser));
1420 self.navigation_params = NavigationParams {
1421 policy_container,
1422 content_type,
1423 final_sandboxing_flag_set,
1424 link_headers,
1425 about_base_url: document.about_base_url(),
1426 resource_header: vec![],
1427 };
1428 self.submit_resource_timing();
1429
1430 if let Some(error) = error {
1438 let page = match error {
1439 NetworkError::SslValidation(reason, bytes) => {
1440 let page = resources::read_string(Resource::BadCertHTML);
1441 let page = page.replace("${reason}", &reason);
1442 let encoded_bytes = general_purpose::STANDARD_NO_PAD.encode(bytes);
1443 let page = page.replace("${bytes}", encoded_bytes.as_str());
1444 page.replace("${secret}", &net_traits::PRIVILEGED_SECRET.to_string())
1445 },
1446 NetworkError::BlobURLStoreError(reason) |
1447 NetworkError::WebsocketConnectionFailure(reason) |
1448 NetworkError::HttpError(reason) |
1449 NetworkError::ResourceLoadError(reason) |
1450 NetworkError::MimeType(reason) => {
1451 let page = resources::read_string(Resource::NetErrorHTML);
1452 page.replace("${reason}", &reason)
1453 },
1454 NetworkError::Crash(details) => {
1455 let page = resources::read_string(Resource::CrashHTML);
1456 page.replace("${details}", &details)
1457 },
1458 NetworkError::UnsupportedScheme |
1459 NetworkError::CorsGeneral |
1460 NetworkError::CrossOriginResponse |
1461 NetworkError::CorsCredentials |
1462 NetworkError::CorsAllowMethods |
1463 NetworkError::CorsAllowHeaders |
1464 NetworkError::CorsMethod |
1465 NetworkError::CorsAuthorization |
1466 NetworkError::CorsHeaders |
1467 NetworkError::ConnectionFailure |
1468 NetworkError::RedirectError |
1469 NetworkError::TooManyRedirects |
1470 NetworkError::TooManyInFlightKeepAliveRequests |
1471 NetworkError::InvalidMethod |
1472 NetworkError::ContentSecurityPolicy |
1473 NetworkError::Nosniff |
1474 NetworkError::SubresourceIntegrity |
1475 NetworkError::MixedContent |
1476 NetworkError::CacheError |
1477 NetworkError::InvalidPort |
1478 NetworkError::LocalDirectoryError |
1479 NetworkError::PartialResponseToNonRangeRequestError |
1480 NetworkError::ProtocolHandlerSubstitutionError |
1481 NetworkError::DecompressionError => {
1482 let page = resources::read_string(Resource::NetErrorHTML);
1483 page.replace("${reason}", &format!("{:?}", error))
1484 },
1485 NetworkError::LoadCancelled => {
1486 return;
1488 },
1489 };
1490 self.load_inline_unknown_content(cx, &parser, page);
1491 }
1492 }
1493
1494 fn process_response_chunk(&mut self, cx: &mut JSContext, _: RequestId, payload: Vec<u8>) {
1495 if self.is_synthesized_document {
1496 return;
1497 }
1498 let Some(parser) = self.parser.as_ref().map(|p| p.root()) else {
1499 return;
1500 };
1501 if parser.aborted.get() {
1502 return;
1503 }
1504 if !self.has_loaded_document {
1505 self.navigation_params
1507 .resource_header
1508 .extend_from_slice(&payload);
1509 if self.navigation_params.resource_header.len() >= 1445 {
1511 self.load_document(cx);
1512 }
1513 } else {
1514 parser.parse_bytes_chunk(cx, payload);
1515 }
1516 }
1517
1518 fn process_response_eof(
1522 mut self,
1523 cx: &mut JSContext,
1524 _: RequestId,
1525 status: Result<(), NetworkError>,
1526 timing: ResourceFetchTiming,
1527 ) {
1528 let parser = match self.parser.as_ref() {
1529 Some(parser) => parser.root(),
1530 None => return,
1531 };
1532 if parser.aborted.get() || self.is_synthesized_document {
1533 return;
1534 }
1535
1536 if let Err(error) = &status {
1537 debug!("Failed to load page URL {}, error: {error:?}", self.url);
1539 }
1540
1541 if !self.has_loaded_document {
1545 self.load_document(cx);
1546 }
1547
1548 let mut realm = enter_auto_realm(cx, &*parser);
1549 let cx = &mut realm;
1550
1551 if status.is_ok() {
1552 parser.document.set_resource_fetch_timing(timing);
1553 }
1554
1555 parser.last_chunk_received.set(true);
1556 if !parser.suspended.get() {
1557 parser.parse_sync(cx);
1558 }
1559
1560 if let Some(pushed_index) = self.pushed_entry_index {
1562 let document = &parser.document;
1563 let performance_entry =
1564 PerformanceNavigationTiming::new(&document.global(), document, CanGc::from_cx(cx));
1565 document
1566 .global()
1567 .performance()
1568 .update_entry(pushed_index, performance_entry.upcast::<PerformanceEntry>());
1569 }
1570 }
1571
1572 fn process_csp_violations(&mut self, _: RequestId, _: Vec<Violation>) {
1573 unreachable!("Script_thread should handle reporting violations for parser contexts");
1574 }
1575}
1576
1577pub(crate) struct FragmentContext<'a> {
1578 pub(crate) context_elem: &'a Node,
1579 pub(crate) form_elem: Option<&'a Node>,
1580 pub(crate) context_element_allows_scripting: bool,
1581}
1582
1583#[cfg_attr(crown, expect(crown::unrooted_must_root))]
1584fn insert(
1585 cx: &mut JSContext,
1586 parent: &Node,
1587 reference_child: Option<&Node>,
1588 child: NodeOrText<Dom<Node>>,
1589 parsing_algorithm: ParsingAlgorithm,
1590 custom_element_reaction_stack: &CustomElementReactionStack,
1591) {
1592 match child {
1593 NodeOrText::AppendNode(n) => {
1594 let element_in_non_fragment =
1598 parsing_algorithm != ParsingAlgorithm::Fragment && n.is::<Element>();
1599 if element_in_non_fragment {
1600 custom_element_reaction_stack.push_new_element_queue();
1601 }
1602 parent.InsertBefore(cx, &n, reference_child).unwrap();
1603 if element_in_non_fragment {
1604 custom_element_reaction_stack.pop_current_element_queue(cx);
1605 }
1606 },
1607 NodeOrText::AppendText(t) => {
1608 let text = reference_child
1610 .and_then(Node::GetPreviousSibling)
1611 .or_else(|| parent.GetLastChild())
1612 .and_then(DomRoot::downcast::<Text>);
1613
1614 if let Some(text) = text {
1615 text.upcast::<CharacterData>().append_data(cx, &t);
1616 } else {
1617 let text = Text::new(cx, String::from(t).into(), &parent.owner_doc());
1618 parent
1619 .InsertBefore(cx, text.upcast(), reference_child)
1620 .unwrap();
1621 }
1622 },
1623 }
1624}
1625
1626#[derive(JSTraceable, MallocSizeOf)]
1627#[cfg_attr(crown, crown::unrooted_must_root_lint::must_root)]
1628pub(crate) struct Sink {
1629 #[no_trace]
1630 base_url: ServoUrl,
1631 document: Dom<Document>,
1632 current_line: Cell<u64>,
1633 script: MutNullableDom<HTMLScriptElement>,
1634 parsing_algorithm: ParsingAlgorithm,
1635 #[conditional_malloc_size_of]
1636 custom_element_reaction_stack: Rc<CustomElementReactionStack>,
1637}
1638
1639impl Sink {
1640 fn same_tree(&self, x: &Dom<Node>, y: &Dom<Node>) -> bool {
1641 let x = x.downcast::<Element>().expect("Element node expected");
1642 let y = y.downcast::<Element>().expect("Element node expected");
1643
1644 x.is_in_same_home_subtree(y)
1645 }
1646
1647 fn has_parent_node(&self, node: &Dom<Node>) -> bool {
1648 node.GetParentNode().is_some()
1649 }
1650}
1651
1652impl TreeSink for Sink {
1653 type Output = Self;
1654
1655 #[cfg_attr(crown, expect(crown::unrooted_must_root))]
1656 fn finish(self) -> Self {
1657 self
1658 }
1659
1660 type Handle = Dom<Node>;
1661 type ElemName<'a>
1662 = ExpandedName<'a>
1663 where
1664 Self: 'a;
1665
1666 fn get_document(&self) -> Dom<Node> {
1667 Dom::from_ref(self.document.upcast())
1668 }
1669
1670 #[expect(unsafe_code)]
1671 fn get_template_contents(&self, target: &Dom<Node>) -> Dom<Node> {
1672 let mut cx = unsafe { temp_cx() };
1674 let cx = &mut cx;
1675 let template = target
1676 .downcast::<HTMLTemplateElement>()
1677 .expect("tried to get template contents of non-HTMLTemplateElement in HTML parsing");
1678 Dom::from_ref(template.Content(cx).upcast())
1679 }
1680
1681 fn same_node(&self, x: &Dom<Node>, y: &Dom<Node>) -> bool {
1682 x == y
1683 }
1684
1685 fn elem_name<'a>(&self, target: &'a Dom<Node>) -> ExpandedName<'a> {
1686 let elem = target
1687 .downcast::<Element>()
1688 .expect("tried to get name of non-Element in HTML parsing");
1689 ExpandedName {
1690 ns: elem.namespace(),
1691 local: elem.local_name(),
1692 }
1693 }
1694
1695 #[expect(unsafe_code)]
1696 fn create_element(
1697 &self,
1698 name: QualName,
1699 attrs: Vec<Attribute>,
1700 flags: ElementFlags,
1701 ) -> Dom<Node> {
1702 let mut cx = unsafe { temp_cx() };
1704 let cx = &mut cx;
1705 let attrs = attrs
1706 .into_iter()
1707 .map(|attr| ElementAttribute::new(attr.name, DOMString::from(String::from(attr.value))))
1708 .collect();
1709 let parsing_algorithm = if flags.template {
1710 ParsingAlgorithm::Fragment
1711 } else {
1712 self.parsing_algorithm
1713 };
1714 let element = create_element_for_token(
1715 cx,
1716 name,
1717 attrs,
1718 &self.document,
1719 ElementCreator::ParserCreated(self.current_line.get()),
1720 parsing_algorithm,
1721 &self.custom_element_reaction_stack,
1722 flags.had_duplicate_attributes,
1723 );
1724 Dom::from_ref(element.upcast())
1725 }
1726
1727 #[expect(unsafe_code)]
1728 fn create_comment(&self, text: StrTendril) -> Dom<Node> {
1729 let mut cx = unsafe { temp_cx() };
1731 let cx = &mut cx;
1732 let comment = Comment::new(
1733 cx,
1734 DOMString::from(String::from(text)),
1735 &self.document,
1736 None,
1737 );
1738 Dom::from_ref(comment.upcast())
1739 }
1740
1741 #[expect(unsafe_code)]
1742 fn create_pi(&self, target: StrTendril, data: StrTendril) -> Dom<Node> {
1743 let mut cx = unsafe { temp_cx() };
1745 let cx = &mut cx;
1746 let doc = &*self.document;
1747 let pi = ProcessingInstruction::new(
1748 cx,
1749 DOMString::from(String::from(target)),
1750 DOMString::from(String::from(data)),
1751 doc,
1752 );
1753 Dom::from_ref(pi.upcast())
1754 }
1755
1756 #[expect(unsafe_code)]
1757 fn associate_with_form(
1758 &self,
1759 target: &Dom<Node>,
1760 form: &Dom<Node>,
1761 nodes: (&Dom<Node>, Option<&Dom<Node>>),
1762 ) {
1763 let mut cx = unsafe { temp_cx() };
1765 let cx = &mut cx;
1766 let (element, prev_element) = nodes;
1767 let tree_node = prev_element.map_or(element, |prev| {
1768 if self.has_parent_node(element) {
1769 element
1770 } else {
1771 prev
1772 }
1773 });
1774 if !self.same_tree(tree_node, form) {
1775 return;
1776 }
1777
1778 let node = target;
1779 let form = DomRoot::downcast::<HTMLFormElement>(DomRoot::from_ref(&**form))
1780 .expect("Owner must be a form element");
1781
1782 let elem = node.downcast::<Element>();
1783 let control = elem.and_then(|e| e.as_maybe_form_control());
1784
1785 if let Some(control) = control {
1786 control.set_form_owner_from_parser(cx, &form);
1787 }
1788 }
1789
1790 #[expect(unsafe_code)]
1791 #[cfg_attr(crown, expect(crown::unrooted_must_root))]
1792 fn append_before_sibling(&self, sibling: &Dom<Node>, new_node: NodeOrText<Dom<Node>>) {
1793 let mut cx = unsafe { temp_cx() };
1795 let cx = &mut cx;
1796
1797 let parent = sibling
1798 .GetParentNode()
1799 .expect("append_before_sibling called on node without parent");
1800
1801 insert(
1802 cx,
1803 &parent,
1804 Some(sibling),
1805 new_node,
1806 self.parsing_algorithm,
1807 &self.custom_element_reaction_stack,
1808 );
1809 }
1810
1811 fn parse_error(&self, msg: Cow<'static, str>) {
1812 debug!("Parse error: {}", msg);
1813 }
1814
1815 fn set_quirks_mode(&self, mode: QuirksMode) {
1816 let mode = match mode {
1817 QuirksMode::Quirks => ServoQuirksMode::Quirks,
1818 QuirksMode::LimitedQuirks => ServoQuirksMode::LimitedQuirks,
1819 QuirksMode::NoQuirks => ServoQuirksMode::NoQuirks,
1820 };
1821 self.document.set_quirks_mode(mode);
1822 }
1823
1824 #[expect(unsafe_code)]
1825 #[cfg_attr(crown, expect(crown::unrooted_must_root))]
1826 fn append(&self, parent: &Dom<Node>, child: NodeOrText<Dom<Node>>) {
1827 let mut cx = unsafe { temp_cx() };
1829 let cx = &mut cx;
1830
1831 insert(
1832 cx,
1833 parent,
1834 None,
1835 child,
1836 self.parsing_algorithm,
1837 &self.custom_element_reaction_stack,
1838 );
1839 }
1840
1841 #[cfg_attr(crown, expect(crown::unrooted_must_root))]
1842 fn append_based_on_parent_node(
1843 &self,
1844 elem: &Dom<Node>,
1845 prev_elem: &Dom<Node>,
1846 child: NodeOrText<Dom<Node>>,
1847 ) {
1848 if self.has_parent_node(elem) {
1849 self.append_before_sibling(elem, child);
1850 } else {
1851 self.append(prev_elem, child);
1852 }
1853 }
1854
1855 #[expect(unsafe_code)]
1856 fn append_doctype_to_document(
1857 &self,
1858 name: StrTendril,
1859 public_id: StrTendril,
1860 system_id: StrTendril,
1861 ) {
1862 let mut cx = unsafe { temp_cx() };
1864 let cx = &mut cx;
1865
1866 let doc = &*self.document;
1867 let doctype = DocumentType::new(
1868 cx,
1869 DOMString::from(String::from(name)),
1870 Some(DOMString::from(String::from(public_id))),
1871 Some(DOMString::from(String::from(system_id))),
1872 doc,
1873 );
1874 doc.upcast::<Node>()
1875 .AppendChild(cx, doctype.upcast())
1876 .expect("Appending failed");
1877 }
1878
1879 #[expect(unsafe_code)]
1880 fn add_attrs_if_missing(&self, target: &Dom<Node>, attrs: Vec<Attribute>) {
1881 let mut cx = unsafe { temp_cx() };
1883 let cx = &mut cx;
1884
1885 let elem = target
1886 .downcast::<Element>()
1887 .expect("tried to set attrs on non-Element in HTML parsing");
1888 for attr in attrs {
1889 elem.set_attribute_from_parser(
1890 cx,
1891 attr.name,
1892 DOMString::from(String::from(attr.value)),
1893 None,
1894 );
1895 }
1896 }
1897
1898 #[expect(unsafe_code)]
1899 fn remove_from_parent(&self, target: &Dom<Node>) {
1900 let mut cx = unsafe { temp_cx() };
1902 let cx = &mut cx;
1903
1904 if let Some(ref parent) = target.GetParentNode() {
1905 parent.RemoveChild(cx, target).unwrap();
1906 }
1907 }
1908
1909 fn mark_script_already_started(&self, node: &Dom<Node>) {
1910 let script = node.downcast::<HTMLScriptElement>();
1911 if let Some(script) = script {
1912 script.set_already_started(true)
1913 }
1914 }
1915
1916 #[expect(unsafe_code)]
1917 fn reparent_children(&self, node: &Dom<Node>, new_parent: &Dom<Node>) {
1918 let mut cx = unsafe { temp_cx() };
1920 let cx = &mut cx;
1921
1922 while let Some(ref child) = node.GetFirstChild() {
1923 new_parent.AppendChild(cx, child).unwrap();
1924 }
1925 }
1926
1927 fn is_mathml_annotation_xml_integration_point(&self, handle: &Dom<Node>) -> bool {
1930 let elem = handle.downcast::<Element>().unwrap();
1931 elem.get_attribute_string_value(&local_name!("encoding"))
1932 .is_some_and(|value| {
1933 value.eq_ignore_ascii_case("text/html") ||
1934 value.eq_ignore_ascii_case("application/xhtml+xml")
1935 })
1936 }
1937
1938 fn set_current_line(&self, line_number: u64) {
1939 self.current_line.set(line_number);
1940 }
1941
1942 #[expect(unsafe_code)]
1943 fn pop(&self, node: &Dom<Node>) {
1944 let mut cx = unsafe { temp_cx() };
1946 let cx = &mut cx;
1947
1948 let node = DomRoot::from_ref(&**node);
1949 vtable_for(&node).pop(cx);
1950 }
1951
1952 fn allow_declarative_shadow_roots(&self, intended_parent: &Dom<Node>) -> bool {
1953 intended_parent.owner_doc().allow_declarative_shadow_roots()
1954 }
1955
1956 #[expect(unsafe_code)]
1960 fn attach_declarative_shadow(
1961 &self,
1962 host: &Dom<Node>,
1963 template: &Dom<Node>,
1964 attributes: &[Attribute],
1965 ) -> bool {
1966 let mut cx = unsafe { temp_cx() };
1968 let cx = &mut cx;
1969
1970 attach_declarative_shadow_inner(cx, host, template, attributes)
1971 }
1972
1973 #[expect(unsafe_code)]
1974 fn maybe_clone_an_option_into_selectedcontent(&self, option: &Self::Handle) {
1975 let mut cx = unsafe { temp_cx() };
1977 let cx = &mut cx;
1978
1979 let Some(option) = option.downcast::<HTMLOptionElement>() else {
1980 if cfg!(debug_assertions) {
1981 unreachable!();
1982 }
1983 log::error!(
1984 "Received non-option element in maybe_clone_an_option_into_selectedcontent"
1985 );
1986 return;
1987 };
1988
1989 option.maybe_clone_an_option_into_selectedcontent(cx)
1990 }
1991}
1992
1993#[expect(clippy::too_many_arguments)]
1995fn create_element_for_token(
1996 cx: &mut JSContext,
1997 name: QualName,
1998 attrs: Vec<ElementAttribute>,
1999 document: &Document,
2000 creator: ElementCreator,
2001 parsing_algorithm: ParsingAlgorithm,
2002 custom_element_reaction_stack: &CustomElementReactionStack,
2003 had_duplicate_attributes: bool,
2004) -> DomRoot<Element> {
2005 let is = attrs
2023 .iter()
2024 .find(|attr| attr.name.local.eq_str_ignore_ascii_case("is"))
2025 .map(|attr| LocalName::from(&attr.value));
2026
2027 let definition = document.lookup_custom_element_definition(&name.ns, &name.local, is.as_ref());
2033
2034 let will_execute_script =
2037 definition.is_some() && parsing_algorithm != ParsingAlgorithm::Fragment;
2038
2039 if will_execute_script {
2041 document.increment_throw_on_dynamic_markup_insertion_counter();
2043 if is_execution_stack_empty() {
2046 document.window().perform_a_microtask_checkpoint(cx);
2047 }
2048 custom_element_reaction_stack.push_new_element_queue()
2051 }
2052
2053 let creation_mode = if will_execute_script {
2056 CustomElementCreationMode::Synchronous
2057 } else {
2058 CustomElementCreationMode::Asynchronous
2059 };
2060 let element = Element::create(cx, name, is, document, creator, creation_mode, None);
2061
2062 for attr in attrs {
2064 element.set_attribute_from_parser(cx, attr.name, attr.value, None);
2065 }
2066
2067 if had_duplicate_attributes {
2070 element.set_had_duplicate_attributes();
2071 }
2072
2073 if will_execute_script {
2075 custom_element_reaction_stack.pop_current_element_queue(cx);
2080 document.decrement_throw_on_dynamic_markup_insertion_counter();
2082 }
2083
2084 if let Some(html_element) = element.downcast::<HTMLElement>() &&
2094 element.is_resettable() &&
2095 !html_element.is_form_associated_custom_element()
2096 {
2097 element.reset(cx);
2098 }
2099
2100 element
2110}
2111
2112fn attach_declarative_shadow_inner(
2113 cx: &mut JSContext,
2114 host: &Node,
2115 template: &Node,
2116 attributes: &[Attribute],
2117) -> bool {
2118 let host_element = host.downcast::<Element>().unwrap();
2119
2120 if host_element.shadow_root().is_some() {
2121 return false;
2122 }
2123
2124 let template_element = template.downcast::<HTMLTemplateElement>().unwrap();
2125
2126 let mut shadow_root_mode = ShadowRootMode::Open;
2136 let mut slot_assignment_mode = SlotAssignmentMode::Named;
2137 let mut clonable = false;
2138 let mut delegatesfocus = false;
2139 let mut serializable = false;
2140
2141 attributes
2142 .iter()
2143 .for_each(|attr: &Attribute| match attr.name.local {
2144 local_name!("shadowrootmode") => {
2145 if attr.value.eq_ignore_ascii_case("open") {
2146 shadow_root_mode = ShadowRootMode::Open;
2147 } else if attr.value.eq_ignore_ascii_case("closed") {
2148 shadow_root_mode = ShadowRootMode::Closed;
2149 } else {
2150 unreachable!("shadowrootmode value is not open nor closed");
2151 }
2152 },
2153 local_name!("shadowrootclonable") => {
2154 clonable = true;
2155 },
2156 local_name!("shadowrootdelegatesfocus") => {
2157 delegatesfocus = true;
2158 },
2159 local_name!("shadowrootserializable") => {
2160 serializable = true;
2161 },
2162 local_name!("shadowrootslotassignment") => {
2163 if attr.value.eq_ignore_ascii_case("manual") {
2164 slot_assignment_mode = SlotAssignmentMode::Manual;
2165 }
2166 },
2167 _ => {},
2168 });
2169
2170 match host_element.attach_shadow(
2173 cx,
2174 IsUserAgentWidget::No,
2175 shadow_root_mode,
2176 clonable,
2177 serializable,
2178 delegatesfocus,
2179 slot_assignment_mode,
2180 ) {
2181 Ok(shadow_root) => {
2182 shadow_root.set_declarative(true);
2184
2185 let shadow = shadow_root.upcast::<DocumentFragment>();
2187 template_element.set_contents(Some(shadow));
2188
2189 shadow_root.set_available_to_element_internals(true);
2191
2192 true
2193 },
2194 Err(_) => false,
2195 }
2196}