mirror of
https://github.com/servo/servo.git
synced 2025-08-03 20:50:07 +01:00
Reorganise ServoParser
Free-standing functions parse_html and friends are now static methods on ServoParser, and the HTML and XML tokenizers have been moved to private submodules.
This commit is contained in:
parent
57c4db7c67
commit
15e8e92540
8 changed files with 291 additions and 280 deletions
|
@ -46,6 +46,7 @@ use euclid::{Matrix2D, Matrix4D, Point2D};
|
||||||
use euclid::length::Length as EuclidLength;
|
use euclid::length::Length as EuclidLength;
|
||||||
use euclid::rect::Rect;
|
use euclid::rect::Rect;
|
||||||
use euclid::size::Size2D;
|
use euclid::size::Size2D;
|
||||||
|
use html5ever::tokenizer::buffer_queue::BufferQueue;
|
||||||
use html5ever::tree_builder::QuirksMode;
|
use html5ever::tree_builder::QuirksMode;
|
||||||
use html5ever_atoms::{Prefix, LocalName, Namespace, QualName};
|
use html5ever_atoms::{Prefix, LocalName, Namespace, QualName};
|
||||||
use hyper::header::Headers;
|
use hyper::header::Headers;
|
||||||
|
@ -322,7 +323,7 @@ no_jsmanaged_fields!(HashSet<T>);
|
||||||
no_jsmanaged_fields!(FrameId, FrameType, WindowSizeData, WindowSizeType, PipelineId);
|
no_jsmanaged_fields!(FrameId, FrameType, WindowSizeData, WindowSizeType, PipelineId);
|
||||||
no_jsmanaged_fields!(TimerEventId, TimerSource);
|
no_jsmanaged_fields!(TimerEventId, TimerSource);
|
||||||
no_jsmanaged_fields!(WorkerId);
|
no_jsmanaged_fields!(WorkerId);
|
||||||
no_jsmanaged_fields!(QuirksMode);
|
no_jsmanaged_fields!(BufferQueue, QuirksMode);
|
||||||
no_jsmanaged_fields!(Runtime);
|
no_jsmanaged_fields!(Runtime);
|
||||||
no_jsmanaged_fields!(Headers, Method);
|
no_jsmanaged_fields!(Headers, Method);
|
||||||
no_jsmanaged_fields!(WindowProxyHandler);
|
no_jsmanaged_fields!(WindowProxyHandler);
|
||||||
|
|
|
@ -18,8 +18,7 @@ use dom::bindings::str::DOMString;
|
||||||
use dom::document::{Document, IsHTMLDocument};
|
use dom::document::{Document, IsHTMLDocument};
|
||||||
use dom::document::DocumentSource;
|
use dom::document::DocumentSource;
|
||||||
use dom::globalscope::GlobalScope;
|
use dom::globalscope::GlobalScope;
|
||||||
use dom::servoparser::html::{ParseContext, parse_html};
|
use dom::servoparser::ServoParser;
|
||||||
use dom::servoparser::xml::{self, parse_xml};
|
|
||||||
use dom::window::Window;
|
use dom::window::Window;
|
||||||
|
|
||||||
#[dom_struct]
|
#[dom_struct]
|
||||||
|
@ -70,7 +69,7 @@ impl DOMParserMethods for DOMParser {
|
||||||
loader,
|
loader,
|
||||||
None,
|
None,
|
||||||
None);
|
None);
|
||||||
parse_html(&document, s, url, ParseContext::Owner(None));
|
ServoParser::parse_html_document(&document, s, url, None);
|
||||||
document.set_ready_state(DocumentReadyState::Complete);
|
document.set_ready_state(DocumentReadyState::Complete);
|
||||||
Ok(document)
|
Ok(document)
|
||||||
}
|
}
|
||||||
|
@ -86,7 +85,7 @@ impl DOMParserMethods for DOMParser {
|
||||||
loader,
|
loader,
|
||||||
None,
|
None,
|
||||||
None);
|
None);
|
||||||
parse_xml(&document, s, url, xml::ParseContext::Owner(None));
|
ServoParser::parse_xml_document(&document, s, url, None);
|
||||||
Ok(document)
|
Ok(document)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -47,7 +47,7 @@ use dom::htmltextareaelement::{HTMLTextAreaElement, LayoutHTMLTextAreaElementHel
|
||||||
use dom::nodelist::NodeList;
|
use dom::nodelist::NodeList;
|
||||||
use dom::processinginstruction::ProcessingInstruction;
|
use dom::processinginstruction::ProcessingInstruction;
|
||||||
use dom::range::WeakRangeVec;
|
use dom::range::WeakRangeVec;
|
||||||
use dom::servoparser::html::parse_html_fragment;
|
use dom::servoparser::ServoParser;
|
||||||
use dom::svgsvgelement::{SVGSVGElement, LayoutSVGSVGElementHelpers};
|
use dom::svgsvgelement::{SVGSVGElement, LayoutSVGSVGElementHelpers};
|
||||||
use dom::text::Text;
|
use dom::text::Text;
|
||||||
use dom::virtualmethods::{VirtualMethods, vtable_for};
|
use dom::virtualmethods::{VirtualMethods, vtable_for};
|
||||||
|
@ -833,7 +833,7 @@ impl Node {
|
||||||
let context_document = document_from_node(self);
|
let context_document = document_from_node(self);
|
||||||
let fragment = DocumentFragment::new(&context_document);
|
let fragment = DocumentFragment::new(&context_document);
|
||||||
if context_document.is_html_document() {
|
if context_document.is_html_document() {
|
||||||
parse_html_fragment(self.upcast(), markup, fragment.upcast());
|
ServoParser::parse_html_fragment(self.upcast(), markup, fragment.upcast());
|
||||||
} else {
|
} else {
|
||||||
// FIXME: XML case
|
// FIXME: XML case
|
||||||
unimplemented!();
|
unimplemented!();
|
||||||
|
|
|
@ -4,23 +4,19 @@
|
||||||
|
|
||||||
#![allow(unrooted_must_root)]
|
#![allow(unrooted_must_root)]
|
||||||
|
|
||||||
use document_loader::DocumentLoader;
|
|
||||||
use dom::bindings::codegen::Bindings::DocumentBinding::DocumentMethods;
|
|
||||||
use dom::bindings::codegen::Bindings::HTMLTemplateElementBinding::HTMLTemplateElementMethods;
|
use dom::bindings::codegen::Bindings::HTMLTemplateElementBinding::HTMLTemplateElementMethods;
|
||||||
use dom::bindings::codegen::Bindings::NodeBinding::NodeMethods;
|
use dom::bindings::codegen::Bindings::NodeBinding::NodeMethods;
|
||||||
use dom::bindings::inheritance::{Castable, CharacterDataTypeId, NodeTypeId};
|
use dom::bindings::inheritance::{Castable, CharacterDataTypeId, NodeTypeId};
|
||||||
use dom::bindings::js::{JS, RootedReference};
|
use dom::bindings::js::{JS, Root};
|
||||||
use dom::bindings::str::DOMString;
|
use dom::bindings::str::DOMString;
|
||||||
|
use dom::bindings::trace::JSTraceable;
|
||||||
use dom::characterdata::CharacterData;
|
use dom::characterdata::CharacterData;
|
||||||
use dom::comment::Comment;
|
use dom::comment::Comment;
|
||||||
use dom::document::{DocumentSource, IsHTMLDocument};
|
|
||||||
use dom::document::Document;
|
use dom::document::Document;
|
||||||
use dom::documenttype::DocumentType;
|
use dom::documenttype::DocumentType;
|
||||||
use dom::element::{Element, ElementCreator};
|
use dom::element::{Element, ElementCreator};
|
||||||
use dom::htmlformelement::HTMLFormElement;
|
|
||||||
use dom::htmlscriptelement::HTMLScriptElement;
|
use dom::htmlscriptelement::HTMLScriptElement;
|
||||||
use dom::htmltemplateelement::HTMLTemplateElement;
|
use dom::htmltemplateelement::HTMLTemplateElement;
|
||||||
use dom::node::{document_from_node, window_from_node};
|
|
||||||
use dom::node::Node;
|
use dom::node::Node;
|
||||||
use dom::processinginstruction::ProcessingInstruction;
|
use dom::processinginstruction::ProcessingInstruction;
|
||||||
use dom::text::Text;
|
use dom::text::Text;
|
||||||
|
@ -29,28 +25,107 @@ use html5ever::serialize::{AttrRef, Serializable, Serializer};
|
||||||
use html5ever::serialize::TraversalScope;
|
use html5ever::serialize::TraversalScope;
|
||||||
use html5ever::serialize::TraversalScope::{ChildrenOnly, IncludeNode};
|
use html5ever::serialize::TraversalScope::{ChildrenOnly, IncludeNode};
|
||||||
use html5ever::tendril::StrTendril;
|
use html5ever::tendril::StrTendril;
|
||||||
use html5ever::tokenizer::{Tokenizer as H5ETokenizer, TokenizerOpts};
|
use html5ever::tokenizer::{Tokenizer as HtmlTokenizer, TokenizerOpts, TokenizerResult};
|
||||||
|
use html5ever::tokenizer::buffer_queue::BufferQueue;
|
||||||
use html5ever::tree_builder::{NodeOrText, QuirksMode};
|
use html5ever::tree_builder::{NodeOrText, QuirksMode};
|
||||||
use html5ever::tree_builder::{TreeBuilder, TreeBuilderOpts, TreeSink};
|
use html5ever::tree_builder::{Tracer as HtmlTracer, TreeBuilder, TreeBuilderOpts, TreeSink};
|
||||||
use html5ever_atoms::QualName;
|
use html5ever_atoms::QualName;
|
||||||
use msg::constellation_msg::PipelineId;
|
use js::jsapi::JSTracer;
|
||||||
use std::borrow::Cow;
|
use std::borrow::Cow;
|
||||||
use std::io::{self, Write};
|
use std::io::{self, Write};
|
||||||
use super::{HtmlTokenizer, LastChunkState, ServoParser, Sink, Tokenizer};
|
use super::{FragmentContext, Sink};
|
||||||
use url::Url;
|
use url::Url;
|
||||||
|
|
||||||
fn insert(parent: &Node, reference_child: Option<&Node>, child: NodeOrText<JS<Node>>) {
|
#[derive(HeapSizeOf, JSTraceable)]
|
||||||
match child {
|
#[must_root]
|
||||||
NodeOrText::AppendNode(n) => {
|
pub struct Tokenizer {
|
||||||
assert!(parent.InsertBefore(&n, reference_child).is_ok());
|
#[ignore_heap_size_of = "Defined in html5ever"]
|
||||||
},
|
inner: HtmlTokenizer<TreeBuilder<JS<Node>, Sink>>,
|
||||||
NodeOrText::AppendText(t) => {
|
#[ignore_heap_size_of = "Defined in html5ever"]
|
||||||
// FIXME(ajeffrey): convert directly from tendrils to DOMStrings
|
input_buffer: BufferQueue,
|
||||||
let s: String = t.into();
|
}
|
||||||
let text = Text::new(DOMString::from(s), &parent.owner_doc());
|
|
||||||
assert!(parent.InsertBefore(text.upcast(), reference_child).is_ok());
|
impl Tokenizer {
|
||||||
|
pub fn new(
|
||||||
|
document: &Document,
|
||||||
|
url: Url,
|
||||||
|
fragment_context: Option<FragmentContext>)
|
||||||
|
-> Self {
|
||||||
|
let sink = Sink {
|
||||||
|
base_url: url,
|
||||||
|
document: JS::from_ref(document),
|
||||||
|
};
|
||||||
|
|
||||||
|
let options = TreeBuilderOpts {
|
||||||
|
ignore_missing_rules: true,
|
||||||
|
.. Default::default()
|
||||||
|
};
|
||||||
|
|
||||||
|
let inner = if let Some(fc) = fragment_context {
|
||||||
|
let tb = TreeBuilder::new_for_fragment(
|
||||||
|
sink,
|
||||||
|
JS::from_ref(fc.context_elem),
|
||||||
|
fc.form_elem.map(|n| JS::from_ref(n)),
|
||||||
|
options);
|
||||||
|
|
||||||
|
let tok_options = TokenizerOpts {
|
||||||
|
initial_state: Some(tb.tokenizer_state_for_context_elem()),
|
||||||
|
.. Default::default()
|
||||||
|
};
|
||||||
|
|
||||||
|
HtmlTokenizer::new(tb, tok_options)
|
||||||
|
} else {
|
||||||
|
HtmlTokenizer::new(TreeBuilder::new(sink, options), Default::default())
|
||||||
|
};
|
||||||
|
|
||||||
|
Tokenizer {
|
||||||
|
inner: inner,
|
||||||
|
input_buffer: BufferQueue::new(),
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
pub fn feed(&mut self, input: String) {
|
||||||
|
self.input_buffer.push_back(input.into());
|
||||||
|
self.run();
|
||||||
|
}
|
||||||
|
|
||||||
|
#[allow(unrooted_must_root)]
|
||||||
|
pub fn run(&mut self) {
|
||||||
|
while let TokenizerResult::Script(script) = self.inner.feed(&mut self.input_buffer) {
|
||||||
|
let script = Root::from_ref(script.downcast::<HTMLScriptElement>().unwrap());
|
||||||
|
if !script.prepare() {
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn end(&mut self) {
|
||||||
|
assert!(self.input_buffer.is_empty());
|
||||||
|
self.inner.end();
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn set_plaintext_state(&mut self) {
|
||||||
|
self.inner.set_plaintext_state();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl JSTraceable for HtmlTokenizer<TreeBuilder<JS<Node>, Sink>> {
|
||||||
|
fn trace(&self, trc: *mut JSTracer) {
|
||||||
|
struct Tracer(*mut JSTracer);
|
||||||
|
let tracer = Tracer(trc);
|
||||||
|
|
||||||
|
impl HtmlTracer for Tracer {
|
||||||
|
type Handle = JS<Node>;
|
||||||
|
#[allow(unrooted_must_root)]
|
||||||
|
fn trace_handle(&self, node: &JS<Node>) {
|
||||||
|
node.trace(self.0);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
let tree_builder = self.sink();
|
||||||
|
tree_builder.trace_handles(&tracer);
|
||||||
|
tree_builder.sink().trace(trc);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
impl<'a> TreeSink for Sink {
|
impl<'a> TreeSink for Sink {
|
||||||
|
@ -161,6 +236,20 @@ impl<'a> TreeSink for Sink {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
fn insert(parent: &Node, reference_child: Option<&Node>, child: NodeOrText<JS<Node>>) {
|
||||||
|
match child {
|
||||||
|
NodeOrText::AppendNode(n) => {
|
||||||
|
assert!(parent.InsertBefore(&n, reference_child).is_ok());
|
||||||
|
},
|
||||||
|
NodeOrText::AppendText(t) => {
|
||||||
|
// FIXME(ajeffrey): convert directly from tendrils to DOMStrings
|
||||||
|
let s: String = t.into();
|
||||||
|
let text = Text::new(DOMString::from(s), &parent.owner_doc());
|
||||||
|
assert!(parent.InsertBefore(text.upcast(), reference_child).is_ok());
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
impl<'a> Serializable for &'a Node {
|
impl<'a> Serializable for &'a Node {
|
||||||
fn serialize<'wr, Wr: Write>(&self, serializer: &mut Serializer<'wr, Wr>,
|
fn serialize<'wr, Wr: Write>(&self, serializer: &mut Serializer<'wr, Wr>,
|
||||||
traversal_scope: TraversalScope) -> io::Result<()> {
|
traversal_scope: TraversalScope) -> io::Result<()> {
|
||||||
|
@ -237,100 +326,3 @@ impl<'a> Serializable for &'a Node {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/// FragmentContext is used only to pass this group of related values
|
|
||||||
/// into functions.
|
|
||||||
#[derive(Copy, Clone)]
|
|
||||||
pub struct FragmentContext<'a> {
|
|
||||||
pub context_elem: &'a Node,
|
|
||||||
pub form_elem: Option<&'a Node>,
|
|
||||||
}
|
|
||||||
|
|
||||||
pub enum ParseContext<'a> {
|
|
||||||
Fragment(FragmentContext<'a>),
|
|
||||||
Owner(Option<PipelineId>),
|
|
||||||
}
|
|
||||||
|
|
||||||
pub fn parse_html(document: &Document,
|
|
||||||
input: DOMString,
|
|
||||||
url: Url,
|
|
||||||
context: ParseContext) {
|
|
||||||
let sink = Sink {
|
|
||||||
base_url: url,
|
|
||||||
document: JS::from_ref(document),
|
|
||||||
};
|
|
||||||
|
|
||||||
let options = TreeBuilderOpts {
|
|
||||||
ignore_missing_rules: true,
|
|
||||||
.. Default::default()
|
|
||||||
};
|
|
||||||
|
|
||||||
let parser = match context {
|
|
||||||
ParseContext::Owner(owner) => {
|
|
||||||
let tb = TreeBuilder::new(sink, options);
|
|
||||||
let tok = H5ETokenizer::new(tb, Default::default());
|
|
||||||
|
|
||||||
ServoParser::new(
|
|
||||||
document,
|
|
||||||
owner,
|
|
||||||
Tokenizer::HTML(HtmlTokenizer::new(tok)),
|
|
||||||
LastChunkState::NotReceived)
|
|
||||||
},
|
|
||||||
ParseContext::Fragment(fc) => {
|
|
||||||
let tb = TreeBuilder::new_for_fragment(
|
|
||||||
sink,
|
|
||||||
JS::from_ref(fc.context_elem),
|
|
||||||
fc.form_elem.map(|n| JS::from_ref(n)),
|
|
||||||
options);
|
|
||||||
|
|
||||||
let tok_options = TokenizerOpts {
|
|
||||||
initial_state: Some(tb.tokenizer_state_for_context_elem()),
|
|
||||||
.. Default::default()
|
|
||||||
};
|
|
||||||
let tok = H5ETokenizer::new(tb, tok_options);
|
|
||||||
|
|
||||||
ServoParser::new(
|
|
||||||
document,
|
|
||||||
None,
|
|
||||||
Tokenizer::HTML(HtmlTokenizer::new(tok)),
|
|
||||||
LastChunkState::Received)
|
|
||||||
}
|
|
||||||
};
|
|
||||||
parser.parse_chunk(String::from(input));
|
|
||||||
}
|
|
||||||
|
|
||||||
// https://html.spec.whatwg.org/multipage/#parsing-html-fragments
|
|
||||||
pub fn parse_html_fragment(context_node: &Node,
|
|
||||||
input: DOMString,
|
|
||||||
output: &Node) {
|
|
||||||
let window = window_from_node(context_node);
|
|
||||||
let context_document = document_from_node(context_node);
|
|
||||||
let url = context_document.url();
|
|
||||||
|
|
||||||
// Step 1.
|
|
||||||
let loader = DocumentLoader::new(&*context_document.loader());
|
|
||||||
let document = Document::new(&window, None, Some(url.clone()),
|
|
||||||
IsHTMLDocument::HTMLDocument,
|
|
||||||
None, None,
|
|
||||||
DocumentSource::FromParser,
|
|
||||||
loader,
|
|
||||||
None, None);
|
|
||||||
|
|
||||||
// Step 2.
|
|
||||||
document.set_quirks_mode(context_document.quirks_mode());
|
|
||||||
|
|
||||||
// Step 11.
|
|
||||||
let form = context_node.inclusive_ancestors()
|
|
||||||
.find(|element| element.is::<HTMLFormElement>());
|
|
||||||
let fragment_context = FragmentContext {
|
|
||||||
context_elem: context_node,
|
|
||||||
form_elem: form.r(),
|
|
||||||
};
|
|
||||||
parse_html(&document, input, url.clone(), ParseContext::Fragment(fragment_context));
|
|
||||||
|
|
||||||
// Step 14.
|
|
||||||
let root_element = document.GetDocumentElement().expect("no document element");
|
|
||||||
for child in root_element.upcast::<Node>().children() {
|
|
||||||
output.AppendChild(&child).unwrap();
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
|
@ -2,33 +2,27 @@
|
||||||
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
||||||
* file, You can obtain one at http://mozilla.org/MPL/2.0/. */
|
* file, You can obtain one at http://mozilla.org/MPL/2.0/. */
|
||||||
|
|
||||||
use document_loader::LoadType;
|
use document_loader::{DocumentLoader, LoadType};
|
||||||
use dom::bindings::cell::DOMRefCell;
|
use dom::bindings::cell::DOMRefCell;
|
||||||
use dom::bindings::codegen::Bindings::DocumentBinding::DocumentMethods;
|
use dom::bindings::codegen::Bindings::DocumentBinding::DocumentMethods;
|
||||||
use dom::bindings::codegen::Bindings::HTMLImageElementBinding::HTMLImageElementMethods;
|
use dom::bindings::codegen::Bindings::HTMLImageElementBinding::HTMLImageElementMethods;
|
||||||
use dom::bindings::codegen::Bindings::NodeBinding::NodeMethods;
|
use dom::bindings::codegen::Bindings::NodeBinding::NodeMethods;
|
||||||
use dom::bindings::codegen::Bindings::ServoParserBinding;
|
use dom::bindings::codegen::Bindings::ServoParserBinding;
|
||||||
use dom::bindings::inheritance::Castable;
|
use dom::bindings::inheritance::Castable;
|
||||||
use dom::bindings::js::{JS, Root};
|
use dom::bindings::js::{JS, Root, RootedReference};
|
||||||
use dom::bindings::refcounted::Trusted;
|
use dom::bindings::refcounted::Trusted;
|
||||||
use dom::bindings::reflector::{Reflector, reflect_dom_object};
|
use dom::bindings::reflector::{Reflector, reflect_dom_object};
|
||||||
use dom::bindings::str::DOMString;
|
use dom::bindings::str::DOMString;
|
||||||
use dom::bindings::trace::JSTraceable;
|
use dom::document::{Document, DocumentSource, IsHTMLDocument};
|
||||||
use dom::document::Document;
|
|
||||||
use dom::globalscope::GlobalScope;
|
use dom::globalscope::GlobalScope;
|
||||||
|
use dom::htmlformelement::HTMLFormElement;
|
||||||
use dom::htmlimageelement::HTMLImageElement;
|
use dom::htmlimageelement::HTMLImageElement;
|
||||||
use dom::htmlscriptelement::HTMLScriptElement;
|
use dom::node::{Node, document_from_node, window_from_node};
|
||||||
use dom::node::Node;
|
|
||||||
use encoding::all::UTF_8;
|
use encoding::all::UTF_8;
|
||||||
use encoding::types::{DecoderTrap, Encoding};
|
use encoding::types::{DecoderTrap, Encoding};
|
||||||
use html5ever::tokenizer::{Tokenizer as H5ETokenizer, TokenizerResult};
|
|
||||||
use html5ever::tokenizer::buffer_queue::BufferQueue;
|
|
||||||
use html5ever::tree_builder::Tracer as HtmlTracer;
|
|
||||||
use html5ever::tree_builder::TreeBuilder as HtmlTreeBuilder;
|
|
||||||
use hyper::header::ContentType;
|
use hyper::header::ContentType;
|
||||||
use hyper::mime::{Mime, SubLevel, TopLevel};
|
use hyper::mime::{Mime, SubLevel, TopLevel};
|
||||||
use hyper_serde::Serde;
|
use hyper_serde::Serde;
|
||||||
use js::jsapi::JSTracer;
|
|
||||||
use msg::constellation_msg::PipelineId;
|
use msg::constellation_msg::PipelineId;
|
||||||
use net_traits::{FetchMetadata, FetchResponseListener, Metadata, NetworkError};
|
use net_traits::{FetchMetadata, FetchResponseListener, Metadata, NetworkError};
|
||||||
use network_listener::PreInvoke;
|
use network_listener::PreInvoke;
|
||||||
|
@ -39,11 +33,9 @@ use std::cell::Cell;
|
||||||
use std::collections::VecDeque;
|
use std::collections::VecDeque;
|
||||||
use url::Url;
|
use url::Url;
|
||||||
use util::resource_files::read_resource_file;
|
use util::resource_files::read_resource_file;
|
||||||
use xml5ever::tokenizer::XmlTokenizer;
|
|
||||||
use xml5ever::tree_builder::{Tracer as XmlTracer, XmlTreeBuilder};
|
|
||||||
|
|
||||||
pub mod html;
|
mod html;
|
||||||
pub mod xml;
|
mod xml;
|
||||||
|
|
||||||
#[dom_struct]
|
#[dom_struct]
|
||||||
pub struct ServoParser {
|
pub struct ServoParser {
|
||||||
|
@ -70,6 +62,76 @@ enum LastChunkState {
|
||||||
}
|
}
|
||||||
|
|
||||||
impl ServoParser {
|
impl ServoParser {
|
||||||
|
pub fn parse_html_document(
|
||||||
|
document: &Document,
|
||||||
|
input: DOMString,
|
||||||
|
url: Url,
|
||||||
|
owner: Option<PipelineId>) {
|
||||||
|
let parser = ServoParser::new(
|
||||||
|
document,
|
||||||
|
owner,
|
||||||
|
Tokenizer::Html(self::html::Tokenizer::new(document, url, None)),
|
||||||
|
LastChunkState::NotReceived);
|
||||||
|
parser.parse_chunk(String::from(input));
|
||||||
|
}
|
||||||
|
|
||||||
|
// https://html.spec.whatwg.org/multipage/#parsing-html-fragments
|
||||||
|
pub fn parse_html_fragment(
|
||||||
|
context_node: &Node,
|
||||||
|
input: DOMString,
|
||||||
|
output: &Node) {
|
||||||
|
let window = window_from_node(context_node);
|
||||||
|
let context_document = document_from_node(context_node);
|
||||||
|
let url = context_document.url();
|
||||||
|
|
||||||
|
// Step 1.
|
||||||
|
let loader = DocumentLoader::new(&*context_document.loader());
|
||||||
|
let document = Document::new(&window, None, Some(url.clone()),
|
||||||
|
IsHTMLDocument::HTMLDocument,
|
||||||
|
None, None,
|
||||||
|
DocumentSource::FromParser,
|
||||||
|
loader,
|
||||||
|
None, None);
|
||||||
|
|
||||||
|
// Step 2.
|
||||||
|
document.set_quirks_mode(context_document.quirks_mode());
|
||||||
|
|
||||||
|
// Step 11.
|
||||||
|
let form = context_node.inclusive_ancestors()
|
||||||
|
.find(|element| element.is::<HTMLFormElement>());
|
||||||
|
let fragment_context = FragmentContext {
|
||||||
|
context_elem: context_node,
|
||||||
|
form_elem: form.r(),
|
||||||
|
};
|
||||||
|
|
||||||
|
let parser = ServoParser::new(
|
||||||
|
&document,
|
||||||
|
None,
|
||||||
|
Tokenizer::Html(
|
||||||
|
self::html::Tokenizer::new(&document, url.clone(), Some(fragment_context))),
|
||||||
|
LastChunkState::Received);
|
||||||
|
parser.parse_chunk(String::from(input));
|
||||||
|
|
||||||
|
// Step 14.
|
||||||
|
let root_element = document.GetDocumentElement().expect("no document element");
|
||||||
|
for child in root_element.upcast::<Node>().children() {
|
||||||
|
output.AppendChild(&child).unwrap();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn parse_xml_document(
|
||||||
|
document: &Document,
|
||||||
|
input: DOMString,
|
||||||
|
url: Url,
|
||||||
|
owner: Option<PipelineId>) {
|
||||||
|
let parser = ServoParser::new(
|
||||||
|
document,
|
||||||
|
owner,
|
||||||
|
Tokenizer::Xml(self::xml::Tokenizer::new(document, url)),
|
||||||
|
LastChunkState::NotReceived);
|
||||||
|
parser.parse_chunk(String::from(input));
|
||||||
|
}
|
||||||
|
|
||||||
#[allow(unrooted_must_root)]
|
#[allow(unrooted_must_root)]
|
||||||
fn new_inherited(
|
fn new_inherited(
|
||||||
document: &Document,
|
document: &Document,
|
||||||
|
@ -215,57 +277,11 @@ impl ServoParser {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
#[derive(HeapSizeOf)]
|
#[derive(HeapSizeOf, JSTraceable)]
|
||||||
#[must_root]
|
#[must_root]
|
||||||
enum Tokenizer {
|
enum Tokenizer {
|
||||||
HTML(HtmlTokenizer),
|
Html(self::html::Tokenizer),
|
||||||
XML(
|
Xml(self::xml::Tokenizer),
|
||||||
#[ignore_heap_size_of = "Defined in xml5ever"]
|
|
||||||
XmlTokenizer<XmlTreeBuilder<JS<Node>, Sink>>
|
|
||||||
),
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(HeapSizeOf)]
|
|
||||||
#[must_root]
|
|
||||||
struct HtmlTokenizer {
|
|
||||||
#[ignore_heap_size_of = "Defined in html5ever"]
|
|
||||||
inner: H5ETokenizer<HtmlTreeBuilder<JS<Node>, Sink>>,
|
|
||||||
#[ignore_heap_size_of = "Defined in html5ever"]
|
|
||||||
input_buffer: BufferQueue,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl HtmlTokenizer {
|
|
||||||
#[allow(unrooted_must_root)]
|
|
||||||
fn new(inner: H5ETokenizer<HtmlTreeBuilder<JS<Node>, Sink>>) -> Self {
|
|
||||||
HtmlTokenizer {
|
|
||||||
inner: inner,
|
|
||||||
input_buffer: BufferQueue::new(),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
fn feed(&mut self, input: String) {
|
|
||||||
self.input_buffer.push_back(input.into());
|
|
||||||
self.run();
|
|
||||||
}
|
|
||||||
|
|
||||||
#[allow(unrooted_must_root)]
|
|
||||||
fn run(&mut self) {
|
|
||||||
while let TokenizerResult::Script(script) = self.inner.feed(&mut self.input_buffer) {
|
|
||||||
let script = Root::from_ref(script.downcast::<HTMLScriptElement>().unwrap());
|
|
||||||
if !script.prepare() {
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
fn end(&mut self) {
|
|
||||||
assert!(self.input_buffer.is_empty());
|
|
||||||
self.inner.end();
|
|
||||||
}
|
|
||||||
|
|
||||||
fn set_plaintext_state(&mut self) {
|
|
||||||
self.inner.set_plaintext_state();
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
||||||
#[derive(JSTraceable, HeapSizeOf)]
|
#[derive(JSTraceable, HeapSizeOf)]
|
||||||
|
@ -278,70 +294,36 @@ struct Sink {
|
||||||
impl Tokenizer {
|
impl Tokenizer {
|
||||||
fn feed(&mut self, input: String) {
|
fn feed(&mut self, input: String) {
|
||||||
match *self {
|
match *self {
|
||||||
Tokenizer::HTML(ref mut tokenizer) => tokenizer.feed(input),
|
Tokenizer::Html(ref mut tokenizer) => tokenizer.feed(input),
|
||||||
Tokenizer::XML(ref mut tokenizer) => tokenizer.feed(input.into()),
|
Tokenizer::Xml(ref mut tokenizer) => tokenizer.feed(input.into()),
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
fn run(&mut self) {
|
fn run(&mut self) {
|
||||||
match *self {
|
match *self {
|
||||||
Tokenizer::HTML(ref mut tokenizer) => tokenizer.run(),
|
Tokenizer::Html(ref mut tokenizer) => tokenizer.run(),
|
||||||
Tokenizer::XML(ref mut tokenizer) => tokenizer.run(),
|
Tokenizer::Xml(ref mut tokenizer) => tokenizer.run(),
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
fn end(&mut self) {
|
fn end(&mut self) {
|
||||||
match *self {
|
match *self {
|
||||||
Tokenizer::HTML(ref mut tokenizer) => tokenizer.end(),
|
Tokenizer::Html(ref mut tokenizer) => tokenizer.end(),
|
||||||
Tokenizer::XML(ref mut tokenizer) => tokenizer.end(),
|
Tokenizer::Xml(ref mut tokenizer) => tokenizer.end(),
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
fn set_plaintext_state(&mut self) {
|
fn set_plaintext_state(&mut self) {
|
||||||
match *self {
|
match *self {
|
||||||
Tokenizer::HTML(ref mut tokenizer) => tokenizer.set_plaintext_state(),
|
Tokenizer::Html(ref mut tokenizer) => tokenizer.set_plaintext_state(),
|
||||||
Tokenizer::XML(_) => { /* todo */ },
|
Tokenizer::Xml(_) => unimplemented!(),
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
fn profiler_category(&self) -> ProfilerCategory {
|
fn profiler_category(&self) -> ProfilerCategory {
|
||||||
match *self {
|
match *self {
|
||||||
Tokenizer::HTML(_) => ProfilerCategory::ScriptParseHTML,
|
Tokenizer::Html(_) => ProfilerCategory::ScriptParseHTML,
|
||||||
Tokenizer::XML(_) => ProfilerCategory::ScriptParseXML,
|
Tokenizer::Xml(_) => ProfilerCategory::ScriptParseXML,
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl JSTraceable for Tokenizer {
|
|
||||||
fn trace(&self, trc: *mut JSTracer) {
|
|
||||||
struct Tracer(*mut JSTracer);
|
|
||||||
let tracer = Tracer(trc);
|
|
||||||
|
|
||||||
match *self {
|
|
||||||
Tokenizer::HTML(ref tokenizer) => {
|
|
||||||
impl HtmlTracer for Tracer {
|
|
||||||
type Handle = JS<Node>;
|
|
||||||
#[allow(unrooted_must_root)]
|
|
||||||
fn trace_handle(&self, node: &JS<Node>) {
|
|
||||||
node.trace(self.0);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
let tree_builder = tokenizer.inner.sink();
|
|
||||||
tree_builder.trace_handles(&tracer);
|
|
||||||
tree_builder.sink().trace(trc);
|
|
||||||
},
|
|
||||||
Tokenizer::XML(ref tokenizer) => {
|
|
||||||
impl XmlTracer for Tracer {
|
|
||||||
type Handle = JS<Node>;
|
|
||||||
#[allow(unrooted_must_root)]
|
|
||||||
fn trace_handle(&self, node: JS<Node>) {
|
|
||||||
node.trace(self.0);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
let tree_builder = tokenizer.sink();
|
|
||||||
tree_builder.trace_handles(&tracer);
|
|
||||||
tree_builder.sink().trace(trc);
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -499,3 +481,8 @@ impl FetchResponseListener for ParserContext {
|
||||||
}
|
}
|
||||||
|
|
||||||
impl PreInvoke for ParserContext {}
|
impl PreInvoke for ParserContext {}
|
||||||
|
|
||||||
|
pub struct FragmentContext<'a> {
|
||||||
|
pub context_elem: &'a Node,
|
||||||
|
pub form_elem: Option<&'a Node>,
|
||||||
|
}
|
||||||
|
|
|
@ -8,6 +8,7 @@ use dom::bindings::codegen::Bindings::NodeBinding::NodeMethods;
|
||||||
use dom::bindings::inheritance::Castable;
|
use dom::bindings::inheritance::Castable;
|
||||||
use dom::bindings::js::{JS, Root};
|
use dom::bindings::js::{JS, Root};
|
||||||
use dom::bindings::str::DOMString;
|
use dom::bindings::str::DOMString;
|
||||||
|
use dom::bindings::trace::JSTraceable;
|
||||||
use dom::comment::Comment;
|
use dom::comment::Comment;
|
||||||
use dom::document::Document;
|
use dom::document::Document;
|
||||||
use dom::documenttype::DocumentType;
|
use dom::documenttype::DocumentType;
|
||||||
|
@ -17,13 +18,68 @@ use dom::node::Node;
|
||||||
use dom::processinginstruction::ProcessingInstruction;
|
use dom::processinginstruction::ProcessingInstruction;
|
||||||
use dom::text::Text;
|
use dom::text::Text;
|
||||||
use html5ever_atoms::{Prefix, QualName};
|
use html5ever_atoms::{Prefix, QualName};
|
||||||
use msg::constellation_msg::PipelineId;
|
use js::jsapi::JSTracer;
|
||||||
use std::borrow::Cow;
|
use std::borrow::Cow;
|
||||||
use super::{LastChunkState, ServoParser, Sink, Tokenizer};
|
use super::Sink;
|
||||||
use url::Url;
|
use url::Url;
|
||||||
use xml5ever::tendril::StrTendril;
|
use xml5ever::tendril::StrTendril;
|
||||||
use xml5ever::tokenizer::{Attribute, QName, XmlTokenizer};
|
use xml5ever::tokenizer::{Attribute, QName, XmlTokenizer};
|
||||||
use xml5ever::tree_builder::{NextParserState, NodeOrText, TreeSink, XmlTreeBuilder};
|
use xml5ever::tree_builder::{NextParserState, NodeOrText};
|
||||||
|
use xml5ever::tree_builder::{Tracer as XmlTracer, TreeSink, XmlTreeBuilder};
|
||||||
|
|
||||||
|
#[derive(HeapSizeOf, JSTraceable)]
|
||||||
|
#[must_root]
|
||||||
|
pub struct Tokenizer {
|
||||||
|
#[ignore_heap_size_of = "Defined in xml5ever"]
|
||||||
|
inner: XmlTokenizer<XmlTreeBuilder<JS<Node>, Sink>>,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Tokenizer {
|
||||||
|
pub fn new(document: &Document, url: Url) -> Self {
|
||||||
|
let sink = Sink {
|
||||||
|
base_url: url,
|
||||||
|
document: JS::from_ref(document),
|
||||||
|
};
|
||||||
|
|
||||||
|
let tb = XmlTreeBuilder::new(sink);
|
||||||
|
let tok = XmlTokenizer::new(tb, Default::default());
|
||||||
|
|
||||||
|
Tokenizer {
|
||||||
|
inner: tok,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn feed(&mut self, input: String) {
|
||||||
|
self.inner.feed(input.into())
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn run(&mut self) {
|
||||||
|
self.inner.run()
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn end(&mut self) {
|
||||||
|
self.inner.end()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl JSTraceable for XmlTokenizer<XmlTreeBuilder<JS<Node>, Sink>> {
|
||||||
|
fn trace(&self, trc: *mut JSTracer) {
|
||||||
|
struct Tracer(*mut JSTracer);
|
||||||
|
let tracer = Tracer(trc);
|
||||||
|
|
||||||
|
impl XmlTracer for Tracer {
|
||||||
|
type Handle = JS<Node>;
|
||||||
|
#[allow(unrooted_must_root)]
|
||||||
|
fn trace_handle(&self, node: JS<Node>) {
|
||||||
|
node.trace(self.0);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
let tree_builder = self.sink();
|
||||||
|
tree_builder.trace_handles(&tracer);
|
||||||
|
tree_builder.sink().trace(trc);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
impl<'a> TreeSink for Sink {
|
impl<'a> TreeSink for Sink {
|
||||||
type Handle = JS<Node>;
|
type Handle = JS<Node>;
|
||||||
|
@ -119,28 +175,3 @@ impl<'a> TreeSink for Sink {
|
||||||
NextParserState::Continue
|
NextParserState::Continue
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
pub enum ParseContext {
|
|
||||||
Owner(Option<PipelineId>)
|
|
||||||
}
|
|
||||||
|
|
||||||
|
|
||||||
pub fn parse_xml(document: &Document,
|
|
||||||
input: DOMString,
|
|
||||||
url: Url,
|
|
||||||
context: ParseContext) {
|
|
||||||
let parser = match context {
|
|
||||||
ParseContext::Owner(owner) => {
|
|
||||||
let tb = XmlTreeBuilder::new(Sink {
|
|
||||||
base_url: url,
|
|
||||||
document: JS::from_ref(document),
|
|
||||||
});
|
|
||||||
let tok = XmlTokenizer::new(tb, Default::default());
|
|
||||||
|
|
||||||
ServoParser::new(
|
|
||||||
document, owner, Tokenizer::XML(tok), LastChunkState::NotReceived)
|
|
||||||
}
|
|
||||||
};
|
|
||||||
parser.parse_chunk(String::from(input));
|
|
||||||
}
|
|
||||||
|
|
|
@ -28,8 +28,7 @@ use dom::globalscope::GlobalScope;
|
||||||
use dom::headers::is_forbidden_header_name;
|
use dom::headers::is_forbidden_header_name;
|
||||||
use dom::htmlformelement::{encode_multipart_form_data, generate_boundary};
|
use dom::htmlformelement::{encode_multipart_form_data, generate_boundary};
|
||||||
use dom::progressevent::ProgressEvent;
|
use dom::progressevent::ProgressEvent;
|
||||||
use dom::servoparser::html::{ParseContext, parse_html};
|
use dom::servoparser::ServoParser;
|
||||||
use dom::servoparser::xml::{self, parse_xml};
|
|
||||||
use dom::window::Window;
|
use dom::window::Window;
|
||||||
use dom::workerglobalscope::WorkerGlobalScope;
|
use dom::workerglobalscope::WorkerGlobalScope;
|
||||||
use dom::xmlhttprequesteventtarget::XMLHttpRequestEventTarget;
|
use dom::xmlhttprequesteventtarget::XMLHttpRequestEventTarget;
|
||||||
|
@ -1199,10 +1198,11 @@ impl XMLHttpRequest {
|
||||||
let decoded = charset.decode(&self.response.borrow(), DecoderTrap::Replace).unwrap();
|
let decoded = charset.decode(&self.response.borrow(), DecoderTrap::Replace).unwrap();
|
||||||
let document = self.new_doc(IsHTMLDocument::HTMLDocument);
|
let document = self.new_doc(IsHTMLDocument::HTMLDocument);
|
||||||
// TODO: Disable scripting while parsing
|
// TODO: Disable scripting while parsing
|
||||||
parse_html(&document,
|
ServoParser::parse_html_document(
|
||||||
DOMString::from(decoded),
|
&document,
|
||||||
wr.get_url(),
|
DOMString::from(decoded),
|
||||||
ParseContext::Owner(Some(wr.pipeline_id())));
|
wr.get_url(),
|
||||||
|
Some(wr.pipeline_id()));
|
||||||
document
|
document
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -1212,10 +1212,11 @@ impl XMLHttpRequest {
|
||||||
let decoded = charset.decode(&self.response.borrow(), DecoderTrap::Replace).unwrap();
|
let decoded = charset.decode(&self.response.borrow(), DecoderTrap::Replace).unwrap();
|
||||||
let document = self.new_doc(IsHTMLDocument::NonHTMLDocument);
|
let document = self.new_doc(IsHTMLDocument::NonHTMLDocument);
|
||||||
// TODO: Disable scripting while parsing
|
// TODO: Disable scripting while parsing
|
||||||
parse_xml(&document,
|
ServoParser::parse_xml_document(
|
||||||
DOMString::from(decoded),
|
&document,
|
||||||
wr.get_url(),
|
DOMString::from(decoded),
|
||||||
xml::ParseContext::Owner(Some(wr.pipeline_id())));
|
wr.get_url(),
|
||||||
|
Some(wr.pipeline_id()));
|
||||||
document
|
document
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -51,8 +51,6 @@ use dom::node::{Node, NodeDamage, window_from_node};
|
||||||
use dom::serviceworker::TrustedServiceWorkerAddress;
|
use dom::serviceworker::TrustedServiceWorkerAddress;
|
||||||
use dom::serviceworkerregistration::ServiceWorkerRegistration;
|
use dom::serviceworkerregistration::ServiceWorkerRegistration;
|
||||||
use dom::servoparser::{ParserContext, ServoParser};
|
use dom::servoparser::{ParserContext, ServoParser};
|
||||||
use dom::servoparser::html::{ParseContext, parse_html};
|
|
||||||
use dom::servoparser::xml::{self, parse_xml};
|
|
||||||
use dom::transitionevent::TransitionEvent;
|
use dom::transitionevent::TransitionEvent;
|
||||||
use dom::uievent::UIEvent;
|
use dom::uievent::UIEvent;
|
||||||
use dom::window::{ReflowReason, Window};
|
use dom::window::{ReflowReason, Window};
|
||||||
|
@ -1779,15 +1777,17 @@ impl ScriptThread {
|
||||||
};
|
};
|
||||||
|
|
||||||
if is_xml {
|
if is_xml {
|
||||||
parse_xml(&document,
|
ServoParser::parse_xml_document(
|
||||||
parse_input,
|
&document,
|
||||||
final_url,
|
parse_input,
|
||||||
xml::ParseContext::Owner(Some(incomplete.pipeline_id)));
|
final_url,
|
||||||
|
Some(incomplete.pipeline_id));
|
||||||
} else {
|
} else {
|
||||||
parse_html(&document,
|
ServoParser::parse_html_document(
|
||||||
parse_input,
|
&document,
|
||||||
final_url,
|
parse_input,
|
||||||
ParseContext::Owner(Some(incomplete.pipeline_id)));
|
final_url,
|
||||||
|
Some(incomplete.pipeline_id));
|
||||||
}
|
}
|
||||||
|
|
||||||
if incomplete.is_frozen {
|
if incomplete.is_frozen {
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue