mirror of
https://github.com/servo/servo.git
synced 2025-06-06 16:45:39 +00:00
193 lines
6.8 KiB
Rust
193 lines
6.8 KiB
Rust
/* This Source Code Form is subject to the terms of the Mozilla Public
 * License, v. 2.0. If a copy of the MPL was not distributed with this
 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
|
|
|
|
#![allow(unrooted_must_root)]
|
|
|
|
use dom::bindings::codegen::Bindings::HTMLTemplateElementBinding::HTMLTemplateElementMethods;
|
|
use dom::bindings::inheritance::{Castable, CharacterDataTypeId, NodeTypeId};
|
|
use dom::bindings::js::{JS, Root};
|
|
use dom::bindings::trace::JSTraceable;
|
|
use dom::characterdata::CharacterData;
|
|
use dom::document::Document;
|
|
use dom::documenttype::DocumentType;
|
|
use dom::element::Element;
|
|
use dom::htmlscriptelement::HTMLScriptElement;
|
|
use dom::htmltemplateelement::HTMLTemplateElement;
|
|
use dom::node::Node;
|
|
use dom::processinginstruction::ProcessingInstruction;
|
|
use dom::servoparser::Sink;
|
|
use html5ever::QualName;
|
|
use html5ever::buffer_queue::BufferQueue;
|
|
use html5ever::serialize::{AttrRef, Serialize, Serializer};
|
|
use html5ever::serialize::TraversalScope;
|
|
use html5ever::serialize::TraversalScope::{ChildrenOnly, IncludeNode};
|
|
use html5ever::tokenizer::{Tokenizer as HtmlTokenizer, TokenizerOpts, TokenizerResult};
|
|
use html5ever::tree_builder::{Tracer as HtmlTracer, TreeBuilder, TreeBuilderOpts};
|
|
use js::jsapi::JSTracer;
|
|
use servo_url::ServoUrl;
|
|
use std::io;
|
|
|
|
#[derive(HeapSizeOf, JSTraceable)]
|
|
#[must_root]
|
|
pub struct Tokenizer {
|
|
#[ignore_heap_size_of = "Defined in html5ever"]
|
|
inner: HtmlTokenizer<TreeBuilder<JS<Node>, Sink>>,
|
|
}
|
|
|
|
impl Tokenizer {
|
|
pub fn new(
|
|
document: &Document,
|
|
url: ServoUrl,
|
|
fragment_context: Option<super::FragmentContext>)
|
|
-> Self {
|
|
let sink = Sink {
|
|
base_url: url,
|
|
document: JS::from_ref(document),
|
|
current_line: 1,
|
|
script: Default::default(),
|
|
};
|
|
|
|
let options = TreeBuilderOpts {
|
|
ignore_missing_rules: true,
|
|
.. Default::default()
|
|
};
|
|
|
|
let inner = if let Some(fc) = fragment_context {
|
|
let tb = TreeBuilder::new_for_fragment(
|
|
sink,
|
|
JS::from_ref(fc.context_elem),
|
|
fc.form_elem.map(|n| JS::from_ref(n)),
|
|
options);
|
|
|
|
let tok_options = TokenizerOpts {
|
|
initial_state: Some(tb.tokenizer_state_for_context_elem()),
|
|
.. Default::default()
|
|
};
|
|
|
|
HtmlTokenizer::new(tb, tok_options)
|
|
} else {
|
|
HtmlTokenizer::new(TreeBuilder::new(sink, options), Default::default())
|
|
};
|
|
|
|
Tokenizer {
|
|
inner: inner,
|
|
}
|
|
}
|
|
|
|
pub fn feed(&mut self, input: &mut BufferQueue) -> Result<(), Root<HTMLScriptElement>> {
|
|
match self.inner.feed(input) {
|
|
TokenizerResult::Done => Ok(()),
|
|
TokenizerResult::Script(script) => Err(Root::from_ref(script.downcast().unwrap())),
|
|
}
|
|
}
|
|
|
|
pub fn end(&mut self) {
|
|
self.inner.end();
|
|
}
|
|
|
|
pub fn url(&self) -> &ServoUrl {
|
|
&self.inner.sink().sink().base_url
|
|
}
|
|
|
|
pub fn set_plaintext_state(&mut self) {
|
|
self.inner.set_plaintext_state();
|
|
}
|
|
}
|
|
|
|
#[allow(unsafe_code)]
|
|
unsafe impl JSTraceable for HtmlTokenizer<TreeBuilder<JS<Node>, Sink>> {
|
|
unsafe fn trace(&self, trc: *mut JSTracer) {
|
|
struct Tracer(*mut JSTracer);
|
|
let tracer = Tracer(trc);
|
|
|
|
impl HtmlTracer for Tracer {
|
|
type Handle = JS<Node>;
|
|
#[allow(unrooted_must_root)]
|
|
fn trace_handle(&self, node: &JS<Node>) {
|
|
unsafe { node.trace(self.0); }
|
|
}
|
|
}
|
|
|
|
let tree_builder = self.sink();
|
|
tree_builder.trace_handles(&tracer);
|
|
tree_builder.sink().trace(trc);
|
|
}
|
|
}
|
|
|
|
impl<'a> Serialize for &'a Node {
|
|
fn serialize<S: Serializer>(&self, serializer: &mut S,
|
|
traversal_scope: TraversalScope) -> io::Result<()> {
|
|
let node = *self;
|
|
match (traversal_scope, node.type_id()) {
|
|
(_, NodeTypeId::Element(..)) => {
|
|
let elem = node.downcast::<Element>().unwrap();
|
|
let name = QualName::new(None, elem.namespace().clone(),
|
|
elem.local_name().clone());
|
|
if traversal_scope == IncludeNode {
|
|
let attrs = elem.attrs().iter().map(|attr| {
|
|
let qname = QualName::new(None, attr.namespace().clone(),
|
|
attr.local_name().clone());
|
|
let value = attr.value().clone();
|
|
(qname, value)
|
|
}).collect::<Vec<_>>();
|
|
let attr_refs = attrs.iter().map(|&(ref qname, ref value)| {
|
|
let ar: AttrRef = (&qname, &**value);
|
|
ar
|
|
});
|
|
try!(serializer.start_elem(name.clone(), attr_refs));
|
|
}
|
|
|
|
let children = if let Some(tpl) = node.downcast::<HTMLTemplateElement>() {
|
|
// https://github.com/w3c/DOM-Parsing/issues/1
|
|
tpl.Content().upcast::<Node>().children()
|
|
} else {
|
|
node.children()
|
|
};
|
|
|
|
for handle in children {
|
|
try!((&*handle).serialize(serializer, IncludeNode));
|
|
}
|
|
|
|
if traversal_scope == IncludeNode {
|
|
try!(serializer.end_elem(name.clone()));
|
|
}
|
|
Ok(())
|
|
},
|
|
|
|
(ChildrenOnly, NodeTypeId::Document(_)) => {
|
|
for handle in node.children() {
|
|
try!((&*handle).serialize(serializer, IncludeNode));
|
|
}
|
|
Ok(())
|
|
},
|
|
|
|
(ChildrenOnly, _) => Ok(()),
|
|
|
|
(IncludeNode, NodeTypeId::DocumentType) => {
|
|
let doctype = node.downcast::<DocumentType>().unwrap();
|
|
serializer.write_doctype(&doctype.name())
|
|
},
|
|
|
|
(IncludeNode, NodeTypeId::CharacterData(CharacterDataTypeId::Text)) => {
|
|
let cdata = node.downcast::<CharacterData>().unwrap();
|
|
serializer.write_text(&cdata.data())
|
|
},
|
|
|
|
(IncludeNode, NodeTypeId::CharacterData(CharacterDataTypeId::Comment)) => {
|
|
let cdata = node.downcast::<CharacterData>().unwrap();
|
|
serializer.write_comment(&cdata.data())
|
|
},
|
|
|
|
(IncludeNode, NodeTypeId::CharacterData(CharacterDataTypeId::ProcessingInstruction)) => {
|
|
let pi = node.downcast::<ProcessingInstruction>().unwrap();
|
|
let data = pi.upcast::<CharacterData>().data();
|
|
serializer.write_processing_instruction(&pi.target(), &data)
|
|
},
|
|
|
|
(IncludeNode, NodeTypeId::DocumentFragment) => Ok(()),
|
|
|
|
(IncludeNode, NodeTypeId::Document(_)) => panic!("Can't serialize Document node itself"),
|
|
}
|
|
}
|
|
}
|