(&mut self, pred: TagSet)
- where TagSet: Fn(ExpandedName) -> bool
- {
- loop {
- if self.current_node_in(|x| pred(x)) {
- break;
- }
- self.open_elems.pop();
- }
- }
-
- // Pop elements until an element from the set has been popped. Returns the
- // number of elements popped.
- fn pop_until<P>(&mut self, pred: P) -> usize
- where P: Fn(ExpandedName) -> bool
- {
- let mut n = 0;
- loop {
- n += 1;
- match self.open_elems.pop() {
- None => break,
- Some(elem) => if pred(self.sink.elem_name(&elem)) { break; },
- }
- }
- n
- }
-
- fn pop_until_named(&mut self, name: LocalName) -> usize {
- self.pop_until(|p| *p.ns == ns!(html) && *p.local == name)
- }
-
- // Pop elements until one with the specified name has been popped.
- // Signal an error if it was not the first one.
- fn expect_to_close(&mut self, name: LocalName) {
- if self.pop_until_named(name.clone()) != 1 {
- self.sink.parse_error(format_if!(self.opts.exact_errors,
- "Unexpected open element",
- "Unexpected open element while closing {:?}", name));
- }
- }
-
- fn close_p_element(&mut self) {
- declare_tag_set!(implied = [cursory_implied_end] - "p");
- self.generate_implied_end(implied);
- self.expect_to_close(local_name!("p"));
- }
-
- fn close_p_element_in_button_scope(&mut self) {
- if self.in_scope_named(button_scope, local_name!("p")) {
- self.close_p_element();
- }
- }
-
- // Check tags for type=hidden
- fn is_type_hidden(&self, tag: &Tag) -> bool {
- match tag.attrs.iter().find(|&at| at.name.expanded() == expanded_name!("", "type")) {
- None => false,
- Some(at) => (&*at.value).eq_ignore_ascii_case("hidden"),
- }
- }
-
- fn foster_parent_in_body(&mut self, token: Token) -> ProcessResult {
- warn!("foster parenting not implemented");
- self.foster_parenting = true;
- let res = self.step(InBody, token);
- // FIXME: what if res is Reprocess?
- self.foster_parenting = false;
- res
- }
-
- fn process_chars_in_table(&mut self, token: Token) -> ProcessResult {
- declare_tag_set!(table_outer = "table" "tbody" "tfoot" "thead" "tr");
- if self.current_node_in(table_outer) {
- assert!(self.pending_table_text.is_empty());
- self.orig_mode = Some(self.mode);
- Reprocess(InTableText, token)
- } else {
- self.sink.parse_error(format_if!(self.opts.exact_errors,
- "Unexpected characters in table",
- "Unexpected characters {} in table", to_escaped_string(&token)));
- self.foster_parent_in_body(token)
- }
- }
-
- // https://html.spec.whatwg.org/multipage/syntax.html#reset-the-insertion-mode-appropriately
- fn reset_insertion_mode(&mut self) -> InsertionMode {
- for (i, mut node) in self.open_elems.iter().enumerate().rev() {
- let last = i == 0usize;
- if let (true, Some(ctx)) = (last, self.context_elem.as_ref()) {
- node = ctx;
- }
- let name = match self.sink.elem_name(node) {
- ExpandedName { ns: &ns!(html), local } => local,
- _ => continue,
- };
- match *name {
- local_name!("select") => {
- for ancestor in self.open_elems[0..i].iter().rev() {
- if self.html_elem_named(ancestor, local_name!("template")) {
- return InSelect;
- } else if self.html_elem_named(ancestor, local_name!("table")) {
- return InSelectInTable;
- }
- }
- return InSelect;
- },
- local_name!("td") | local_name!("th") => if !last { return InCell; },
- local_name!("tr") => return InRow,
- local_name!("tbody") | local_name!("thead") | local_name!("tfoot") => return InTableBody,
- local_name!("caption") => return InCaption,
- local_name!("colgroup") => return InColumnGroup,
- local_name!("table") => return InTable,
- local_name!("template") => return *self.template_modes.last().unwrap(),
- local_name!("head") => if !last { return InHead },
- local_name!("body") => return InBody,
- local_name!("frameset") => return InFrameset,
- local_name!("html") => match self.head_elem {
- None => return BeforeHead,
- Some(_) => return AfterHead,
- },
-
- _ => (),
- }
- }
- InBody
- }
-
- fn close_the_cell(&mut self) {
- self.generate_implied_end(cursory_implied_end);
- if self.pop_until(td_th) != 1 {
- self.sink.parse_error(Borrowed("expected to close <td> or <th> with cell"));
- }
- self.clear_active_formatting_to_marker();
- }
-
- fn append_text(&mut self, text: StrTendril) -> ProcessResult {
- self.insert_appropriately(AppendText(text), None);
- Done
- }
-
- fn append_comment(&mut self, text: StrTendril) -> ProcessResult {
- let comment = self.sink.create_comment(text);
- self.insert_appropriately(AppendNode(comment), None);
- Done
- }
-
- fn append_comment_to_doc(&mut self, text: StrTendril) -> ProcessResult {
- let comment = self.sink.create_comment(text);
- self.sink.append(&self.doc_handle, AppendNode(comment));
- Done
- }
-
- fn append_comment_to_html(&mut self, text: StrTendril) -> ProcessResult {
- let target = html_elem(&self.open_elems);
- let comment = self.sink.create_comment(text);
- self.sink.append(target, AppendNode(comment));
- Done
- }
-
- //§ creating-and-inserting-nodes
- fn create_root(&mut self, attrs: Vec<Attribute>) {
- let elem = create_element(
- &mut self.sink, QualName::new(None, ns!(html), local_name!("html")),
- attrs);
- self.push(&elem);
- self.sink.append(&self.doc_handle, AppendNode(elem));
- // FIXME: application cache selection algorithm
- }
-
- // https://html.spec.whatwg.org/multipage/#create-an-element-for-the-token
- fn insert_element(&mut self, push: PushFlag, ns: Namespace, name: LocalName, attrs: Vec<Attribute>)
- -> Handle {
- declare_tag_set!(form_associatable =
- "button" "fieldset" "input" "object"
- "output" "select" "textarea" "img");
-
- declare_tag_set!(listed = [form_associatable] - "img");
-
- // Step 7.
- let qname = QualName::new(None, ns, name);
- let elem = create_element(&mut self.sink, qname.clone(), attrs.clone());
-
- let insertion_point = self.appropriate_place_for_insertion(None);
- let tree_node = match insertion_point {
- LastChild(ref p) |
- BeforeSibling(ref p) => p.clone()
- };
-
- // Step 12.
- if form_associatable(qname.expanded()) &&
- self.form_elem.is_some() &&
- !self.in_html_elem_named(local_name!("template")) &&
- !(listed(qname.expanded()) &&
- attrs.iter().any(|a| a.name.expanded() == expanded_name!("", "form"))) {
-
- let form = self.form_elem.as_ref().unwrap().clone();
- if self.sink.same_tree(&tree_node, &form) {
- self.sink.associate_with_form(&elem, &form)
- }
- }
-
- self.insert_at(insertion_point, AppendNode(elem.clone()));
-
- match push {
- Push => self.push(&elem),
- NoPush => (),
- }
- // FIXME: Remove from the stack if we can't append?
- elem
- }
-
- fn insert_element_for(&mut self, tag: Tag) -> Handle {
- self.insert_element(Push, ns!(html), tag.name, tag.attrs)
- }
-
- fn insert_and_pop_element_for(&mut self, tag: Tag) -> Handle {
- self.insert_element(NoPush, ns!(html), tag.name, tag.attrs)
- }
-
- fn insert_phantom(&mut self, name: LocalName) -> Handle {
- self.insert_element(Push, ns!(html), name, vec!())
- }
- //§ END
-
- fn create_formatting_element_for(&mut self, tag: Tag) -> Handle {
- // FIXME: This really wants unit tests.
- let mut first_match = None;
- let mut matches = 0usize;
- for (i, _, old_tag) in self.active_formatting_end_to_marker() {
- if tag.equiv_modulo_attr_order(old_tag) {
- first_match = Some(i);
- matches += 1;
- }
- }
-
- if matches >= 3 {
- self.active_formatting.remove(first_match.expect("matches with no index"));
- }
-
- let elem = self.insert_element(Push, ns!(html), tag.name.clone(), tag.attrs.clone());
- self.active_formatting.push(Element(elem.clone(), tag));
- elem
- }
-
- fn clear_active_formatting_to_marker(&mut self) {
- loop {
- match self.active_formatting.pop() {
- None | Some(Marker) => break,
- _ => (),
- }
- }
- }
-
- fn process_end_tag_in_body(&mut self, tag: Tag) {
- // Look back for a matching open element.
- let mut match_idx = None;
- for (i, elem) in self.open_elems.iter().enumerate().rev() {
- if self.html_elem_named(elem, tag.name.clone()) {
- match_idx = Some(i);
- break;
- }
-
- if self.elem_in(elem, special_tag) {
- self.sink.parse_error(Borrowed("Found special tag while closing generic tag"));
- return;
- }
- }
-
- // Can't use unwrap_or_return!() due to rust-lang/rust#16617.
- let match_idx = match match_idx {
- None => {
- // I believe this is impossible, because the root
- // element is in special_tag.
- self.unexpected(&tag);
- return;
- }
- Some(x) => x,
- };
-
- self.generate_implied_end_except(tag.name.clone());
-
- if match_idx != self.open_elems.len() - 1 {
- // mis-nested tags
- self.unexpected(&tag);
- }
- self.open_elems.truncate(match_idx);
- }
-
- fn handle_misnested_a_tags(&mut self, tag: &Tag) {
- let node = unwrap_or_return!(
- self.active_formatting_end_to_marker()
- .filter(|&(_, n, _)| self.html_elem_named(n, local_name!("a")))
- .next()
- .map(|(_, n, _)| n.clone()),
-
- ()
- );
-
- self.unexpected(tag);
- self.adoption_agency(local_name!("a"));
- self.position_in_active_formatting(&node)
- .map(|index| self.active_formatting.remove(index));
- self.remove_from_stack(&node);
- }
-
- //§ tree-construction
- fn is_foreign(&mut self, token: &Token) -> bool {
- if let EOFToken = *token {
- return false;
- }
-
- if self.open_elems.len() == 0 {
- return false;
- }
-
- let name = self.sink.elem_name(self.adjusted_current_node());
- if let ns!(html) = *name.ns {
- return false;
- }
-
- if mathml_text_integration_point(name) {
- match *token {
- CharacterTokens(..) | NullCharacterToken => return false,
- TagToken(Tag { kind: StartTag, ref name, .. })
- if !matches!(*name, local_name!("mglyph") | local_name!("malignmark")) => return false,
- _ => (),
- }
- }
-
- if svg_html_integration_point(name) {
- match *token {
- CharacterTokens(..) | NullCharacterToken => return false,
- TagToken(Tag { kind: StartTag, .. }) => return false,
- _ => (),
- }
- }
-
- if let expanded_name!(mathml "annotation-xml") = name {
- match *token {
- TagToken(Tag { kind: StartTag, name: local_name!("svg"), .. }) => return false,
- CharacterTokens(..) | NullCharacterToken |
- TagToken(Tag { kind: StartTag, .. }) => {
- return !self.sink.is_mathml_annotation_xml_integration_point(
- self.adjusted_current_node())
- }
- _ => {}
- };
- }
-
- true
- }
- //§ END
-
- fn enter_foreign(&mut self, mut tag: Tag, ns: Namespace) -> ProcessResult {
- match ns {
- ns!(mathml) => self.adjust_mathml_attributes(&mut tag),
- ns!(svg) => self.adjust_svg_attributes(&mut tag),
- _ => (),
- }
- self.adjust_foreign_attributes(&mut tag);
-
- if tag.self_closing {
- self.insert_element(NoPush, ns, tag.name, tag.attrs);
- DoneAckSelfClosing
- } else {
- self.insert_element(Push, ns, tag.name, tag.attrs);
- Done
- }
- }
-
- fn adjust_svg_tag_name(&mut self, tag: &mut Tag) {
- let Tag { ref mut name, .. } = *tag;
- match *name {
- local_name!("altglyph") => *name = local_name!("altGlyph"),
- local_name!("altglyphdef") => *name = local_name!("altGlyphDef"),
- local_name!("altglyphitem") => *name = local_name!("altGlyphItem"),
- local_name!("animatecolor") => *name = local_name!("animateColor"),
- local_name!("animatemotion") => *name = local_name!("animateMotion"),
- local_name!("animatetransform") => *name = local_name!("animateTransform"),
- local_name!("clippath") => *name = local_name!("clipPath"),
- local_name!("feblend") => *name = local_name!("feBlend"),
- local_name!("fecolormatrix") => *name = local_name!("feColorMatrix"),
- local_name!("fecomponenttransfer") => *name = local_name!("feComponentTransfer"),
- local_name!("fecomposite") => *name = local_name!("feComposite"),
- local_name!("feconvolvematrix") => *name = local_name!("feConvolveMatrix"),
- local_name!("fediffuselighting") => *name = local_name!("feDiffuseLighting"),
- local_name!("fedisplacementmap") => *name = local_name!("feDisplacementMap"),
- local_name!("fedistantlight") => *name = local_name!("feDistantLight"),
- local_name!("fedropshadow") => *name = local_name!("feDropShadow"),
- local_name!("feflood") => *name = local_name!("feFlood"),
- local_name!("fefunca") => *name = local_name!("feFuncA"),
- local_name!("fefuncb") => *name = local_name!("feFuncB"),
- local_name!("fefuncg") => *name = local_name!("feFuncG"),
- local_name!("fefuncr") => *name = local_name!("feFuncR"),
- local_name!("fegaussianblur") => *name = local_name!("feGaussianBlur"),
- local_name!("feimage") => *name = local_name!("feImage"),
- local_name!("femerge") => *name = local_name!("feMerge"),
- local_name!("femergenode") => *name = local_name!("feMergeNode"),
- local_name!("femorphology") => *name = local_name!("feMorphology"),
- local_name!("feoffset") => *name = local_name!("feOffset"),
- local_name!("fepointlight") => *name = local_name!("fePointLight"),
- local_name!("fespecularlighting") => *name = local_name!("feSpecularLighting"),
- local_name!("fespotlight") => *name = local_name!("feSpotLight"),
- local_name!("fetile") => *name = local_name!("feTile"),
- local_name!("feturbulence") => *name = local_name!("feTurbulence"),
- local_name!("foreignobject") => *name = local_name!("foreignObject"),
- local_name!("glyphref") => *name = local_name!("glyphRef"),
- local_name!("lineargradient") => *name = local_name!("linearGradient"),
- local_name!("radialgradient") => *name = local_name!("radialGradient"),
- local_name!("textpath") => *name = local_name!("textPath"),
- _ => (),
- }
- }
-
- fn adjust_attributes<F>(&mut self, tag: &mut Tag, mut map: F)
- where F: FnMut(LocalName) -> Option<QualName>,
- {
- for &mut Attribute { ref mut name, .. } in &mut tag.attrs {
- if let Some(replacement) = map(name.local.clone()) {
- *name = replacement;
- }
- }
- }
-
- fn adjust_svg_attributes(&mut self, tag: &mut Tag) {
- self.adjust_attributes(tag, |k| match k {
- local_name!("attributename") => Some(qualname!("", "attributeName")),
- local_name!("attributetype") => Some(qualname!("", "attributeType")),
- local_name!("basefrequency") => Some(qualname!("", "baseFrequency")),
- local_name!("baseprofile") => Some(qualname!("", "baseProfile")),
- local_name!("calcmode") => Some(qualname!("", "calcMode")),
- local_name!("clippathunits") => Some(qualname!("", "clipPathUnits")),
- local_name!("diffuseconstant") => Some(qualname!("", "diffuseConstant")),
- local_name!("edgemode") => Some(qualname!("", "edgeMode")),
- local_name!("filterunits") => Some(qualname!("", "filterUnits")),
- local_name!("glyphref") => Some(qualname!("", "glyphRef")),
- local_name!("gradienttransform") => Some(qualname!("", "gradientTransform")),
- local_name!("gradientunits") => Some(qualname!("", "gradientUnits")),
- local_name!("kernelmatrix") => Some(qualname!("", "kernelMatrix")),
- local_name!("kernelunitlength") => Some(qualname!("", "kernelUnitLength")),
- local_name!("keypoints") => Some(qualname!("", "keyPoints")),
- local_name!("keysplines") => Some(qualname!("", "keySplines")),
- local_name!("keytimes") => Some(qualname!("", "keyTimes")),
- local_name!("lengthadjust") => Some(qualname!("", "lengthAdjust")),
- local_name!("limitingconeangle") => Some(qualname!("", "limitingConeAngle")),
- local_name!("markerheight") => Some(qualname!("", "markerHeight")),
- local_name!("markerunits") => Some(qualname!("", "markerUnits")),
- local_name!("markerwidth") => Some(qualname!("", "markerWidth")),
- local_name!("maskcontentunits") => Some(qualname!("", "maskContentUnits")),
- local_name!("maskunits") => Some(qualname!("", "maskUnits")),
- local_name!("numoctaves") => Some(qualname!("", "numOctaves")),
- local_name!("pathlength") => Some(qualname!("", "pathLength")),
- local_name!("patterncontentunits") => Some(qualname!("", "patternContentUnits")),
- local_name!("patterntransform") => Some(qualname!("", "patternTransform")),
- local_name!("patternunits") => Some(qualname!("", "patternUnits")),
- local_name!("pointsatx") => Some(qualname!("", "pointsAtX")),
- local_name!("pointsaty") => Some(qualname!("", "pointsAtY")),
- local_name!("pointsatz") => Some(qualname!("", "pointsAtZ")),
- local_name!("preservealpha") => Some(qualname!("", "preserveAlpha")),
- local_name!("preserveaspectratio") => Some(qualname!("", "preserveAspectRatio")),
- local_name!("primitiveunits") => Some(qualname!("", "primitiveUnits")),
- local_name!("refx") => Some(qualname!("", "refX")),
- local_name!("refy") => Some(qualname!("", "refY")),
- local_name!("repeatcount") => Some(qualname!("", "repeatCount")),
- local_name!("repeatdur") => Some(qualname!("", "repeatDur")),
- local_name!("requiredextensions") => Some(qualname!("", "requiredExtensions")),
- local_name!("requiredfeatures") => Some(qualname!("", "requiredFeatures")),
- local_name!("specularconstant") => Some(qualname!("", "specularConstant")),
- local_name!("specularexponent") => Some(qualname!("", "specularExponent")),
- local_name!("spreadmethod") => Some(qualname!("", "spreadMethod")),
- local_name!("startoffset") => Some(qualname!("", "startOffset")),
- local_name!("stddeviation") => Some(qualname!("", "stdDeviation")),
- local_name!("stitchtiles") => Some(qualname!("", "stitchTiles")),
- local_name!("surfacescale") => Some(qualname!("", "surfaceScale")),
- local_name!("systemlanguage") => Some(qualname!("", "systemLanguage")),
- local_name!("tablevalues") => Some(qualname!("", "tableValues")),
- local_name!("targetx") => Some(qualname!("", "targetX")),
- local_name!("targety") => Some(qualname!("", "targetY")),
- local_name!("textlength") => Some(qualname!("", "textLength")),
- local_name!("viewbox") => Some(qualname!("", "viewBox")),
- local_name!("viewtarget") => Some(qualname!("", "viewTarget")),
- local_name!("xchannelselector") => Some(qualname!("", "xChannelSelector")),
- local_name!("ychannelselector") => Some(qualname!("", "yChannelSelector")),
- local_name!("zoomandpan") => Some(qualname!("", "zoomAndPan")),
- _ => None,
- });
- }
-
- fn adjust_mathml_attributes(&mut self, tag: &mut Tag) {
- self.adjust_attributes(tag, |k| match k {
- local_name!("definitionurl") => Some(qualname!("", "definitionURL")),
- _ => None,
- });
- }
-
- fn adjust_foreign_attributes(&mut self, tag: &mut Tag) {
- self.adjust_attributes(tag, |k| match k {
- local_name!("xlink:actuate") => Some(qualname!("xlink" xlink "actuate")),
- local_name!("xlink:arcrole") => Some(qualname!("xlink" xlink "arcrole")),
- local_name!("xlink:href") => Some(qualname!("xlink" xlink "href")),
- local_name!("xlink:role") => Some(qualname!("xlink" xlink "role")),
- local_name!("xlink:show") => Some(qualname!("xlink" xlink "show")),
- local_name!("xlink:title") => Some(qualname!("xlink" xlink "title")),
- local_name!("xlink:type") => Some(qualname!("xlink" xlink "type")),
- local_name!("xml:base") => Some(qualname!("xml" xml "base")),
- local_name!("xml:lang") => Some(qualname!("xml" xml "lang")),
- local_name!("xml:space") => Some(qualname!("xml" xml "space")),
- local_name!("xmlns") => Some(qualname!("" xmlns "xmlns")),
- local_name!("xmlns:xlink") => Some(qualname!("xmlns" xmlns "xlink")),
- _ => None,
- });
- }
-
- fn foreign_start_tag(&mut self, mut tag: Tag) -> ProcessResult {
- let current_ns = self.sink.elem_name(self.adjusted_current_node()).ns.clone();
- match current_ns {
- ns!(mathml) => self.adjust_mathml_attributes(&mut tag),
- ns!(svg) => {
- self.adjust_svg_tag_name(&mut tag);
- self.adjust_svg_attributes(&mut tag);
- }
- _ => (),
- }
- self.adjust_foreign_attributes(&mut tag);
- if tag.self_closing {
- // FIXME(#118): in SVG
- self.insert_element(NoPush, current_ns, tag.name, tag.attrs);
- DoneAckSelfClosing
- } else {
- self.insert_element(Push, current_ns, tag.name, tag.attrs);
- Done
- }
- }
-
- fn unexpected_start_tag_in_foreign_content(&mut self, tag: Tag) -> ProcessResult {
- self.unexpected(&tag);
- if self.is_fragment() {
- self.foreign_start_tag(tag)
- } else {
- self.pop();
- while !self.current_node_in(|n| {
- *n.ns == ns!(html) ||
- mathml_text_integration_point(n) ||
- svg_html_integration_point(n)
- }) {
- self.pop();
- }
- ReprocessForeign(TagToken(tag))
- }
- }
-}
diff --git a/html5ever/src/tree_builder/mod.rs b/html5ever/src/tree_builder/mod.rs
index fc2c6c8c..d6480129 100644
--- a/html5ever/src/tree_builder/mod.rs
+++ b/html5ever/src/tree_builder/mod.rs
@@ -12,39 +12,41 @@
//! The HTML5 tree builder.
pub use interface::{QuirksMode, Quirks, LimitedQuirks, NoQuirks};
-pub use interface::{NodeOrText, AppendNode, AppendText};
+pub use interface::{NodeOrText, AppendNode, AppendText, Attribute};
pub use interface::{TreeSink, Tracer, NextParserState, create_element, ElementFlags};
use self::types::*;
-use self::actions::TreeBuilderActions;
-use self::rules::TreeBuilderStep;
-use ExpandedName;
-use QualName;
+use {ExpandedName, QualName, LocalName, Namespace};
use tendril::StrTendril;
use tokenizer;
-use tokenizer::{Doctype, StartTag, Tag, TokenSink, TokenSinkResult};
+use tokenizer::{Doctype, StartTag, Tag, EndTag, TokenSink, TokenSinkResult};
use tokenizer::states as tok_state;
use util::str::is_ascii_whitespace;
-use std::default::Default;
-use std::mem::replace;
+use std::{slice, fmt};
+use std::ascii::AsciiExt;
use std::borrow::Cow::Borrowed;
use std::collections::VecDeque;
+use std::default::Default;
+use std::iter::{Rev, Enumerate};
+use std::mem::replace;
+
+use tokenizer::states::{RawData, RawKind};
+use tree_builder::types::*;
+use tree_builder::tag_sets::*;
+use util::str::to_escaped_string;
+
+pub use self::PushFlag::*;
#[macro_use] mod tag_sets;
mod data;
mod types;
-mod actions;
-
-mod rules {
- //! The tree builder rules, as a single, enormous nested match expression.
- include!(concat!(env!("OUT_DIR"), "/rules.rs"));
-}
+include!(concat!(env!("OUT_DIR"), "/rules.rs"));
/// Tree builder options, with an impl for Default.
#[derive(Copy, Clone)]
@@ -486,6 +488,1065 @@ impl TokenSink
}
}
+pub fn html_elem<Handle>(open_elems: &[Handle]) -> &Handle {
+ &open_elems[0]
+}
+
+pub struct ActiveFormattingIter<'a, Handle: 'a> {
+ iter: Rev<Enumerate<slice::Iter<'a, FormatEntry<Handle>>>>,
+}
+
+impl<'a, Handle> Iterator for ActiveFormattingIter<'a, Handle> {
+ type Item = (usize, &'a Handle, &'a Tag);
+ fn next(&mut self) -> Option<(usize, &'a Handle, &'a Tag)> {
+ match self.iter.next() {
+ None | Some((_, &Marker)) => None,
+ Some((i, &Element(ref h, ref t))) => Some((i, h, t)),
+ }
+ }
+}
+
+pub enum PushFlag {
+ Push,
+ NoPush,
+}
+
+enum Bookmark<Handle> {
+ Replace(Handle),
+ InsertAfter(Handle),
+}
+
+macro_rules! qualname {
+ ("", $local:tt) => {
+ QualName {
+ prefix: None,
+ ns: ns!(),
+ local: local_name!($local),
+ }
+ };
+ ($prefix: tt $ns:tt $local:tt) => {
+ QualName {
+ prefix: Some(namespace_prefix!($prefix)),
+ ns: ns!($ns),
+ local: local_name!($local),
+ }
+ }
+}
+
+#[doc(hidden)]
+impl TreeBuilder
+ where Handle: Clone,
+ Sink: TreeSink,
+{
+ fn unexpected<T: fmt::Debug>(&mut self, _thing: &T) -> ProcessResult {
+ self.sink.parse_error(format_if!(
+ self.opts.exact_errors,
+ "Unexpected token",
+ "Unexpected token {} in insertion mode {:?}", to_escaped_string(_thing), self.mode));
+ Done
+ }
+
+ fn assert_named(&mut self, node: &Handle, name: LocalName) {
+ assert!(self.html_elem_named(&node, name));
+ }
+
+ /// Iterate over the active formatting elements (with index in the list) from the end
+ /// to the last marker, or the beginning if there are no markers.
+ fn active_formatting_end_to_marker<'a>(&'a self) -> ActiveFormattingIter<'a, Handle> {
+ ActiveFormattingIter {
+ iter: self.active_formatting.iter().enumerate().rev(),
+ }
+ }
+
+ fn position_in_active_formatting(&self, element: &Handle) -> Option<usize> {
+ self.active_formatting
+ .iter()
+ .position(|n| {
+ match n {
+ &Marker => false,
+ &Element(ref handle, _) => self.sink.same_node(handle, element)
+ }
+ })
+ }
+
+ fn set_quirks_mode(&mut self, mode: QuirksMode) {
+ self.quirks_mode = mode;
+ self.sink.set_quirks_mode(mode);
+ }
+
+ fn stop_parsing(&mut self) -> ProcessResult {
+ warn!("stop_parsing not implemented, full speed ahead!");
+ Done
+ }
+
+ //§ parsing-elements-that-contain-only-text
+ // Switch to `Text` insertion mode, save the old mode, and
+ // switch the tokenizer to a raw-data state.
+ // The latter only takes effect after the current / next
+ // `process_token` of a start tag returns!
+ fn to_raw_text_mode(&mut self, k: RawKind) -> ProcessResult {
+ self.orig_mode = Some(self.mode);
+ self.mode = Text;
+ ToRawData(k)
+ }
+
+ // The generic raw text / RCDATA parsing algorithm.
+ fn parse_raw_data(&mut self, tag: Tag, k: RawKind) -> ProcessResult {
+ self.insert_element_for(tag);
+ self.to_raw_text_mode(k)
+ }
+ //§ END
+
+ fn current_node(&self) -> &Handle {
+ self.open_elems.last().expect("no current element")
+ }
+
+ fn adjusted_current_node(&self) -> &Handle {
+ if self.open_elems.len() == 1 {
+ if let Some(ctx) = self.context_elem.as_ref() {
+ return ctx;
+ }
+ }
+ self.current_node()
+ }
+
+ fn current_node_in<TagSet>(&self, set: TagSet) -> bool
+ where TagSet: Fn(ExpandedName) -> bool
+ {
+ set(self.sink.elem_name(self.current_node()))
+ }
+
+ // Insert at the "appropriate place for inserting a node".
+ fn insert_appropriately(&mut self, child: NodeOrText<Handle>, override_target: Option<Handle>) {
+ let insertion_point = self.appropriate_place_for_insertion(override_target);
+ self.insert_at(insertion_point, child);
+ }
+
+ fn adoption_agency(&mut self, subject: LocalName) {
+ // 1.
+ if self.current_node_named(subject.clone()) {
+ if self.position_in_active_formatting(self.current_node()).is_none() {
+ self.pop();
+ return;
+ }
+ }
+
+ // 2. 3. 4.
+ for _ in 0..8 {
+ // 5.
+ let (fmt_elem_index, fmt_elem, fmt_elem_tag) = unwrap_or_return!(
+ // We clone the Handle and Tag so they don't cause an immutable borrow of self.
+ self.active_formatting_end_to_marker()
+ .filter(|&(_, _, tag)| tag.name == subject)
+ .next()
+ .map(|(i, h, t)| (i, h.clone(), t.clone())),
+
+ {
+ self.process_end_tag_in_body(Tag {
+ kind: EndTag,
+ name: subject,
+ self_closing: false,
+ attrs: vec!(),
+ });
+ }
+ );
+
+ let fmt_elem_stack_index = unwrap_or_return!(
+ self.open_elems.iter()
+ .rposition(|n| self.sink.same_node(n, &fmt_elem)),
+
+ {
+ self.sink.parse_error(Borrowed("Formatting element not open"));
+ self.active_formatting.remove(fmt_elem_index);
+ }
+ );
+
+ // 7.
+ if !self.in_scope(default_scope, |n| self.sink.same_node(&n, &fmt_elem)) {
+ self.sink.parse_error(Borrowed("Formatting element not in scope"));
+ return;
+ }
+
+ // 8.
+ if !self.sink.same_node(self.current_node(), &fmt_elem) {
+ self.sink.parse_error(Borrowed("Formatting element not current node"));
+ }
+
+ // 9.
+ let (furthest_block_index, furthest_block) = unwrap_or_return!(
+ self.open_elems.iter()
+ .enumerate()
+ .skip(fmt_elem_stack_index)
+ .filter(|&(_, open_element)| self.elem_in(open_element, special_tag))
+ .next()
+ .map(|(i, h)| (i, h.clone())),
+
+ // 10.
+ {
+ self.open_elems.truncate(fmt_elem_stack_index);
+ self.active_formatting.remove(fmt_elem_index);
+ }
+ );
+
+ // 11.
+ let common_ancestor = self.open_elems[fmt_elem_stack_index - 1].clone();
+
+ // 12.
+ let mut bookmark = Bookmark::Replace(fmt_elem.clone());
+
+ // 13.
+ let mut node;
+ let mut node_index = furthest_block_index;
+ let mut last_node = furthest_block.clone();
+
+ // 13.1.
+ let mut inner_counter = 0;
+ loop {
+ // 13.2.
+ inner_counter += 1;
+
+ // 13.3.
+ node_index -= 1;
+ node = self.open_elems[node_index].clone();
+
+ // 13.4.
+ if self.sink.same_node(&node, &fmt_elem) {
+ break;
+ }
+
+ // 13.5.
+ if inner_counter > 3 {
+ self.position_in_active_formatting(&node)
+ .map(|position| self.active_formatting.remove(position));
+ self.open_elems.remove(node_index);
+ continue;
+ }
+
+ let node_formatting_index = unwrap_or_else!(
+ self.position_in_active_formatting(&node),
+
+ // 13.6.
+ {
+ self.open_elems.remove(node_index);
+ continue;
+ }
+ );
+
+ // 13.7.
+ let tag = match self.active_formatting[node_formatting_index] {
+ Element(ref h, ref t) => {
+ assert!(self.sink.same_node(h, &node));
+ t.clone()
+ }
+ Marker => panic!("Found marker during adoption agency"),
+ };
+ // FIXME: Is there a way to avoid cloning the attributes twice here (once on their
+ // own, once as part of t.clone() above)?
+ let new_element = create_element(
+ &mut self.sink, QualName::new(None, ns!(html), tag.name.clone()),
+ tag.attrs.clone());
+ self.open_elems[node_index] = new_element.clone();
+ self.active_formatting[node_formatting_index] = Element(new_element.clone(), tag);
+ node = new_element;
+
+ // 13.8.
+ if self.sink.same_node(&last_node, &furthest_block) {
+ bookmark = Bookmark::InsertAfter(node.clone());
+ }
+
+ // 13.9.
+ self.sink.remove_from_parent(&last_node);
+ self.sink.append(&node, AppendNode(last_node.clone()));
+
+ // 13.10.
+ last_node = node.clone();
+
+ // 13.11.
+ }
+
+ // 14.
+ self.sink.remove_from_parent(&last_node);
+ self.insert_appropriately(AppendNode(last_node.clone()), Some(common_ancestor));
+
+ // 15.
+ // FIXME: Is there a way to avoid cloning the attributes twice here (once on their own,
+ // once as part of t.clone() above)?
+ let new_element = create_element(
+ &mut self.sink, QualName::new(None, ns!(html), fmt_elem_tag.name.clone()),
+ fmt_elem_tag.attrs.clone());
+ let new_entry = Element(new_element.clone(), fmt_elem_tag);
+
+ // 16.
+ self.sink.reparent_children(&furthest_block, &new_element);
+
+ // 17.
+ self.sink.append(&furthest_block, AppendNode(new_element.clone()));
+
+ // 18.
+ // FIXME: We could probably get rid of the position_in_active_formatting() calls here
+ // if we had a more clever Bookmark representation.
+ match bookmark {
+ Bookmark::Replace(to_replace) => {
+ let index = self.position_in_active_formatting(&to_replace)
+ .expect("bookmark not found in active formatting elements");
+ self.active_formatting[index] = new_entry;
+ }
+ Bookmark::InsertAfter(previous) => {
+ let index = self.position_in_active_formatting(&previous)
+ .expect("bookmark not found in active formatting elements") + 1;
+ self.active_formatting.insert(index, new_entry);
+ let old_index = self.position_in_active_formatting(&fmt_elem)
+ .expect("formatting element not found in active formatting elements");
+ self.active_formatting.remove(old_index);
+ }
+ }
+
+ // 19.
+ self.remove_from_stack(&fmt_elem);
+ let new_furthest_block_index = self.open_elems.iter()
+ .position(|n| self.sink.same_node(n, &furthest_block))
+ .expect("furthest block missing from open element stack");
+ self.open_elems.insert(new_furthest_block_index + 1, new_element);
+
+ // 20.
+ }
+ }
+
+ fn push(&mut self, elem: &Handle) {
+ self.open_elems.push(elem.clone());
+ }
+
+ fn pop(&mut self) -> Handle {
+ let elem = self.open_elems.pop().expect("no current element");
+ self.sink.pop(&elem);
+ elem
+ }
+
+ fn remove_from_stack(&mut self, elem: &Handle) {
+ let sink = &mut self.sink;
+ let position = self.open_elems
+ .iter()
+ .rposition(|x| sink.same_node(elem, &x));
+ if let Some(position) = position {
+ self.open_elems.remove(position);
+ sink.pop(elem);
+ }
+ }
+
+ fn is_marker_or_open(&self, entry: &FormatEntry<Handle>) -> bool {
+ match *entry {
+ Marker => true,
+ Element(ref node, _) => {
+ self.open_elems.iter()
+ .rev()
+ .any(|n| self.sink.same_node(&n, &node))
+ }
+ }
+ }
+
+ /// Reconstruct the active formatting elements.
+ fn reconstruct_formatting(&mut self) {
+ {
+ let last = unwrap_or_return!(self.active_formatting.last(), ());
+ if self.is_marker_or_open(last) {
+ return
+ }
+ }
+
+ let mut entry_index = self.active_formatting.len() - 1;
+ loop {
+ if entry_index == 0 {
+ break
+ }
+ entry_index -= 1;
+ if self.is_marker_or_open(&self.active_formatting[entry_index]) {
+ entry_index += 1;
+ break
+ }
+ }
+
+ loop {
+ let tag = match self.active_formatting[entry_index] {
+ Element(_, ref t) => t.clone(),
+ Marker => panic!("Found marker during formatting element reconstruction"),
+ };
+
+ // FIXME: Is there a way to avoid cloning the attributes twice here (once on their own,
+ // once as part of t.clone() above)?
+ let new_element = self.insert_element(Push, ns!(html), tag.name.clone(),
+ tag.attrs.clone());
+ self.active_formatting[entry_index] = Element(new_element, tag);
+ if entry_index == self.active_formatting.len() - 1 {
+ break
+ }
+ entry_index += 1;
+ }
+ }
+
+ /// Get the first element on the stack, which will be the <html> element.
+ fn html_elem(&self) -> &Handle {
+ &self.open_elems[0]
+ }
+
+    /// Return the second entry of the stack of open elements when it exists
+    /// and is an HTML `body` element; otherwise return `None`.
+    fn body_elem(&self) -> Option<&Handle> {
+        match self.open_elems.get(1) {
+            Some(node) if self.html_elem_named(node, local_name!("body")) => Some(node),
+            _ => None,
+        }
+    }
+
+ /// Signal an error depending on the state of the stack of open elements at
+ /// the end of the body.
+ ///
+ /// Walks the stack from the bottom up and reports a single parse error for
+ /// the first element whose name is not in the `body_end_ok` tag set; nothing
+ /// is reported when every open element is in that set.
+ fn check_body_end(&mut self) {
+ declare_tag_set!(body_end_ok =
+ "dd" "dt" "li" "optgroup" "option" "p" "rp" "rt" "tbody" "td" "tfoot" "th"
+ "thead" "tr" "body" "html");
+
+ for elem in self.open_elems.iter() {
+ let error;
+ // The inner block ends the borrow of `self.sink` held by `name` before
+ // `parse_error` needs the sink mutably.
+ {
+ let name = self.sink.elem_name(elem);
+ if body_end_ok(name) {
+ continue
+ }
+ error = format_if!(self.opts.exact_errors,
+ "Unexpected open tag at end of body",
+ "Unexpected open tag {:?} at end of body", name);
+ }
+ self.sink.parse_error(error);
+ // FIXME: Do we keep checking after finding one bad tag?
+ // The spec suggests not.
+ return;
+ }
+ }
+
+    /// Walk the stack of open elements from the top down and report whether
+    /// an element satisfying `pred` is reached before an element whose name is
+    /// in the `scope` tag set.
+    ///
+    /// Returns `true` as soon as `pred` accepts a node, `false` as soon as a
+    /// scope-delimiting node is seen, and `false` if the stack is exhausted.
+    fn in_scope<TagSet, Pred>(&self, scope: TagSet, pred: Pred) -> bool
+        where TagSet: Fn(ExpandedName) -> bool, Pred: Fn(Handle) -> bool
+    {
+        for node in self.open_elems.iter().rev() {
+            // `pred` is checked first, so a node that both matches and
+            // delimits the scope counts as a match.
+            if pred(node.clone()) {
+                return true;
+            }
+            if scope(self.sink.elem_name(node)) {
+                return false;
+            }
+        }
+
+        // supposed to be impossible, because <html> is always in scope
+
+        false
+    }
+
+    /// Return whether the expanded name of `elem`, as reported by the sink,
+    /// is accepted by the tag set `set`.
+    fn elem_in<TagSet>(&self, elem: &Handle, set: TagSet) -> bool
+        where TagSet: Fn(ExpandedName) -> bool
+    {
+        set(self.sink.elem_name(elem))
+    }
+
+    /// Return whether `elem` is in the HTML namespace and has local name
+    /// `name`.
+    fn html_elem_named(&self, elem: &Handle, name: LocalName) -> bool {
+        let ExpandedName { ns, local } = self.sink.elem_name(elem);
+        *ns == ns!(html) && *local == name
+    }
+
+    /// Return whether any element on the stack of open elements is an HTML
+    /// element called `name`.
+    fn in_html_elem_named(&self, name: LocalName) -> bool {
+        for elem in self.open_elems.iter() {
+            if self.html_elem_named(elem, name.clone()) {
+                return true;
+            }
+        }
+        false
+    }
+
+    /// Return whether the current node is an HTML element called `name`.
+    fn current_node_named(&self, name: LocalName) -> bool {
+        let current = self.current_node();
+        self.html_elem_named(current, name)
+    }
+
+    /// Return whether an HTML element called `name` is in the scope delimited
+    /// by the tag set `scope` (see `in_scope`).
+    fn in_scope_named<TagSet>(&self, scope: TagSet, name: LocalName) -> bool
+        where TagSet: Fn(ExpandedName) -> bool
+    {
+        self.in_scope(scope, |elem| self.html_elem_named(&elem, name.clone()))
+    }
+
+ //§ closing-elements-that-have-implied-end-tags
+    /// Pop elements off the stack of open elements for as long as the top
+    /// element's name is accepted by `set`. Stops when the top element is not
+    /// in the set or the stack becomes empty.
+    fn generate_implied_end<TagSet>(&mut self, set: TagSet)
+        where TagSet: Fn(ExpandedName) -> bool
+    {
+        loop {
+            // Scoped so the borrows of the stack and the sink end before
+            // `self.pop()` needs `self` mutably.
+            {
+                let elem = unwrap_or_return!(self.open_elems.last(), ());
+                let nsname = self.sink.elem_name(elem);
+                if !set(nsname) { return; }
+            }
+            self.pop();
+        }
+    }
+
+    /// Like `generate_implied_end(cursory_implied_end)`, except that an HTML
+    /// element called `except` is never popped.
+    fn generate_implied_end_except(&mut self, except: LocalName) {
+        self.generate_implied_end(|p| {
+            let is_excepted = *p.ns == ns!(html) && *p.local == except;
+            !is_excepted && cursory_implied_end(p)
+        });
+    }
+ //§ END
+
+    /// Pop elements until the current element is in the set.
+    ///
+    /// Entries are removed from `open_elems` directly, so the sink is not
+    /// notified through `sink.pop` for them.
+    fn pop_until_current<TagSet>(&mut self, pred: TagSet)
+        where TagSet: Fn(ExpandedName) -> bool
+    {
+        while !self.current_node_in(|x| pred(x)) {
+            self.open_elems.pop();
+        }
+    }
+
+    /// Pop elements until an element from the set has been popped. Returns
+    /// the number of pop attempts made.
+    ///
+    /// The counter is incremented before each pop, so if the stack runs out
+    /// without a match the returned value also counts the final, empty pop.
+    /// Entries are removed from `open_elems` directly, without `sink.pop`.
+    fn pop_until<P>(&mut self, pred: P) -> usize
+        where P: Fn(ExpandedName) -> bool
+    {
+        let mut n = 0;
+        loop {
+            n += 1;
+            match self.open_elems.pop() {
+                None => break,
+                Some(elem) => if pred(self.sink.elem_name(&elem)) { break; },
+            }
+        }
+        n
+    }
+
+    /// Pop elements until an HTML element called `name` has been popped;
+    /// returns the count reported by `pop_until`.
+    fn pop_until_named(&mut self, name: LocalName) -> usize {
+        self.pop_until(|p| {
+            let in_html_ns = *p.ns == ns!(html);
+            in_html_ns && *p.local == name
+        })
+    }
+
+    /// Pop elements until one with the given name has been popped, and report
+    /// a parse error unless exactly one element had to be popped.
+    fn expect_to_close(&mut self, name: LocalName) {
+        let popped = self.pop_until_named(name.clone());
+        if popped == 1 {
+            return;
+        }
+        self.sink.parse_error(format_if!(self.opts.exact_errors,
+            "Unexpected open element",
+            "Unexpected open element while closing {:?}", name));
+    }
+
+    /// Close a `p` element: generate implied end tags for everything in
+    /// `cursory_implied_end` except `p`, then pop up to and including the `p`.
+    fn close_p_element(&mut self) {
+        declare_tag_set!(implied = [cursory_implied_end] - "p");
+        self.generate_implied_end(implied);
+        let p = local_name!("p");
+        self.expect_to_close(p);
+    }
+
+    /// Close a `p` element, but only when one is in button scope.
+    fn close_p_element_in_button_scope(&mut self) {
+        if !self.in_scope_named(button_scope, local_name!("p")) {
+            return;
+        }
+        self.close_p_element();
+    }
+
+    /// Return whether `tag` carries a `type` attribute (no namespace) whose
+    /// value equals "hidden", compared ASCII case-insensitively.
+    fn is_type_hidden(&self, tag: &Tag) -> bool {
+        tag.attrs
+            .iter()
+            .find(|&at| at.name.expanded() == expanded_name!("", "type"))
+            .map_or(false, |at| (&*at.value).eq_ignore_ascii_case("hidden"))
+    }
+
+    /// Process `token` with the `InBody` rules while the `foster_parenting`
+    /// flag is set, then clear the flag and return the step's result.
+    fn foster_parent_in_body(&mut self, token: Token) -> ProcessResult {
+        warn!("foster parenting not implemented");
+        self.foster_parenting = true;
+        let outcome = self.step(InBody, token);
+        // FIXME: what if res is Reprocess?
+        self.foster_parenting = false;
+        outcome
+    }
+
+    /// Handle a character token seen while in a table.
+    ///
+    /// When the current node is one of `table`, `tbody`, `tfoot`, `thead` or
+    /// `tr`, remember the current mode in `orig_mode` and reprocess the token
+    /// in `InTableText`. Otherwise report a parse error and process the token
+    /// through `foster_parent_in_body`.
+    fn process_chars_in_table(&mut self, token: Token) -> ProcessResult {
+        declare_tag_set!(table_outer = "table" "tbody" "tfoot" "thead" "tr");
+        if !self.current_node_in(table_outer) {
+            self.sink.parse_error(format_if!(self.opts.exact_errors,
+                "Unexpected characters in table",
+                "Unexpected characters {} in table", to_escaped_string(&token)));
+            return self.foster_parent_in_body(token);
+        }
+        assert!(self.pending_table_text.is_empty());
+        self.orig_mode = Some(self.mode);
+        Reprocess(InTableText, token)
+    }
+
+ // https://html.spec.whatwg.org/multipage/syntax.html#reset-the-insertion-mode-appropriately
+ //
+ // Walks the stack of open elements from the top down and returns the
+ // insertion mode selected by the first HTML element that determines one.
+ // Falls back to `InBody` when no element does.
+ fn reset_insertion_mode(&mut self) -> InsertionMode {
+ for (i, mut node) in self.open_elems.iter().enumerate().rev() {
+ // `last` is true for the bottom-most stack entry (index 0); in that
+ // case the context element, when one is set, is examined instead.
+ let last = i == 0usize;
+ if let (true, Some(ctx)) = (last, self.context_elem.as_ref()) {
+ node = ctx;
+ }
+ // Elements outside the HTML namespace never select a mode.
+ let name = match self.sink.elem_name(node) {
+ ExpandedName { ns: &ns!(html), local } => local,
+ _ => continue,
+ };
+ match *name {
+ local_name!("select") => {
+ // Look at the entries below this one, nearest first: a `template`
+ // yields InSelect, a `table` yields InSelectInTable.
+ for ancestor in self.open_elems[0..i].iter().rev() {
+ if self.html_elem_named(ancestor, local_name!("template")) {
+ return InSelect;
+ } else if self.html_elem_named(ancestor, local_name!("table")) {
+ return InSelectInTable;
+ }
+ }
+ return InSelect;
+ },
+ // `td`/`th` and `head` only select a mode when they are not the
+ // bottom-most entry; otherwise the walk continues.
+ local_name!("td") | local_name!("th") => if !last { return InCell; },
+ local_name!("tr") => return InRow,
+ local_name!("tbody") | local_name!("thead") | local_name!("tfoot") => return InTableBody,
+ local_name!("caption") => return InCaption,
+ local_name!("colgroup") => return InColumnGroup,
+ local_name!("table") => return InTable,
+ // Panics (via `unwrap`) if `template_modes` is empty here.
+ local_name!("template") => return *self.template_modes.last().unwrap(),
+ local_name!("head") => if !last { return InHead },
+ local_name!("body") => return InBody,
+ local_name!("frameset") => return InFrameset,
+ local_name!("html") => match self.head_elem {
+ None => return BeforeHead,
+ Some(_) => return AfterHead,
+ },
+
+ _ => (),
+ }
+ }
+ InBody
+ }
+
+    /// Close the current table cell: generate implied end tags, pop up to and
+    /// including the nearest `td`/`th` (reporting a parse error if more than
+    /// one element had to be popped), then clear the list of active
+    /// formatting elements back to the last marker.
+    fn close_the_cell(&mut self) {
+        self.generate_implied_end(cursory_implied_end);
+        if self.pop_until(td_th) != 1 {
+            self.sink.parse_error(Borrowed("expected to close <td> or <th> with cell"));
+        }
+        self.clear_active_formatting_to_marker();
+    }
+
+    /// Insert `text` at the appropriate place for inserting a node and
+    /// report `Done`.
+    fn append_text(&mut self, text: StrTendril) -> ProcessResult {
+        let child = AppendText(text);
+        self.insert_appropriately(child, None);
+        Done
+    }
+
+    /// Create a comment node from `text`, insert it at the appropriate place
+    /// for inserting a node, and report `Done`.
+    fn append_comment(&mut self, text: StrTendril) -> ProcessResult {
+        let node = self.sink.create_comment(text);
+        let child = AppendNode(node);
+        self.insert_appropriately(child, None);
+        Done
+    }
+
+    /// Create a comment node from `text`, append it to the document node
+    /// (`doc_handle`), and report `Done`.
+    fn append_comment_to_doc(&mut self, text: StrTendril) -> ProcessResult {
+        let node = self.sink.create_comment(text);
+        let child = AppendNode(node);
+        self.sink.append(&self.doc_handle, child);
+        Done
+    }
+
+    /// Create a comment node from `text`, append it to the element returned
+    /// by `html_elem` for the stack of open elements, and report `Done`.
+    fn append_comment_to_html(&mut self, text: StrTendril) -> ProcessResult {
+        // Resolve the parent first, as the original does, so a failure to
+        // find it happens before any node is created.
+        let parent = html_elem(&self.open_elems);
+        let node = self.sink.create_comment(text);
+        let child = AppendNode(node);
+        self.sink.append(parent, child);
+        Done
+    }
+
+ //§ creating-and-inserting-nodes
+    /// Create the root `html` element with the given attributes, push it onto
+    /// the stack of open elements, and append it to the document node.
+    fn create_root(&mut self, attrs: Vec<Attribute>) {
+        let elem = create_element(
+            &mut self.sink, QualName::new(None, ns!(html), local_name!("html")),
+            attrs);
+        self.push(&elem);
+        self.sink.append(&self.doc_handle, AppendNode(elem));
+        // FIXME: application cache selection algorithm
+    }
+
+    // https://html.spec.whatwg.org/multipage/#create-an-element-for-the-token
+    /// Create an element `name` in namespace `ns` with attributes `attrs`,
+    /// insert it at the appropriate place for inserting a node, and return
+    /// its handle.
+    ///
+    /// With `push == Push` the new element is also pushed onto the stack of
+    /// open elements; with `NoPush` the stack is left untouched. Where the
+    /// form-association conditions below hold, the element is associated with
+    /// the current form element through the sink.
+    fn insert_element(&mut self, push: PushFlag, ns: Namespace, name: LocalName, attrs: Vec<Attribute>)
+            -> Handle {
+        declare_tag_set!(form_associatable =
+            "button" "fieldset" "input" "object"
+            "output" "select" "textarea" "img");
+
+        declare_tag_set!(listed = [form_associatable] - "img");
+
+        // Step 7.
+        let qname = QualName::new(None, ns, name);
+        let elem = create_element(&mut self.sink, qname.clone(), attrs.clone());
+
+        // The node the new element will be attached to (or placed before);
+        // used below for the same-tree check against the form element.
+        let insertion_point = self.appropriate_place_for_insertion(None);
+        let tree_node = match insertion_point {
+            LastChild(ref p) |
+            BeforeSibling(ref p) => p.clone()
+        };
+
+        // Step 12.
+        // Associate only when: the element is form-associatable, a form
+        // element is set, no `template` is open, and it is not a listed
+        // element carrying its own `form` attribute.
+        if form_associatable(qname.expanded()) &&
+            self.form_elem.is_some() &&
+            !self.in_html_elem_named(local_name!("template")) &&
+            !(listed(qname.expanded()) &&
+                attrs.iter().any(|a| a.name.expanded() == expanded_name!("", "form"))) {
+
+            let form = self.form_elem.as_ref().unwrap().clone();
+            if self.sink.same_tree(&tree_node, &form) {
+                self.sink.associate_with_form(&elem, &form)
+            }
+        }
+
+        self.insert_at(insertion_point, AppendNode(elem.clone()));
+
+        match push {
+            Push => self.push(&elem),
+            NoPush => (),
+        }
+        // FIXME: Remove from the stack if we can't append?
+        elem
+    }
+
+    /// Insert an HTML element built from `tag` and push it onto the stack of
+    /// open elements.
+    fn insert_element_for(&mut self, tag: Tag) -> Handle {
+        let Tag { name, attrs, .. } = tag;
+        self.insert_element(Push, ns!(html), name, attrs)
+    }
+
+    /// Insert an HTML element built from `tag` without pushing it onto the
+    /// stack of open elements.
+    fn insert_and_pop_element_for(&mut self, tag: Tag) -> Handle {
+        let Tag { name, attrs, .. } = tag;
+        self.insert_element(NoPush, ns!(html), name, attrs)
+    }
+
+    /// Insert an attribute-less HTML element called `name` and push it onto
+    /// the stack of open elements.
+    fn insert_phantom(&mut self, name: LocalName) -> Handle {
+        let no_attrs = vec!();
+        self.insert_element(Push, ns!(html), name, no_attrs)
+    }
+ //§ END
+
+ /// Insert an HTML element for `tag`, push it onto the stack of open
+ /// elements, and append it to the list of active formatting elements.
+ ///
+ /// Before inserting, the entries yielded by
+ /// `active_formatting_end_to_marker()` are scanned for tags equivalent to
+ /// `tag` (ignoring attribute order); when three or more are found, one of
+ /// them is removed from the list first.
+ fn create_formatting_element_for(&mut self, tag: Tag) -> Handle {
+ // FIXME: This really wants unit tests.
+ // NOTE: despite its name, `first_match` is overwritten on every match, so
+ // it ends up holding the index of the match visited last by the iterator.
+ let mut first_match = None;
+ let mut matches = 0usize;
+ for (i, _, old_tag) in self.active_formatting_end_to_marker() {
+ if tag.equiv_modulo_attr_order(old_tag) {
+ first_match = Some(i);
+ matches += 1;
+ }
+ }
+
+ if matches >= 3 {
+ self.active_formatting.remove(first_match.expect("matches with no index"));
+ }
+
+ let elem = self.insert_element(Push, ns!(html), tag.name.clone(), tag.attrs.clone());
+ self.active_formatting.push(Element(elem.clone(), tag));
+ elem
+ }
+
+    /// Pop entries off the list of active formatting elements until a marker
+    /// has been popped or the list is empty.
+    fn clear_active_formatting_to_marker(&mut self) {
+        while let Some(entry) = self.active_formatting.pop() {
+            if let Marker = entry {
+                break;
+            }
+        }
+    }
+
+ /// Handle an end tag in the body that has no dedicated rule.
+ ///
+ /// Searches the stack of open elements from the top for an HTML element
+ /// with the tag's name. Meeting an element in `special_tag` first is a
+ /// parse error and the tag is ignored. On a match, implied end tags are
+ /// generated (except for the tag's own name), a parse error is reported if
+ /// the match is then not the current node, and the stack is truncated so
+ /// the matching element and everything above it are removed.
+ fn process_end_tag_in_body(&mut self, tag: Tag) {
+ // Look back for a matching open element.
+ let mut match_idx = None;
+ for (i, elem) in self.open_elems.iter().enumerate().rev() {
+ if self.html_elem_named(elem, tag.name.clone()) {
+ match_idx = Some(i);
+ break;
+ }
+
+ if self.elem_in(elem, special_tag) {
+ self.sink.parse_error(Borrowed("Found special tag while closing generic tag"));
+ return;
+ }
+ }
+
+ // Can't use unwrap_or_return!() due to rust-lang/rust#16617.
+ let match_idx = match match_idx {
+ None => {
+ // I believe this is impossible, because the root
+ // element is in special_tag.
+ self.unexpected(&tag);
+ return;
+ }
+ Some(x) => x,
+ };
+
+ self.generate_implied_end_except(tag.name.clone());
+
+ if match_idx != self.open_elems.len() - 1 {
+ // mis-nested tags
+ self.unexpected(&tag);
+ }
+ // Drops the matched element and everything above it. This bypasses
+ // `self.pop()`, so `sink.pop` is not called for these entries.
+ self.open_elems.truncate(match_idx);
+ }
+
+    /// Deal with an `a` start tag seen while another `a` element is still in
+    /// the list of active formatting elements (after the last marker).
+    ///
+    /// Does nothing when there is no such element. Otherwise reports `tag` as
+    /// unexpected, runs the adoption agency algorithm for `a`, and then
+    /// removes the old element from the active formatting list and from the
+    /// stack of open elements if it is still present in either.
+    fn handle_misnested_a_tags(&mut self, tag: &Tag) {
+        let node = unwrap_or_return!(
+            self.active_formatting_end_to_marker()
+                .find(|&(_, n, _)| self.html_elem_named(n, local_name!("a")))
+                .map(|(_, n, _)| n.clone()),
+
+            ()
+        );
+
+        self.unexpected(tag);
+        self.adoption_agency(local_name!("a"));
+        if let Some(index) = self.position_in_active_formatting(&node) {
+            self.active_formatting.remove(index);
+        }
+        self.remove_from_stack(&node);
+    }
+
+ //§ tree-construction
+ /// Decide whether `token` is to be treated as foreign content.
+ ///
+ /// Returns `false` for an EOF token, when the stack of open elements is
+ /// empty, when the adjusted current node is in the HTML namespace, and for
+ /// the integration-point cases handled below; returns `true` otherwise.
+ fn is_foreign(&mut self, token: &Token) -> bool {
+ if let EOFToken = *token {
+ return false;
+ }
+
+ if self.open_elems.len() == 0 {
+ return false;
+ }
+
+ let name = self.sink.elem_name(self.adjusted_current_node());
+ if let ns!(html) = *name.ns {
+ return false;
+ }
+
+ // MathML text integration point: characters, and start tags other than
+ // `mglyph` / `malignmark`, are not foreign.
+ if mathml_text_integration_point(name) {
+ match *token {
+ CharacterTokens(..) | NullCharacterToken => return false,
+ TagToken(Tag { kind: StartTag, ref name, .. })
+ if !matches!(*name, local_name!("mglyph") | local_name!("malignmark")) => return false,
+ _ => (),
+ }
+ }
+
+ // SVG HTML integration point: characters and every start tag are not
+ // foreign.
+ if svg_html_integration_point(name) {
+ match *token {
+ CharacterTokens(..) | NullCharacterToken => return false,
+ TagToken(Tag { kind: StartTag, .. }) => return false,
+ _ => (),
+ }
+ }
+
+ // MathML `annotation-xml`: an `svg` start tag is never foreign; for
+ // characters and other start tags the answer is the negation of the
+ // sink's integration-point check for the adjusted current node.
+ if let expanded_name!(mathml "annotation-xml") = name {
+ match *token {
+ TagToken(Tag { kind: StartTag, name: local_name!("svg"), .. }) => return false,
+ CharacterTokens(..) | NullCharacterToken |
+ TagToken(Tag { kind: StartTag, .. }) => {
+ return !self.sink.is_mathml_annotation_xml_integration_point(
+ self.adjusted_current_node())
+ }
+ _ => {}
+ };
+ }
+
+ true
+ }
+ //§ END
+
+    /// Insert an element for `tag` in the foreign namespace `ns`.
+    ///
+    /// MathML or SVG attribute adjustments are applied according to `ns`,
+    /// followed by the foreign-attribute adjustments. A self-closing tag is
+    /// inserted without being pushed and yields `DoneAckSelfClosing`; any
+    /// other tag is pushed onto the stack of open elements and yields `Done`.
+    fn enter_foreign(&mut self, mut tag: Tag, ns: Namespace) -> ProcessResult {
+        match ns {
+            ns!(mathml) => self.adjust_mathml_attributes(&mut tag),
+            ns!(svg) => self.adjust_svg_attributes(&mut tag),
+            _ => (),
+        }
+        self.adjust_foreign_attributes(&mut tag);
+
+        let self_closing = tag.self_closing;
+        let push_flag = if self_closing { NoPush } else { Push };
+        self.insert_element(push_flag, ns, tag.name, tag.attrs);
+        if self_closing {
+            DoneAckSelfClosing
+        } else {
+            Done
+        }
+    }
+
+ /// Replace an all-lowercase SVG tag name with its mixed-case spelling.
+ ///
+ /// Names without an entry in the table below are left untouched.
+ fn adjust_svg_tag_name(&mut self, tag: &mut Tag) {
+ let Tag { ref mut name, .. } = *tag;
+ match *name {
+ local_name!("altglyph") => *name = local_name!("altGlyph"),
+ local_name!("altglyphdef") => *name = local_name!("altGlyphDef"),
+ local_name!("altglyphitem") => *name = local_name!("altGlyphItem"),
+ local_name!("animatecolor") => *name = local_name!("animateColor"),
+ local_name!("animatemotion") => *name = local_name!("animateMotion"),
+ local_name!("animatetransform") => *name = local_name!("animateTransform"),
+ local_name!("clippath") => *name = local_name!("clipPath"),
+ local_name!("feblend") => *name = local_name!("feBlend"),
+ local_name!("fecolormatrix") => *name = local_name!("feColorMatrix"),
+ local_name!("fecomponenttransfer") => *name = local_name!("feComponentTransfer"),
+ local_name!("fecomposite") => *name = local_name!("feComposite"),
+ local_name!("feconvolvematrix") => *name = local_name!("feConvolveMatrix"),
+ local_name!("fediffuselighting") => *name = local_name!("feDiffuseLighting"),
+ local_name!("fedisplacementmap") => *name = local_name!("feDisplacementMap"),
+ local_name!("fedistantlight") => *name = local_name!("feDistantLight"),
+ local_name!("fedropshadow") => *name = local_name!("feDropShadow"),
+ local_name!("feflood") => *name = local_name!("feFlood"),
+ local_name!("fefunca") => *name = local_name!("feFuncA"),
+ local_name!("fefuncb") => *name = local_name!("feFuncB"),
+ local_name!("fefuncg") => *name = local_name!("feFuncG"),
+ local_name!("fefuncr") => *name = local_name!("feFuncR"),
+ local_name!("fegaussianblur") => *name = local_name!("feGaussianBlur"),
+ local_name!("feimage") => *name = local_name!("feImage"),
+ local_name!("femerge") => *name = local_name!("feMerge"),
+ local_name!("femergenode") => *name = local_name!("feMergeNode"),
+ local_name!("femorphology") => *name = local_name!("feMorphology"),
+ local_name!("feoffset") => *name = local_name!("feOffset"),
+ local_name!("fepointlight") => *name = local_name!("fePointLight"),
+ local_name!("fespecularlighting") => *name = local_name!("feSpecularLighting"),
+ local_name!("fespotlight") => *name = local_name!("feSpotLight"),
+ local_name!("fetile") => *name = local_name!("feTile"),
+ local_name!("feturbulence") => *name = local_name!("feTurbulence"),
+ local_name!("foreignobject") => *name = local_name!("foreignObject"),
+ local_name!("glyphref") => *name = local_name!("glyphRef"),
+ local_name!("lineargradient") => *name = local_name!("linearGradient"),
+ local_name!("radialgradient") => *name = local_name!("radialGradient"),
+ local_name!("textpath") => *name = local_name!("textPath"),
+ _ => (),
+ }
+ }
+
+    /// Rewrite the attribute names of `tag` in place.
+    ///
+    /// `map` is called with each attribute's local name; when it returns
+    /// `Some(replacement)` the attribute's whole qualified name is replaced,
+    /// and when it returns `None` the attribute is left as it is.
+    fn adjust_attributes<F>(&mut self, tag: &mut Tag, mut map: F)
+        where F: FnMut(LocalName) -> Option<QualName>,
+    {
+        for &mut Attribute { ref mut name, .. } in &mut tag.attrs {
+            if let Some(replacement) = map(name.local.clone()) {
+                *name = replacement;
+            }
+        }
+    }
+
+ /// Replace all-lowercase SVG attribute names on `tag` with their
+ /// mixed-case spellings (in no namespace), via `adjust_attributes`.
+ ///
+ /// Attributes without an entry in the table below are left untouched.
+ fn adjust_svg_attributes(&mut self, tag: &mut Tag) {
+ self.adjust_attributes(tag, |k| match k {
+ local_name!("attributename") => Some(qualname!("", "attributeName")),
+ local_name!("attributetype") => Some(qualname!("", "attributeType")),
+ local_name!("basefrequency") => Some(qualname!("", "baseFrequency")),
+ local_name!("baseprofile") => Some(qualname!("", "baseProfile")),
+ local_name!("calcmode") => Some(qualname!("", "calcMode")),
+ local_name!("clippathunits") => Some(qualname!("", "clipPathUnits")),
+ local_name!("diffuseconstant") => Some(qualname!("", "diffuseConstant")),
+ local_name!("edgemode") => Some(qualname!("", "edgeMode")),
+ local_name!("filterunits") => Some(qualname!("", "filterUnits")),
+ local_name!("glyphref") => Some(qualname!("", "glyphRef")),
+ local_name!("gradienttransform") => Some(qualname!("", "gradientTransform")),
+ local_name!("gradientunits") => Some(qualname!("", "gradientUnits")),
+ local_name!("kernelmatrix") => Some(qualname!("", "kernelMatrix")),
+ local_name!("kernelunitlength") => Some(qualname!("", "kernelUnitLength")),
+ local_name!("keypoints") => Some(qualname!("", "keyPoints")),
+ local_name!("keysplines") => Some(qualname!("", "keySplines")),
+ local_name!("keytimes") => Some(qualname!("", "keyTimes")),
+ local_name!("lengthadjust") => Some(qualname!("", "lengthAdjust")),
+ local_name!("limitingconeangle") => Some(qualname!("", "limitingConeAngle")),
+ local_name!("markerheight") => Some(qualname!("", "markerHeight")),
+ local_name!("markerunits") => Some(qualname!("", "markerUnits")),
+ local_name!("markerwidth") => Some(qualname!("", "markerWidth")),
+ local_name!("maskcontentunits") => Some(qualname!("", "maskContentUnits")),
+ local_name!("maskunits") => Some(qualname!("", "maskUnits")),
+ local_name!("numoctaves") => Some(qualname!("", "numOctaves")),
+ local_name!("pathlength") => Some(qualname!("", "pathLength")),
+ local_name!("patterncontentunits") => Some(qualname!("", "patternContentUnits")),
+ local_name!("patterntransform") => Some(qualname!("", "patternTransform")),
+ local_name!("patternunits") => Some(qualname!("", "patternUnits")),
+ local_name!("pointsatx") => Some(qualname!("", "pointsAtX")),
+ local_name!("pointsaty") => Some(qualname!("", "pointsAtY")),
+ local_name!("pointsatz") => Some(qualname!("", "pointsAtZ")),
+ local_name!("preservealpha") => Some(qualname!("", "preserveAlpha")),
+ local_name!("preserveaspectratio") => Some(qualname!("", "preserveAspectRatio")),
+ local_name!("primitiveunits") => Some(qualname!("", "primitiveUnits")),
+ local_name!("refx") => Some(qualname!("", "refX")),
+ local_name!("refy") => Some(qualname!("", "refY")),
+ local_name!("repeatcount") => Some(qualname!("", "repeatCount")),
+ local_name!("repeatdur") => Some(qualname!("", "repeatDur")),
+ local_name!("requiredextensions") => Some(qualname!("", "requiredExtensions")),
+ local_name!("requiredfeatures") => Some(qualname!("", "requiredFeatures")),
+ local_name!("specularconstant") => Some(qualname!("", "specularConstant")),
+ local_name!("specularexponent") => Some(qualname!("", "specularExponent")),
+ local_name!("spreadmethod") => Some(qualname!("", "spreadMethod")),
+ local_name!("startoffset") => Some(qualname!("", "startOffset")),
+ local_name!("stddeviation") => Some(qualname!("", "stdDeviation")),
+ local_name!("stitchtiles") => Some(qualname!("", "stitchTiles")),
+ local_name!("surfacescale") => Some(qualname!("", "surfaceScale")),
+ local_name!("systemlanguage") => Some(qualname!("", "systemLanguage")),
+ local_name!("tablevalues") => Some(qualname!("", "tableValues")),
+ local_name!("targetx") => Some(qualname!("", "targetX")),
+ local_name!("targety") => Some(qualname!("", "targetY")),
+ local_name!("textlength") => Some(qualname!("", "textLength")),
+ local_name!("viewbox") => Some(qualname!("", "viewBox")),
+ local_name!("viewtarget") => Some(qualname!("", "viewTarget")),
+ local_name!("xchannelselector") => Some(qualname!("", "xChannelSelector")),
+ local_name!("ychannelselector") => Some(qualname!("", "yChannelSelector")),
+ local_name!("zoomandpan") => Some(qualname!("", "zoomAndPan")),
+ _ => None,
+ });
+ }
+
+    /// Rename a `definitionurl` attribute on `tag` to `definitionURL` (in no
+    /// namespace); every other attribute is left untouched.
+    fn adjust_mathml_attributes(&mut self, tag: &mut Tag) {
+        self.adjust_attributes(tag, |k| {
+            if let local_name!("definitionurl") = k {
+                Some(qualname!("", "definitionURL"))
+            } else {
+                None
+            }
+        });
+    }
+
+ /// Give the `xlink:*`, `xml:*` and `xmlns*` attributes on `tag` their
+ /// prefixed, namespaced qualified names, via `adjust_attributes`.
+ ///
+ /// Attributes without an entry in the table below are left untouched.
+ fn adjust_foreign_attributes(&mut self, tag: &mut Tag) {
+ self.adjust_attributes(tag, |k| match k {
+ local_name!("xlink:actuate") => Some(qualname!("xlink" xlink "actuate")),
+ local_name!("xlink:arcrole") => Some(qualname!("xlink" xlink "arcrole")),
+ local_name!("xlink:href") => Some(qualname!("xlink" xlink "href")),
+ local_name!("xlink:role") => Some(qualname!("xlink" xlink "role")),
+ local_name!("xlink:show") => Some(qualname!("xlink" xlink "show")),
+ local_name!("xlink:title") => Some(qualname!("xlink" xlink "title")),
+ local_name!("xlink:type") => Some(qualname!("xlink" xlink "type")),
+ local_name!("xml:base") => Some(qualname!("xml" xml "base")),
+ local_name!("xml:lang") => Some(qualname!("xml" xml "lang")),
+ local_name!("xml:space") => Some(qualname!("xml" xml "space")),
+ local_name!("xmlns") => Some(qualname!("" xmlns "xmlns")),
+ local_name!("xmlns:xlink") => Some(qualname!("xmlns" xmlns "xlink")),
+ _ => None,
+ });
+ }
+
+ /// Insert an element for a start tag seen in foreign content.
+ ///
+ /// The element is created in the namespace of the adjusted current node.
+ /// MathML attribute adjustments, or SVG tag-name and attribute adjustments,
+ /// are applied according to that namespace, followed by the
+ /// foreign-attribute adjustments. A self-closing tag is inserted without
+ /// being pushed and yields `DoneAckSelfClosing`; any other tag is pushed
+ /// onto the stack of open elements and yields `Done`.
+ fn foreign_start_tag(&mut self, mut tag: Tag) -> ProcessResult {
+ let current_ns = self.sink.elem_name(self.adjusted_current_node()).ns.clone();
+ match current_ns {
+ ns!(mathml) => self.adjust_mathml_attributes(&mut tag),
+ ns!(svg) => {
+ self.adjust_svg_tag_name(&mut tag);
+ self.adjust_svg_attributes(&mut tag);
+ }
+ _ => (),
+ }
+ self.adjust_foreign_attributes(&mut tag);
+ if tag.self_closing {
+ // FIXME(#118): <script /> in SVG
+ self.insert_element(NoPush, current_ns, tag.name, tag.attrs);
+ DoneAckSelfClosing
+ } else {
+ self.insert_element(Push, current_ns, tag.name, tag.attrs);
+ Done
+ }
+ }
+
+    /// Handle a start tag that is not allowed in foreign content.
+    ///
+    /// The tag is always reported as unexpected. When `is_fragment()` is true
+    /// it is then processed as an ordinary foreign start tag. Otherwise
+    /// elements are popped (at least one) until the current node is an HTML
+    /// element, a MathML text integration point, or an SVG HTML integration
+    /// point, and the tag is handed back as `ReprocessForeign`.
+    fn unexpected_start_tag_in_foreign_content(&mut self, tag: Tag) -> ProcessResult {
+        self.unexpected(&tag);
+        if self.is_fragment() {
+            return self.foreign_start_tag(tag);
+        }
+
+        loop {
+            self.pop();
+            let at_boundary = self.current_node_in(|n| {
+                *n.ns == ns!(html) ||
+                mathml_text_integration_point(n) ||
+                svg_html_integration_point(n)
+            });
+            if at_boundary {
+                break;
+            }
+        }
+        ReprocessForeign(TagToken(tag))
+    }
+}
+
#[cfg(test)]
#[allow(non_snake_case)]
mod test {
@@ -494,8 +1555,6 @@ mod test {
use markup5ever::interface::{TreeSink, Tracer, ElementFlags};
use super::types::*;
- use super::actions::TreeBuilderActions;
- use super::rules::TreeBuilderStep;
use ExpandedName;
use QualName;
diff --git a/html5ever/src/tree_builder/rules.rs b/html5ever/src/tree_builder/rules.rs
index aedc8d50..5b5b8bc4 100644
--- a/html5ever/src/tree_builder/rules.rs
+++ b/html5ever/src/tree_builder/rules.rs
@@ -9,40 +9,25 @@
// The tree builder rules, as a single, enormous nested match expression.
-use {ExpandedName, QualName};
-use interface::{Attribute, TreeSink, Quirks, AppendNode, create_element};
use tree_builder::types::*;
use tree_builder::tag_sets::*;
-use tree_builder::actions::{NoPush, Push, TreeBuilderActions, html_elem};
-use tokenizer::{EndTag, StartTag, Tag};
use tokenizer::states::{Rcdata, Rawtext, ScriptData, Plaintext};
-use util::str::is_ascii_whitespace;
-use std::ascii::AsciiExt;
-use std::mem::replace;
-use std::borrow::Cow::Borrowed;
use std::borrow::ToOwned;
-use tendril::{StrTendril, SliceExt};
+use tendril::SliceExt;
fn any_not_whitespace(x: &StrTendril) -> bool {
// FIXME: this might be much faster as a byte scan
x.chars().any(|c| !is_ascii_whitespace(c))
}
-// This goes in a trait so that we can control visibility.
-pub trait TreeBuilderStep {
- fn step(&mut self, mode: InsertionMode, token: Token) -> ProcessResult;
- fn step_foreign(&mut self, token: Token) -> ProcessResult;
-}
-
fn current_node(open_elems: &[Handle]) -> &Handle {
open_elems.last().expect("no current element")
}
#[doc(hidden)]
-impl TreeBuilderStep
- for super::TreeBuilder
+impl TreeBuilder
where Handle: Clone,
Sink: TreeSink,
{
diff --git a/xml5ever/src/tree_builder/actions.rs b/xml5ever/src/tree_builder/actions.rs
deleted file mode 100644
index 695ec994..00000000
--- a/xml5ever/src/tree_builder/actions.rs
+++ /dev/null
@@ -1,246 +0,0 @@
-// Copyright 2014-2017 The html5ever Project Developers. See the
-// COPYRIGHT file at the top-level directory of this distribution.
-//
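-// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
-// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
-// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your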
-// option. This file may not be copied, modified, or distributed
-// except according to those terms.
-
-use std::borrow::Cow::Borrowed;
-
-use tendril::{StrTendril, Tendril};
-
-use interface::{NodeOrText, TreeSink, AppendNode, create_element};
-use interface::{AppendText, ExpandedName, NextParserState};
-use tokenizer::{Tag, Pi, Doctype};
-use tokenizer::states::Quiescent;
-use tree_builder::types::{XmlProcessResult, Done};
-
-
-/// Trait that encapsulates common XML tree actions.
-pub trait XmlTreeBuilderActions {
- /// Returns current node of in the XmlTreeBuilder.
- fn current_node(&self) -> &Handle;
-
- /// Inserts node or text to its appropriate place in the tree.
- fn insert_appropriately(&mut self, child: NodeOrText);
-
- /// Inserts tag into the tree and adds it to list of open elements.
- fn insert_tag(&mut self, tag: Tag) -> XmlProcessResult;
-
- /// Appends current tag to the root of the document.
- fn append_tag(&mut self, tag: Tag) -> XmlProcessResult;
-
- /// Appends tag to the root of the document.
- fn append_tag_to_doc(&mut self, tag: Tag) -> Handle;
-
- /// Adds element to list of open elements (this should only apply to Tag).
- fn add_to_open_elems(&mut self, el: Handle) -> XmlProcessResult;
-
- /// Appends comment to root of the document.
- fn append_comment_to_doc(&mut self, comment: StrTendril) -> XmlProcessResult;
-
- /// Appends comment to the current tag.
- fn append_comment_to_tag(&mut self, text: StrTendril) -> XmlProcessResult;
-
- /// Appends Doctype to root of the document.
- fn append_doctype_to_doc(&mut self, doctype: Doctype) -> XmlProcessResult;
-
- /// Appends Processing Instruction to the root of the document
- fn append_pi_to_doc(&mut self, pi: Pi) -> XmlProcessResult;
-
- /// Appends Processing Instruction to the current tag.
- fn append_pi_to_tag(&mut self, pi: Pi) -> XmlProcessResult;
-
- /// Appends text to appropriate element.
- fn append_text(&mut self, chars: StrTendril) -> XmlProcessResult;
-
- /// Checks if given tag is the list of open elements.
- fn tag_in_open_elems(&self, tag: &Tag) -> bool;
-
- /// Pops elements from list of open elements, until predicate
- /// `pred` returns true
- fn pop_until(&mut self, pred: TagSet) where TagSet: Fn(ExpandedName) -> bool;
-
- /// Checks if current node is in given TagSet
- fn current_node_in(&self, set: TagSet) -> bool where TagSet: Fn(ExpandedName) -> bool;
-
- /// Close given tag.
- fn close_tag(&mut self, tag: Tag) -> XmlProcessResult;
-
- /// Returns whether or not there are any elements in list of
- /// open elements.
- fn no_open_elems(&self) -> bool;
-
- /// Removes last element from list of open elements and returns its value.
- fn pop(&mut self) -> Handle ;
-
- /// Stops parsing of XML file.
- fn stop_parsing(&mut self) -> XmlProcessResult;
-
- /// Indicated a `script` element is complete and can be prepared
- fn complete_script(&mut self);
-}
-
-fn current_node(open_elems: &[Handle]) -> &Handle {
- open_elems.last().expect("no current element")
-}
-
-#[doc(hidden)]
-impl XmlTreeBuilderActions
- for super::XmlTreeBuilder
- where Handle: Clone,
- Sink: TreeSink,
-{
-
- fn current_node(&self) -> &Handle {
- self.open_elems.last().expect("no current element")
- }
-
- fn insert_appropriately(&mut self, child: NodeOrText){
- let target = current_node(&self.open_elems);
- self.sink.append(target, child);
- }
-
- fn insert_tag(&mut self, tag: Tag) -> XmlProcessResult {
- let child = create_element(&mut self.sink, tag.name, tag.attrs);
- self.insert_appropriately(AppendNode(child.clone()));
- self.add_to_open_elems(child)
- }
-
- fn append_tag(&mut self, tag: Tag) -> XmlProcessResult {
- let child = create_element(&mut self.sink, tag.name, tag.attrs);
- self.insert_appropriately(AppendNode(child.clone()));
- self.sink.pop(&child);
- Done
- }
-
- fn append_tag_to_doc(&mut self, tag: Tag) -> Handle {
- let child = create_element(&mut self.sink, tag.name, tag.attrs);
-
- self.sink.append(&self.doc_handle, AppendNode(child.clone()));
- child
- }
-
- fn add_to_open_elems(&mut self, el: Handle) -> XmlProcessResult {
- self.open_elems.push(el);
-
- Done
- }
-
- fn append_comment_to_doc(&mut self, text: StrTendril) -> XmlProcessResult {
- let comment = self.sink.create_comment(text);
- self.sink.append(&self.doc_handle, AppendNode(comment));
- Done
- }
-
- fn append_comment_to_tag(&mut self, text: StrTendril) -> XmlProcessResult {
- let target = current_node(&self.open_elems);
- let comment = self.sink.create_comment(text);
- self.sink.append(target, AppendNode(comment));
- Done
- }
-
- fn append_doctype_to_doc(&mut self, doctype: Doctype) -> XmlProcessResult {
- fn get_tendril(opt: Option) -> StrTendril {
- match opt {
- Some(expr) => expr,
- None => Tendril::new(),
- }
- };
- self.sink.append_doctype_to_document(
- get_tendril(doctype.name),
- get_tendril(doctype.public_id),
- get_tendril(doctype.system_id),
- );
- Done
- }
-
- fn append_pi_to_doc(&mut self, pi: Pi) -> XmlProcessResult {
- let pi = self.sink.create_pi(pi.target, pi.data);
- self.sink.append(&self.doc_handle, AppendNode(pi));
- Done
- }
-
- fn append_pi_to_tag(&mut self, pi: Pi) -> XmlProcessResult {
- let target = current_node(&self.open_elems);
- let pi = self.sink.create_pi(pi.target, pi.data);
- self.sink.append(target, AppendNode(pi));
- Done
- }
-
-
- fn append_text(&mut self, chars: StrTendril)
- -> XmlProcessResult {
- self.insert_appropriately(AppendText(chars));
- Done
- }
-
- fn tag_in_open_elems(&self, tag: &Tag) -> bool {
- self.open_elems
- .iter()
- .any(|a| self.sink.elem_name(a) == tag.name.expanded())
- }
-
- // Pop elements until an element from the set has been popped. Returns the
- // number of elements popped.
- fn pop_until (&mut self, pred: P)
- where P: Fn(ExpandedName) -> bool
- {
- loop {
- if self.current_node_in(|x| pred(x)) {
- break;
- }
- self.pop();
- }
- }
-
- fn current_node_in(&self, set: TagSet) -> bool
- where TagSet: Fn(ExpandedName) -> bool
- {
- // FIXME: take namespace into consideration:
- set(self.sink.elem_name(self.current_node()))
- }
-
- fn close_tag(&mut self, tag: Tag) -> XmlProcessResult {
- debug!("Close tag: current_node.name {:?} \n Current tag {:?}",
- self.sink.elem_name(self.current_node()), &tag.name);
-
- if *self.sink.elem_name(self.current_node()).local != tag.name.local {
- self.sink.parse_error(Borrowed("Current node doesn't match tag"));
- }
-
- let is_closed = self.tag_in_open_elems(&tag);
-
- if is_closed {
- self.pop_until(|p| p == tag.name.expanded());
- self.pop();
- }
-
- Done
- }
-
- fn no_open_elems(&self) -> bool {
- self.open_elems.is_empty()
- }
-
- fn pop(&mut self) -> Handle {
- self.namespace_stack.pop();
- let node = self.open_elems.pop().expect("no current element");
- self.sink.pop(&node);
- node
- }
-
- fn stop_parsing(&mut self) -> XmlProcessResult {
- warn!("stop_parsing for XML5 not implemented, full speed ahead!");
- Done
- }
-
- fn complete_script(&mut self) {
- let current = current_node(&self.open_elems);
- if self.sink.complete_script(current) == NextParserState::Suspend {
- self.next_tokenizer_state = Some(Quiescent);
- }
- }
-}
diff --git a/xml5ever/src/tree_builder/mod.rs b/xml5ever/src/tree_builder/mod.rs
index a54bf4df..bef966c4 100644
--- a/xml5ever/src/tree_builder/mod.rs
+++ b/xml5ever/src/tree_builder/mod.rs
@@ -7,8 +7,6 @@
// option. This file may not be copied, modified, or distributed
// except according to those terms.
-mod actions;
-mod rules;
mod types;
use std::borrow::{Cow};
@@ -19,14 +17,17 @@ use std::fmt::{Formatter, Debug, Error};
use std::result::Result;
use std::mem;
-
use {Prefix, Namespace, LocalName};
-use interface::{self, QualName, Attribute};
-use tokenizer::{self, TokenSink, Tag, StartTag};
+use interface::{self, QualName, Attribute, AppendNode, create_element};
+use interface::{AppendText, ExpandedName};
+use tokenizer::{self, TokenSink, Tag, StartTag, EndTag};
+use tokenizer::{ShortTag, EmptyTag, Pi, Doctype};
+use tokenizer::states::Quiescent;
pub use self::interface::{TreeSink, Tracer, NodeOrText, NextParserState};
-use self::rules::XmlTreeBuilderStep;
use self::types::*;
+use tendril::{StrTendril, Tendril};
+
static XML_URI: &'static str = "http://www.w3.org/XML/1998/namespace";
static XMLNS_URI: &'static str = "http://www.w3.org/2000/xmlns/";
@@ -434,3 +435,329 @@ impl TokenSink
self.next_tokenizer_state.take()
}
}
+
+// Borrow the last (innermost) handle of `open_elems`.
+//
+// Kept as a free function so callers can borrow only the `open_elems`
+// field while still using `self.sink` mutably.
+// Panics with "no current element" if the slice is empty.
+fn current_node<Handle>(open_elems: &[Handle]) -> &Handle {
+    open_elems.last().expect("no current element")
+}
+
+#[doc(hidden)]
+impl<Handle, Sink> XmlTreeBuilder<Handle, Sink>
+    where Handle: Clone,
+          Sink: TreeSink<Handle=Handle>,
+{
+    // Borrow the innermost open element.
+    // Panics with "no current element" if no element is open.
+    fn current_node(&self) -> &Handle {
+        current_node(&self.open_elems)
+    }
+
+    // Append `child` (a node or a run of text) to the current node.
+    fn insert_appropriately(&mut self, child: NodeOrText<Handle>) {
+        let target = current_node(&self.open_elems);
+        self.sink.append(target, child);
+    }
+
+    // Create an element for `tag`, append it to the current node and push
+    // it onto the stack of open elements.
+    fn insert_tag(&mut self, tag: Tag) -> XmlProcessResult {
+        let child = create_element(&mut self.sink, tag.name, tag.attrs);
+        self.insert_appropriately(AppendNode(child.clone()));
+        self.add_to_open_elems(child)
+    }
+
+    // Create an element for `tag` and append it to the current node without
+    // opening it: the sink is told right away that the element was popped.
+    fn append_tag(&mut self, tag: Tag) -> XmlProcessResult {
+        let child = create_element(&mut self.sink, tag.name, tag.attrs);
+        self.insert_appropriately(AppendNode(child.clone()));
+        self.sink.pop(&child);
+        Done
+    }
+
+    // Create an element for `tag`, append it directly to the document node
+    // and hand the new element's handle back to the caller.
+    fn append_tag_to_doc(&mut self, tag: Tag) -> Handle {
+        let child = create_element(&mut self.sink, tag.name, tag.attrs);
+
+        self.sink.append(&self.doc_handle, AppendNode(child.clone()));
+        child
+    }
+
+    // Push `el` onto the stack of open elements.
+    fn add_to_open_elems(&mut self, el: Handle) -> XmlProcessResult {
+        self.open_elems.push(el);
+
+        Done
+    }
+
+    // Create a comment node and append it to the document node.
+    fn append_comment_to_doc(&mut self, text: StrTendril) -> XmlProcessResult {
+        let comment = self.sink.create_comment(text);
+        self.sink.append(&self.doc_handle, AppendNode(comment));
+        Done
+    }
+
+    // Create a comment node and append it to the current node.
+    fn append_comment_to_tag(&mut self, text: StrTendril) -> XmlProcessResult {
+        let target = current_node(&self.open_elems);
+        let comment = self.sink.create_comment(text);
+        self.sink.append(target, AppendNode(comment));
+        Done
+    }
+
+    // Forward a doctype to the sink. A missing name, public id or system id
+    // is passed on as an empty tendril.
+    fn append_doctype_to_doc(&mut self, doctype: Doctype) -> XmlProcessResult {
+        self.sink.append_doctype_to_document(
+            doctype.name.unwrap_or_else(Tendril::new),
+            doctype.public_id.unwrap_or_else(Tendril::new),
+            doctype.system_id.unwrap_or_else(Tendril::new),
+        );
+        Done
+    }
+
+    // Create a processing instruction node and append it to the document node.
+    fn append_pi_to_doc(&mut self, pi: Pi) -> XmlProcessResult {
+        let pi = self.sink.create_pi(pi.target, pi.data);
+        self.sink.append(&self.doc_handle, AppendNode(pi));
+        Done
+    }
+
+    // Create a processing instruction node and append it to the current node.
+    fn append_pi_to_tag(&mut self, pi: Pi) -> XmlProcessResult {
+        let target = current_node(&self.open_elems);
+        let pi = self.sink.create_pi(pi.target, pi.data);
+        self.sink.append(target, AppendNode(pi));
+        Done
+    }
+
+    // Append character data to the current node.
+    fn append_text(&mut self, chars: StrTendril) -> XmlProcessResult {
+        self.insert_appropriately(AppendText(chars));
+        Done
+    }
+
+    // True if some open element has the same expanded name as `tag`.
+    fn tag_in_open_elems(&self, tag: &Tag) -> bool {
+        self.open_elems
+            .iter()
+            .any(|a| self.sink.elem_name(a) == tag.name.expanded())
+    }
+
+    // Pop elements until the current node satisfies `pred`. The matching
+    // element itself stays on the stack and nothing is returned.
+    // Panics ("no current element") if the stack empties before a match,
+    // so callers must first make sure a matching element is open.
+    fn pop_until<P>(&mut self, pred: P)
+        where P: Fn(ExpandedName) -> bool
+    {
+        while !self.current_node_in(|x| pred(x)) {
+            self.pop();
+        }
+    }
+
+    // True if the expanded name of the current node satisfies `set`.
+    fn current_node_in<TagSet>(&self, set: TagSet) -> bool
+        where TagSet: Fn(ExpandedName) -> bool
+    {
+        // FIXME: take namespace into consideration:
+        set(self.sink.elem_name(self.current_node()))
+    }
+
+    // Handle an end tag.
+    //
+    // Reports a parse error when the local name of the current node differs
+    // from the tag's. If an element with the tag's expanded name is open,
+    // everything above it and then the element itself are popped; otherwise
+    // the stack is left untouched.
+    fn close_tag(&mut self, tag: Tag) -> XmlProcessResult {
+        debug!("Close tag: current_node.name {:?} \n Current tag {:?}",
+               self.sink.elem_name(self.current_node()), &tag.name);
+
+        if *self.sink.elem_name(self.current_node()).local != tag.name.local {
+            self.sink.parse_error(Borrowed("Current node doesn't match tag"));
+        }
+
+        if self.tag_in_open_elems(&tag) {
+            // `pop_until` stops with the match still on the stack ...
+            self.pop_until(|p| p == tag.name.expanded());
+            // ... so one more pop closes the matching element itself.
+            self.pop();
+        }
+
+        Done
+    }
+
+    // True when the stack of open elements is empty.
+    fn no_open_elems(&self) -> bool {
+        self.open_elems.is_empty()
+    }
+
+    // Pop the current node: drops the top of the namespace stack, removes
+    // the element from the open elements and notifies the sink.
+    // Panics with "no current element" if no element is open.
+    fn pop(&mut self) -> Handle {
+        self.namespace_stack.pop();
+        let node = self.open_elems.pop().expect("no current element");
+        self.sink.pop(&node);
+        node
+    }
+
+    // Placeholder: only logs a warning and reports `Done`.
+    fn stop_parsing(&mut self) -> XmlProcessResult {
+        warn!("stop_parsing for XML5 not implemented, full speed ahead!");
+        Done
+    }
+
+    // Tell the sink that the current node (expected to be a script element)
+    // is complete; if the sink asks to suspend, queue a switch of the
+    // tokenizer to the `Quiescent` state.
+    fn complete_script(&mut self) {
+        let current = current_node(&self.open_elems);
+        if self.sink.complete_script(current) == NextParserState::Suspend {
+            self.next_tokenizer_state = Some(Quiescent);
+        }
+    }
+}
+
+// True when `x` holds at least one byte that is not a tab, carriage
+// return, line feed, form feed or space.
+fn any_not_whitespace(x: &StrTendril) -> bool {
+    x.bytes().any(|byte| !matches!(byte, b'\t' | b'\r' | b'\n' | b'\x0C' | b' '))
+}
+
+#[doc(hidden)]
+impl<Handle, Sink> XmlTreeBuilder<Handle, Sink>
+    where Handle: Clone,
+          Sink: TreeSink<Handle=Handle>,
+{
+    // Process a single `token` according to the rules of phase `mode`.
+    //
+    // * `StartPhase`: nothing is open yet. The first start tag becomes the
+    //   root and switches to `MainPhase`; an empty tag becomes a childless
+    //   root and switches to `EndPhase`. Comments, PIs and the doctype are
+    //   attached to the document; whitespace-only text is ignored.
+    // * `MainPhase`: content is attached to the current node. Once the last
+    //   open element is closed the builder moves to `EndPhase`.
+    // * `EndPhase`: only comments, PIs and whitespace are accepted; EOF
+    //   stops parsing and anything else is a parse error.
+    //
+    // Returns `Done`, or `Reprocess(phase, token)` when the token has to be
+    // handled again in another phase.
+    fn step(&mut self, mode: XmlPhase, token: Token) -> XmlProcessResult {
+        self.debug_step(mode, &token);
+
+        match mode {
+            StartPhase => match token {
+                TagToken(mut tag @ Tag { kind: StartTag, .. }) => {
+                    self.process_namespaces(&mut tag);
+                    self.phase = MainPhase;
+                    let handle = self.append_tag_to_doc(tag);
+                    self.add_to_open_elems(handle)
+                },
+                TagToken(mut tag @ Tag { kind: EmptyTag, .. }) => {
+                    self.process_namespaces(&mut tag);
+                    // A self-closing root has no content, so the main phase
+                    // is skipped entirely.
+                    self.phase = EndPhase;
+                    let handle = self.append_tag_to_doc(tag);
+                    self.sink.pop(&handle);
+                    Done
+                },
+                CommentToken(comment) => {
+                    self.append_comment_to_doc(comment)
+                },
+                PIToken(pi) => {
+                    self.append_pi_to_doc(pi)
+                },
+                CharacterTokens(ref chars)
+                    if !any_not_whitespace(chars) => {
+                        Done
+                },
+                EOFToken => {
+                    self.sink.parse_error(Borrowed("Unexpected EOF in start phase"));
+                    Reprocess(EndPhase, EOFToken)
+                },
+                DoctypeToken(d) => {
+                    self.append_doctype_to_doc(d)
+                },
+                _ => {
+                    self.sink.parse_error(Borrowed("Unexpected element in start phase"));
+                    Done
+                },
+            },
+            MainPhase => match token {
+                CharacterTokens(chs) => {
+                    self.append_text(chs)
+                },
+                TagToken(mut tag @ Tag { kind: StartTag, .. }) => {
+                    self.process_namespaces(&mut tag);
+                    self.insert_tag(tag)
+                },
+                TagToken(mut tag @ Tag { kind: EmptyTag, .. }) => {
+                    self.process_namespaces(&mut tag);
+                    if tag.name.local == local_name!("script") {
+                        // A self-closing script is opened, completed and
+                        // closed in one go so the sink still sees it as the
+                        // current node when `complete_script` runs.
+                        self.insert_tag(tag.clone());
+                        self.complete_script();
+                        self.close_tag(tag)
+                    } else {
+                        self.append_tag(tag)
+                    }
+                },
+                TagToken(mut tag @ Tag { kind: EndTag, .. }) => {
+                    self.process_namespaces(&mut tag);
+                    if tag.name.local == local_name!("script") {
+                        self.complete_script();
+                    }
+                    let retval = self.close_tag(tag);
+                    if self.no_open_elems() {
+                        self.phase = EndPhase;
+                    }
+                    retval
+                },
+                TagToken(Tag { kind: ShortTag, .. }) => {
+                    // A short end tag closes whatever element is current.
+                    self.pop();
+                    if self.no_open_elems() {
+                        self.phase = EndPhase;
+                    }
+                    Done
+                },
+                CommentToken(comment) => {
+                    self.append_comment_to_tag(comment)
+                },
+                PIToken(pi) => {
+                    self.append_pi_to_tag(pi)
+                },
+                EOFToken | NullCharacterToken => {
+                    Reprocess(EndPhase, EOFToken)
+                },
+                DoctypeToken(_) => {
+                    self.sink.parse_error(Borrowed("Unexpected element in main phase"));
+                    Done
+                },
+            },
+            EndPhase => match token {
+                CommentToken(comment) => {
+                    self.append_comment_to_doc(comment)
+                },
+                PIToken(pi) => {
+                    self.append_pi_to_doc(pi)
+                },
+                CharacterTokens(ref chars)
+                    if !any_not_whitespace(chars) => {
+                        Done
+                },
+                EOFToken => {
+                    self.stop_parsing()
+                },
+                _ => {
+                    self.sink.parse_error(Borrowed("Unexpected element in end phase"));
+                    Done
+                },
+            },
+        }
+    }
+}
diff --git a/xml5ever/src/tree_builder/rules.rs b/xml5ever/src/tree_builder/rules.rs
deleted file mode 100644
index 036b1214..00000000
--- a/xml5ever/src/tree_builder/rules.rs
+++ /dev/null
@@ -1,189 +0,0 @@
-// Copyright 2014-2017 The html5ever Project Developers. See the
-// COPYRIGHT file at the top-level directory of this distribution.
-//
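-// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
-// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
-// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your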
-// option. This file may not be copied, modified, or distributed
-// except according to those terms.
-
-use interface::TreeSink;
-use std::borrow::Cow::Borrowed;
-use tendril::StrTendril;
-use tokenizer::{Tag, StartTag, EndTag, ShortTag, EmptyTag};
-use tree_builder::types::*;
-use tree_builder::actions::XmlTreeBuilderActions;
-
-fn any_not_whitespace(x: &StrTendril) -> bool {
- !x.bytes().all(|b| matches!(b, b'\t' | b'\r' | b'\n' | b'\x0C' | b' '))
-}
-
-/// Encapsulates rules needed to build a tree representation.
-pub trait XmlTreeBuilderStep {
-
- /// Each step presents resolving received Token, in a
- /// given XmlPhase.
- fn step(&mut self, mode: XmlPhase, token: Token) -> XmlProcessResult;
-}
-
-#[doc(hidden)]
-impl XmlTreeBuilderStep
- for super::XmlTreeBuilder
- where Handle: Clone,
- Sink: TreeSink,
-{
-
- fn step(&mut self, mode: XmlPhase, token: Token) -> XmlProcessResult {
- self.debug_step(mode, &token);
-
- match mode {
- StartPhase => match token {
- TagToken(Tag{kind: StartTag, name, attrs}) => {
- let tag = {
- let mut tag = Tag {
- kind: StartTag,
- name: name,
- attrs: attrs,
- };
- self.process_namespaces(&mut tag);
- tag
- };
- self.phase = MainPhase;
- let handle = self.append_tag_to_doc(tag);
- self.add_to_open_elems(handle)
- },
- TagToken(Tag{kind: EmptyTag, name, attrs}) => {
- let tag = {
- let mut tag = Tag {
- kind: EmptyTag,
- name: name,
- attrs: attrs,
- };
- self.process_namespaces(&mut tag);
- tag
- };
- self.phase = EndPhase;
- let handle = self.append_tag_to_doc(tag);
- self.sink.pop(&handle);
- Done
- },
- CommentToken(comment) => {
- self.append_comment_to_doc(comment)
- },
- PIToken(pi) => {
- self.append_pi_to_doc(pi)
- },
- CharacterTokens(ref chars)
- if !any_not_whitespace(chars) => {
- Done
- },
- EOFToken => {
- self.sink.parse_error(Borrowed("Unexpected EOF in start phase"));
- Reprocess(EndPhase, EOFToken)
- },
- DoctypeToken(d) => {
- self.append_doctype_to_doc(d);
- Done
- },
- _ => {
- self.sink.parse_error(Borrowed("Unexpected element in start phase"));
- Done
- },
- },
- MainPhase => match token {
- CharacterTokens(chs) => {
- self.append_text(chs)
- },
- TagToken(Tag{kind: StartTag, name, attrs}) => {
- let tag = {
- let mut tag = Tag {
- kind: StartTag,
- name: name,
- attrs: attrs,
- };
- self.process_namespaces(&mut tag);
- tag
- };
- self.insert_tag(tag)
- },
- TagToken(Tag{kind: EmptyTag, name, attrs}) => {
- let tag = {
- let mut tag = Tag {
- kind: EmptyTag,
- name: name,
- attrs: attrs,
- };
- self.process_namespaces(&mut tag);
- tag
- };
- if tag.name.local == local_name!("script") {
- self.insert_tag(tag.clone());
- self.complete_script();
- self.close_tag(tag)
- } else {
- self.append_tag(tag)
- }
- },
- TagToken(Tag{kind: EndTag, name, attrs}) => {
- let tag = {
- let mut tag = Tag {
- kind: EndTag,
- name: name,
- attrs: attrs,
- };
- self.process_namespaces(&mut tag);
- tag
- };
- if tag.name.local == local_name!("script") {
- self.complete_script();
- }
- let retval = self.close_tag(tag);
- if self.no_open_elems() {
- self.phase = EndPhase;
- }
- retval
- },
- TagToken(Tag{kind: ShortTag, ..}) => {
- self.pop();
- if self.no_open_elems() {
- self.phase = EndPhase;
- }
- Done
- },
- CommentToken(comment) => {
- self.append_comment_to_tag(comment)
- },
- PIToken(pi) => {
- self.append_pi_to_tag(pi)
- },
- EOFToken | NullCharacterToken=> {
- Reprocess(EndPhase, EOFToken)
- }
- DoctypeToken(_) => {
- self.sink.parse_error(Borrowed("Unexpected element in main phase"));
- Done
- }
- },
- EndPhase => match token {
- CommentToken(comment) => {
- self.append_comment_to_doc(comment)
- },
- PIToken(pi) => {
- self.append_pi_to_doc(pi)
- },
- CharacterTokens(ref chars)
- if !any_not_whitespace(chars) => {
- Done
- },
- EOFToken => {
- self.stop_parsing()
- }
- _ => {
- self.sink.parse_error(Borrowed("Unexpected element in end phase"));
- Done
- }
- },
-
- }
- }
-}
| |