// Copyright 2014-2017 The html5ever Project Developers. See the // COPYRIGHT file at the top-level directory of this distribution. // // Licensed under the Apache License, Version 2.0 or the MIT license // , at your // option. This file may not be copied, modified, or distributed // except according to those terms. extern crate markup5ever_arcdom as arcdom; extern crate rustc_test as test; #[macro_use] extern crate html5ever; mod foreach_html5lib_test; use foreach_html5lib_test::foreach_html5lib_test; use std::collections::{HashMap, HashSet}; use std::default::Default; use std::ffi::OsStr; use std::io::BufRead; use std::iter::repeat; use std::mem::replace; use std::path::Path; use std::{env, fs, io}; use test::{DynTestName, TestDesc, TestDescAndFn, TestFn}; use arcdom::{ArcDom, Handle, NodeData}; use html5ever::tendril::{StrTendril, TendrilSink}; use html5ever::{parse_document, parse_fragment, ParseOpts}; use html5ever::{LocalName, QualName}; fn parse_tests>(mut lines: It) -> Vec> { let mut tests = vec![]; let mut test = HashMap::new(); let mut key: Option = None; let mut val = String::new(); macro_rules! finish_val ( () => ( match key.take() { None => (), Some(key) => { assert!(test.insert(key, replace(&mut val, String::new())).is_none()); } } )); macro_rules! finish_test ( () => ( if !test.is_empty() { tests.push(replace(&mut test, HashMap::new())); } )); loop { match lines.next() { None => break, Some(line) => { if line.starts_with("#") { finish_val!(); if line == "#data" { finish_test!(); } key = Some(line[1..].to_string()); } else { val.push_str(&line); val.push('\n'); } } } } finish_val!(); finish_test!(); tests } fn serialize(buf: &mut String, indent: usize, handle: Handle) { buf.push_str("|"); buf.push_str(&repeat(" ").take(indent).collect::()); let node = handle; match node.data { NodeData::Document => panic!("should not reach Document"), NodeData::Doctype { ref name, ref public_id, ref system_id, } => { buf.push_str("\n"); } NodeData::Text { ref contents } => { buf.push_str("\""); buf.push_str(&contents.borrow()); buf.push_str("\"\n"); } NodeData::Comment { ref contents } => { buf.push_str("\n"); } NodeData::Element { ref name, ref attrs, .. } => { buf.push_str("<"); match name.ns { ns!(svg) => buf.push_str("svg "), ns!(mathml) => buf.push_str("math "), _ => (), } buf.push_str(&*name.local); buf.push_str(">\n"); let mut attrs = attrs.borrow().clone(); attrs.sort_by(|x, y| x.name.local.cmp(&y.name.local)); // FIXME: sort by UTF-16 code unit for attr in attrs.into_iter() { buf.push_str("|"); buf.push_str(&repeat(" ").take(indent + 2).collect::()); match attr.name.ns { ns!(xlink) => buf.push_str("xlink "), ns!(xml) => buf.push_str("xml "), ns!(xmlns) => buf.push_str("xmlns "), _ => (), } buf.push_str(&format!("{}=\"{}\"\n", attr.name.local, attr.value)); } } NodeData::ProcessingInstruction { .. } => unreachable!(), } for child in node.children.borrow().iter() { serialize(buf, indent + 2, child.clone()); } if let NodeData::Element { template_contents: Some(ref content), .. } = node.data { buf.push_str("|"); buf.push_str(&repeat(" ").take(indent + 2).collect::()); buf.push_str("content\n"); for child in content.children.borrow().iter() { serialize(buf, indent + 4, child.clone()); } } } fn make_test( tests: &mut Vec, ignores: &HashSet, filename: &str, idx: usize, fields: HashMap, ) { let scripting_flags = &[false, true]; let scripting_flags = if fields.contains_key("script-off") { &scripting_flags[0..1] } else if fields.contains_key("script-on") { &scripting_flags[1..2] } else { &scripting_flags[0..2] }; let name = format!("tb: {}-{}", filename, idx); for scripting_enabled in scripting_flags { let test = make_test_desc_with_scripting_flag(ignores, &name, &fields, *scripting_enabled); tests.push(test); } } fn make_test_desc_with_scripting_flag( ignores: &HashSet, name: &str, fields: &HashMap, scripting_enabled: bool, ) -> TestDescAndFn { let get_field = |key| { let field = fields.get(key).expect("missing field"); field.trim_end_matches('\n').to_string() }; let mut data = fields.get("data").expect("missing data").to_string(); data.pop(); let expected = get_field("document"); let context = fields .get("document-fragment") .map(|field| context_name(field.trim_end_matches('\n'))); let ignore = ignores.contains(name); let mut name = name.to_owned(); if scripting_enabled { name.push_str(" (scripting enabled)"); } else { name.push_str(" (scripting disabled)"); }; let mut opts: ParseOpts = Default::default(); opts.tree_builder.scripting_enabled = scripting_enabled; TestDescAndFn { desc: TestDesc { ignore: ignore, ..TestDesc::new(DynTestName(name)) }, testfn: TestFn::dyn_test_fn(move || { // Do this here because Tendril isn't Send. let data = StrTendril::from_slice(&data); let mut result = String::new(); match context { None => { let dom = parse_document(ArcDom::default(), opts).one(data.clone()); for child in dom.document.children.borrow().iter() { serialize(&mut result, 1, child.clone()); } } Some(ref context) => { let dom = parse_fragment(ArcDom::default(), opts, context.clone(), vec![]) .one(data.clone()); // fragment case: serialize children of the html element // rather than children of the document let doc = &dom.document; let root = &doc.children.borrow()[0]; for child in root.children.borrow().iter() { serialize(&mut result, 1, child.clone()); } } }; let len = result.len(); result.truncate(len - 1); // drop the trailing newline if result != expected { panic!( "\ninput: {}\ngot:\n{}\nexpected:\n{}\n", data, result, expected ); } }), } } fn context_name(context: &str) -> QualName { if context.starts_with("svg ") { QualName::new(None, ns!(svg), LocalName::from(&context[4..])) } else if context.starts_with("math ") { QualName::new(None, ns!(mathml), LocalName::from(&context[5..])) } else { QualName::new(None, ns!(html), LocalName::from(context)) } } fn tests(src_dir: &Path, ignores: &HashSet) -> Vec { let mut tests = vec![]; foreach_html5lib_test( src_dir, "tree-construction", OsStr::new("dat"), |path, file| { let buf = io::BufReader::new(file); let lines = buf.lines().map(|res| res.ok().expect("couldn't read")); let data = parse_tests(lines); for (i, test) in data.into_iter().enumerate() { make_test( &mut tests, ignores, path.file_name().unwrap().to_str().unwrap(), i, test, ); } }, ); tests } fn main() { let args: Vec<_> = env::args().collect(); let src_dir = Path::new(env!("CARGO_MANIFEST_DIR")); let mut ignores = HashSet::new(); { let f = fs::File::open(&src_dir.join("data/test/ignore")).unwrap(); let r = io::BufReader::new(f); for ln in r.lines() { ignores.insert(ln.unwrap().trim_end().to_string()); } } test::test_main(&args, tests(src_dir, &ignores)); }