diff options
Diffstat (limited to 'vendor/markup5ever/build.rs')
-rw-r--r-- | vendor/markup5ever/build.rs | 131 |
1 files changed, 131 insertions, 0 deletions
diff --git a/vendor/markup5ever/build.rs b/vendor/markup5ever/build.rs new file mode 100644 index 000000000..38b4fdddc --- /dev/null +++ b/vendor/markup5ever/build.rs @@ -0,0 +1,131 @@ +// Copyright 2014-2017 The html5ever Project Developers. See the +// COPYRIGHT file at the top-level directory of this distribution. +// +// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or +// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license +// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your +// option. This file may not be copied, modified, or distributed +// except according to those terms. + +extern crate phf_codegen; +extern crate string_cache_codegen; + +use std::collections::HashMap; +use std::env; +use std::fs::File; +use std::io::{BufRead, BufReader, BufWriter, Write}; +use std::path::Path; + +mod entities; + +static NAMESPACES: &[(&str, &str)] = &[ + ("", ""), + ("*", "*"), + ("html", "http://www.w3.org/1999/xhtml"), + ("xml", "http://www.w3.org/XML/1998/namespace"), + ("xmlns", "http://www.w3.org/2000/xmlns/"), + ("xlink", "http://www.w3.org/1999/xlink"), + ("svg", "http://www.w3.org/2000/svg"), + ("mathml", "http://www.w3.org/1998/Math/MathML"), +]; + +fn main() { + let generated = Path::new(&env::var("OUT_DIR").unwrap()).join("generated.rs"); + let mut generated = BufWriter::new(File::create(&generated).unwrap()); + + named_entities_to_phf(&Path::new(&env::var("OUT_DIR").unwrap()).join("named_entities.rs")); + + // Create a string cache for local names + let local_names = Path::new(&env::var("CARGO_MANIFEST_DIR").unwrap()).join("local_names.txt"); + let mut local_names_atom = string_cache_codegen::AtomType::new("LocalName", "local_name!"); + for line in BufReader::new(File::open(&local_names).unwrap()).lines() { + let local_name = line.unwrap(); + local_names_atom.atom(&local_name); + local_names_atom.atom(&local_name.to_ascii_lowercase()); + } + local_names_atom + .with_macro_doc("Takes a local name as a string and returns its key in the string cache.") + .write_to(&mut generated) + .unwrap(); + + // Create a string cache for namespace prefixes + string_cache_codegen::AtomType::new("Prefix", "namespace_prefix!") + .with_macro_doc("Takes a namespace prefix string and returns its key in a string cache.") + .atoms(NAMESPACES.iter().map(|&(prefix, _url)| prefix)) + .write_to(&mut generated) + .unwrap(); + + // Create a string cache for namespace urls + string_cache_codegen::AtomType::new("Namespace", "namespace_url!") + .with_macro_doc("Takes a namespace url string and returns its key in a string cache.") + .atoms(NAMESPACES.iter().map(|&(_prefix, url)| url)) + .write_to(&mut generated) + .unwrap(); + + writeln!( + generated, + r#" + /// Maps the input of [`namespace_prefix!`](macro.namespace_prefix.html) to + /// the output of [`namespace_url!`](macro.namespace_url.html). + /// + #[macro_export] macro_rules! ns {{ + "# + ) + .unwrap(); + for &(prefix, url) in NAMESPACES { + writeln!( + generated, + "({}) => {{ namespace_url!({:?}) }};", + prefix, url + ) + .unwrap(); + } + writeln!(generated, "}}").unwrap(); +} + +fn named_entities_to_phf(to: &Path) { + let mut entities: HashMap<&str, (u32, u32)> = entities::NAMED_ENTITIES + .iter() + .map(|(name, cp1, cp2)| { + assert!(name.starts_with('&')); + (&name[1..], (*cp1, *cp2)) + }) + .collect(); + + // Add every missing prefix of those keys, mapping to NULL characters. + for key in entities.keys().cloned().collect::<Vec<_>>() { + for n in 1..key.len() { + entities.entry(&key[..n]).or_insert((0, 0)); + } + } + entities.insert("", (0, 0)); + + let mut phf_map = phf_codegen::Map::new(); + for (key, value) in entities { + phf_map.entry(key, &format!("{:?}", value)); + } + + let mut file = File::create(to).unwrap(); + writeln!( + &mut file, + r#" +/// A map of entity names to their codepoints. The second codepoint will +/// be 0 if the entity contains a single codepoint. Entities have their preceeding '&' removed. +/// +/// # Examples +/// +/// ``` +/// use markup5ever::data::NAMED_ENTITIES; +/// +/// assert_eq!(NAMED_ENTITIES.get("gt;").unwrap(), &(62, 0)); +/// ``` +"# + ) + .unwrap(); + writeln!( + &mut file, + "pub static NAMED_ENTITIES: Map<&'static str, (u32, u32)> = {};", + phf_map.build(), + ) + .unwrap(); +} |