summaryrefslogtreecommitdiffstats
path: root/third_party/rust/regex/examples/shootout-regex-dna-bytes.rs
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-28 14:29:10 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-28 14:29:10 +0000
commit2aa4a82499d4becd2284cdb482213d541b8804dd (patch)
treeb80bf8bf13c3766139fbacc530efd0dd9d54394c /third_party/rust/regex/examples/shootout-regex-dna-bytes.rs
parentInitial commit. (diff)
downloadfirefox-2aa4a82499d4becd2284cdb482213d541b8804dd.tar.xz
firefox-2aa4a82499d4becd2284cdb482213d541b8804dd.zip
Adding upstream version 86.0.1.upstream/86.0.1upstream
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'third_party/rust/regex/examples/shootout-regex-dna-bytes.rs')
-rw-r--r--third_party/rust/regex/examples/shootout-regex-dna-bytes.rs70
1 files changed, 70 insertions, 0 deletions
diff --git a/third_party/rust/regex/examples/shootout-regex-dna-bytes.rs b/third_party/rust/regex/examples/shootout-regex-dna-bytes.rs
new file mode 100644
index 0000000000..a763385c38
--- /dev/null
+++ b/third_party/rust/regex/examples/shootout-regex-dna-bytes.rs
@@ -0,0 +1,70 @@
+// The Computer Language Benchmarks Game
+// http://benchmarksgame.alioth.debian.org/
+//
+// contributed by the Rust Project Developers
+// contributed by TeXitoi
+// contributed by BurntSushi
+
+extern crate regex;
+
+use std::io::{self, Read};
+use std::sync::Arc;
+use std::thread;
+
+macro_rules! regex {
+ ($re:expr) => {
+ ::regex::bytes::Regex::new($re).unwrap()
+ };
+}
+
+fn main() {
+ let mut seq = Vec::with_capacity(51 * (1 << 20));
+ io::stdin().read_to_end(&mut seq).unwrap();
+ let ilen = seq.len();
+
+ seq = regex!(">[^\n]*\n|\n").replace_all(&seq, &b""[..]).into_owned();
+ let clen = seq.len();
+ let seq_arc = Arc::new(seq.clone());
+
+ let variants = vec![
+ regex!("agggtaaa|tttaccct"),
+ regex!("[cgt]gggtaaa|tttaccc[acg]"),
+ regex!("a[act]ggtaaa|tttacc[agt]t"),
+ regex!("ag[act]gtaaa|tttac[agt]ct"),
+ regex!("agg[act]taaa|ttta[agt]cct"),
+ regex!("aggg[acg]aaa|ttt[cgt]ccct"),
+ regex!("agggt[cgt]aa|tt[acg]accct"),
+ regex!("agggta[cgt]a|t[acg]taccct"),
+ regex!("agggtaa[cgt]|[acg]ttaccct"),
+ ];
+ let mut counts = vec![];
+ for variant in variants {
+ let seq = seq_arc.clone();
+ let restr = variant.to_string();
+ let future = thread::spawn(move || variant.find_iter(&seq).count());
+ counts.push((restr, future));
+ }
+
+ let substs = vec![
+ (regex!("B"), &b"(c|g|t)"[..]),
+ (regex!("D"), &b"(a|g|t)"[..]),
+ (regex!("H"), &b"(a|c|t)"[..]),
+ (regex!("K"), &b"(g|t)"[..]),
+ (regex!("M"), &b"(a|c)"[..]),
+ (regex!("N"), &b"(a|c|g|t)"[..]),
+ (regex!("R"), &b"(a|g)"[..]),
+ (regex!("S"), &b"(c|g)"[..]),
+ (regex!("V"), &b"(a|c|g)"[..]),
+ (regex!("W"), &b"(a|t)"[..]),
+ (regex!("Y"), &b"(c|t)"[..]),
+ ];
+ let mut seq = seq;
+ for (re, replacement) in substs {
+ seq = re.replace_all(&seq, replacement).into_owned();
+ }
+
+ for (variant, count) in counts {
+ println!("{} {}", variant, count.join().unwrap());
+ }
+ println!("\n{}\n{}\n{}", ilen, clen, seq.len());
+}