systemd-cron-next/vendor/regex/examples/shootout-regex-dna-single.rs
2024-11-12 15:03:58 +03:00

56 lines
1.6 KiB
Rust

// The Computer Language Benchmarks Game
// http://benchmarksgame.alioth.debian.org/
//
// contributed by the Rust Project Developers
// contributed by TeXitoi
// contributed by BurntSushi
extern crate regex;
use std::io::{self, Read};
/// Compiles the given pattern expression with `::regex::Regex::new` and
/// unwraps the result, so an invalid pattern panics at the call site.
macro_rules! regex {
    ($pattern:expr) => {
        ::regex::Regex::new($pattern).unwrap()
    };
}
/// Entry point of the benchmark.
///
/// Reads all of stdin into a string, removes every span running from a `>`
/// to the end of its line as well as every remaining newline, prints the
/// number of matches of each variant pattern in the cleaned sequence, applies
/// the single-letter substitutions in order, and finally prints three
/// lengths: the raw input, the cleaned sequence, and the substituted sequence.
///
/// # Panics
///
/// Panics if reading stdin fails (including input that is not valid UTF-8)
/// or if any pattern passed to `regex!` fails to compile.
fn main() {
    // Reserve 50 MiB up front; presumably sized for the benchmark's input so
    // the buffer does not have to grow while reading.
    let mut seq = String::with_capacity(50 * (1 << 20));
    io::stdin().read_to_string(&mut seq).unwrap();
    let ilen = seq.len();

    // Strip `>`-introduced lines and all newlines, leaving only sequence data.
    seq = regex!(">[^\n]*\n|\n").replace_all(&seq, "");
    let clen = seq.len();

    let variants = vec![
        regex!("agggtaaa|tttaccct"),
        regex!("[cgt]gggtaaa|tttaccc[acg]"),
        regex!("a[act]ggtaaa|tttacc[agt]t"),
        regex!("ag[act]gtaaa|tttac[agt]ct"),
        regex!("agg[act]taaa|ttta[agt]cct"),
        regex!("aggg[acg]aaa|ttt[cgt]ccct"),
        regex!("agggt[cgt]aa|tt[acg]accct"),
        regex!("agggta[cgt]a|t[acg]taccct"),
        regex!("agggtaa[cgt]|[acg]ttaccct"),
    ];
    for re in variants {
        // The regex is formatted directly via `Display`; calling
        // `to_string()` first would only allocate a temporary `String`.
        println!("{} {}", re, re.find_iter(&seq).count());
    }

    // Each pair is (pattern to find, replacement text); they are applied in
    // the order listed, each pass operating on the previous pass's output.
    let substs = vec![
        (regex!("B"), "(c|g|t)"),
        (regex!("D"), "(a|g|t)"),
        (regex!("H"), "(a|c|t)"),
        (regex!("K"), "(g|t)"),
        (regex!("M"), "(a|c)"),
        (regex!("N"), "(a|c|g|t)"),
        (regex!("R"), "(a|g)"),
        (regex!("S"), "(c|g)"),
        (regex!("V"), "(a|c|g)"),
        (regex!("W"), "(a|t)"),
        (regex!("Y"), "(c|t)"),
    ];
    // `seq` is already mutable, so it is reassigned in place.
    for (re, replacement) in substs {
        seq = re.replace_all(&seq, replacement);
    }

    println!("\n{}\n{}\n{}", ilen, clen, seq.len());
}