// The Computer Language Benchmarks Game
// http://benchmarksgame.alioth.debian.org/
//
// contributed by the Rust Project Developers
// contributed by TeXitoi
// contributed by BurntSushi
| |
| extern crate regex; |
| |
| use std::io::{self, Read}; |
| |
/// Builds a `::regex::Regex` from the given pattern expression.
///
/// The result of `Regex::new` is unwrapped, so an invalid pattern panics at
/// the point where the macro is used.
macro_rules! regex {
    ($pattern:expr) => {
        ::regex::Regex::new($pattern).unwrap()
    };
}
| |
| fn main() { |
| let mut seq = String::with_capacity(50 * (1 << 20)); |
| io::stdin().read_to_string(&mut seq).unwrap(); |
| let ilen = seq.len(); |
| |
| seq = regex!(">[^\n]*\n|\n").replace_all(&seq, "").into_owned(); |
| let clen = seq.len(); |
| |
| let variants = vec![ |
| regex!("agggtaaa|tttaccct"), |
| regex!("[cgt]gggtaaa|tttaccc[acg]"), |
| regex!("a[act]ggtaaa|tttacc[agt]t"), |
| regex!("ag[act]gtaaa|tttac[agt]ct"), |
| regex!("agg[act]taaa|ttta[agt]cct"), |
| regex!("aggg[acg]aaa|ttt[cgt]ccct"), |
| regex!("agggt[cgt]aa|tt[acg]accct"), |
| regex!("agggta[cgt]a|t[acg]taccct"), |
| regex!("agggtaa[cgt]|[acg]ttaccct"), |
| ]; |
| for re in variants { |
| println!("{} {}", re.to_string(), re.find_iter(&seq).count()); |
| } |
| |
| let substs = vec![ |
| (regex!("B"), "(c|g|t)"), |
| (regex!("D"), "(a|g|t)"), |
| (regex!("H"), "(a|c|t)"), |
| (regex!("K"), "(g|t)"), |
| (regex!("M"), "(a|c)"), |
| (regex!("N"), "(a|c|g|t)"), |
| (regex!("R"), "(a|g)"), |
| (regex!("S"), "(c|g)"), |
| (regex!("V"), "(a|c|g)"), |
| (regex!("W"), "(a|t)"), |
| (regex!("Y"), "(c|t)"), |
| ]; |
| let mut seq = seq; |
| for (re, replacement) in substs { |
| seq = re.replace_all(&seq, replacement).into_owned(); |
| } |
| println!("\n{}\n{}\n{}", ilen, clen, seq.len()); |
| } |