source code
# The Computer Language Benchmarks Game
# http://benchmarksgame.alioth.debian.org
#
# regex-dna program contributed by jose fco. gonzalez
# optimized & parallelized by Rick Branson
# optimized for ruby2 by Aaron Tavistock
# converted from regex-dna program
seq = STDIN.readlines.join
ilen = seq.size
seq.gsub!(/>.*\n|\n/,"")
clen = seq.length
MATCHERS = [
/agggtaaa|tttaccct/,
/[cgt]gggtaaa|tttaccc[acg]/,
/a[act]ggtaaa|tttacc[agt]t/,
/ag[act]gtaaa|tttac[agt]ct/,
/agg[act]taaa|ttta[agt]cct/,
/aggg[acg]aaa|ttt[cgt]ccct/,
/agggt[cgt]aa|tt[acg]accct/,
/agggta[cgt]a|t[acg]taccct/,
/agggtaa[cgt]|[acg]ttaccct/
]
threads = MATCHERS.map do |f|
Thread.new do
Thread.current[:result] = "#{f.source} #{seq.scan(f).size}"
end
end
threads.each do |t|
t.join
end
match_results = threads.map do |t|
t[:result]
end
{
/tHa[Nt]/ => '<4>',
/aND|caN|Ha[DS]|WaS/ => '<3>',
/a[NSt]|BY/ => '<2>',
/<[^>]*>/ => '|',
/\|[^|][^|]*\|/ => '-'
}.each { |f,r| seq.gsub!(f,r) }
puts "#{match_results.join("\n")}\n\n#{ilen}\n#{clen}\n#{seq.length}"