2009-08-05 14:03:46 -06:00
|
|
|
/*
|
|
|
|
Redistribution and use in source and binary forms, with or without
|
|
|
|
modification, are permitted provided that the following conditions are met:
|
|
|
|
|
|
|
|
* Redistributions of source code must retain the above copyright
|
|
|
|
notice, this list of conditions and the following disclaimer.
|
|
|
|
|
|
|
|
* Redistributions in binary form must reproduce the above copyright
|
|
|
|
notice, this list of conditions and the following disclaimer in the
|
|
|
|
documentation and/or other materials provided with the distribution.
|
|
|
|
|
|
|
|
* Neither the name of "The Computer Language Benchmarks Game" nor the
|
|
|
|
name of "The Computer Language Shootout Benchmarks" nor the names of
|
|
|
|
its contributors may be used to endorse or promote products derived
|
|
|
|
from this software without specific prior written permission.
|
|
|
|
|
|
|
|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
|
|
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
|
|
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
|
|
|
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
|
|
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
|
|
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
|
|
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
|
|
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
|
|
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
|
|
POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
*/
|
|
|
|
|
|
|
|
/* The Computer Language Benchmarks Game
|
|
|
|
* http://shootout.alioth.debian.org/
|
|
|
|
*
|
|
|
|
* contributed by The Go Authors.
|
|
|
|
*/
|
|
|
|
|
|
|
|
package main
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt";
|
2009-12-02 23:02:14 -07:00
|
|
|
"io/ioutil";
|
2009-08-05 14:03:46 -06:00
|
|
|
"os";
|
|
|
|
"regexp";
|
2009-08-05 18:25:38 -06:00
|
|
|
"strings";
|
2009-08-05 14:03:46 -06:00
|
|
|
)
|
|
|
|
|
2009-11-20 14:11:42 -07:00
|
|
|
// variants lists the regular expressions whose match counts main prints, in
// output order. Each entry alternates an eight-base sequence (or a version of
// it with one position widened to a three-base class) with what appears to be
// its reverse complement.
var variants = []string{
	`agggtaaa|tttaccct`,
	`[cgt]gggtaaa|tttaccc[acg]`,
	`a[act]ggtaaa|tttacc[agt]t`,
	`ag[act]gtaaa|tttac[agt]ct`,
	`agg[act]taaa|ttta[agt]cct`,
	`aggg[acg]aaa|ttt[cgt]ccct`,
	`agggt[cgt]aa|tt[acg]accct`,
	`agggta[cgt]a|t[acg]taccct`,
	`agggtaa[cgt]|[acg]ttaccct`,
}
|
|
|
|
|
|
|
|
// Subst describes one rewrite applied to the input: every match of the
// regular expression pat is replaced by the text repl.
type Subst struct {
	pat, repl string
}

// substs is the ordered table of rewrites main applies after counting the
// variants. Each entry expands a single uppercase code letter into a
// parenthesised alternation of lowercase bases (presumably the IUPAC
// ambiguity codes). The replacements contain no uppercase letters, so an
// earlier rewrite never produces text that a later pattern matches.
var substs = []Subst{
	{"B", "(c|g|t)"},
	{"D", "(a|g|t)"},
	{"H", "(a|c|t)"},
	{"K", "(g|t)"},
	{"M", "(a|c)"},
	{"N", "(a|c|g|t)"},
	{"R", "(a|g)"},
	{"S", "(c|g)"},
	{"V", "(a|c|g)"},
	{"W", "(a|t)"},
	{"Y", "(c|t)"},
}
|
|
|
|
|
2009-08-05 18:25:38 -06:00
|
|
|
// countMatches reports how many non-overlapping matches of the regular
// expression pat occur in bytes, scanning from left to right.
//
// pat is compiled with regexp.MustCompile, so an invalid pattern panics.
// A nil or empty bytes yields 0 for any pattern that cannot match the empty
// string.
func countMatches(pat string, bytes []byte) int {
	re := regexp.MustCompile(pat)
	// FindAllIndex yields one [start, end] pair per successive non-overlapping
	// match and steps past empty matches on its own, so a pattern that can
	// match the empty string cannot stall the scan the way a manual
	// "find, then reslice at the match end" loop does.
	return len(re.FindAllIndex(bytes, -1))
}
|
|
|
|
|
|
|
|
func main() {
|
2009-12-02 23:02:14 -07:00
|
|
|
bytes, err := ioutil.ReadFile("/dev/stdin");
|
2009-08-05 14:03:46 -06:00
|
|
|
if err != nil {
|
|
|
|
fmt.Fprintf(os.Stderr, "can't read input: %s\n", err);
|
|
|
|
os.Exit(2);
|
|
|
|
}
|
2009-08-05 18:25:38 -06:00
|
|
|
ilen := len(bytes);
|
2009-08-05 14:03:46 -06:00
|
|
|
// Delete the comment lines and newlines
|
2009-11-02 12:37:52 -07:00
|
|
|
bytes = regexp.MustCompile("(>[^\n]+)?\n").ReplaceAll(bytes, []byte{});
|
2009-08-05 18:25:38 -06:00
|
|
|
clen := len(bytes);
|
2009-09-15 13:42:24 -06:00
|
|
|
for _, s := range variants {
|
2009-11-20 14:11:42 -07:00
|
|
|
fmt.Printf("%s %d\n", s, countMatches(s, bytes))
|
2009-08-05 14:03:46 -06:00
|
|
|
}
|
2009-09-15 13:42:24 -06:00
|
|
|
for _, sub := range substs {
|
2009-11-20 14:11:42 -07:00
|
|
|
bytes = regexp.MustCompile(sub.pat).ReplaceAll(bytes, strings.Bytes(sub.repl))
|
2009-08-05 14:03:46 -06:00
|
|
|
}
|
2009-08-05 18:25:38 -06:00
|
|
|
fmt.Printf("\n%d\n%d\n%d\n", ilen, clen, len(bytes));
|
2009-08-05 14:03:46 -06:00
|
|
|
}
|