diff --git a/seed/system-eval.sh b/seed/system-eval.sh index 08d06b1c29f2d154fd74ac4b2cfa0b1fb83648d3..2e77c447357500582ac51d0c21fb21d819c5135e 100755 --- a/seed/system-eval.sh +++ b/seed/system-eval.sh @@ -1,20 +1,28 @@ #!/bin/sh -PATH="/usr/local/bin:/usr/local/libexec/mecab:/bin:/usr/lib/mecab:/usr/local/Cellar/mecab/0.994/libexec/mecab" +PATH="/usr/local/bin:/usr/local/libexec/mecab:/bin:/usr/lib/mecab:/usr/local/Cellar/mecab/0.996/libexec/mecab" export PATH export LANG=ja_JP.UTF-8 +cat corpus.misc.mc corpus.kanjikai.mc corpus.ryomou.mc \ + > corpus.non-KT.mc + +cat corpus.KT2.mc corpus.misc.mc corpus.kanjikai.mc corpus.ryomou.mc \ + > corpus.mixed.mc + +cat corpus.KT0.mc corpus.misc.mc corpus.kanjikai.mc corpus.ryomou.mc \ + > corpus.all.mc + #CORPUS_LIST="misc kanjikai ryomou jts-wa jts-JP" -CORPUS_LIST="misc kanjikai ryomou" +CORPUS_LIST="KT0 KT2 misc kanjikai ryomou non-KT mixed all" for i in $CORPUS_LIST do mecab-test-gen < "corpus.$i.mc" > "test.$i" done -#cat corpus \ -#cat corpus.*.txt \ +#cat corpus.*.mc \ #| grep -v EOS | sed 's/ /,0,0,0,/' | sort | uniq > misc.corpus.csv