https://github.com/moses-smt/mosesdecoder/tree/RELEASE-4.0
https://github.com/moses-smt/giza-pp
http://www.speech.sri.com/projects/srilm/download.html
~/mosesdecoder/scripts/training/clean-corpus-n.perl corpus/test id pnk corpus/clean 1 50
~/mosesdecoder/scripts/tokenizer/lowercase.perl < corpus/clean.id > corpus/lowercased.id
~/mosesdecoder/scripts/tokenizer/lowercase.perl < corpus/clean.pnk > corpus/lowercased.pnk
~/mosesdecoder/scripts/tokenizer/tokenizer.perl < corpus/lowercased.id > corpus/tokenized.id
~/mosesdecoder/scripts/tokenizer/tokenizer.perl < corpus/lowercased.pnk > corpus/tokenized.pnk
~/srilm-1.7.2/bin/i686-m64/ngram-count -order 3 -interpolate -unk -text corpus/tokenized.pnk -lm lm/pnk.lm
~/mosesdecoder/scripts/training/train-model.perl -root-dir . --corpus corpus/tokenized --f id --e pnk --lm 0:3:/home/tikuntan/mosestest/lm/pnk.lm -external-bin-dir ~/mosesdecoder/bin
~/mosesdecoder/bin/moses -f model/moses.ini
BLEU
~/mosesdecoder/bin/moses -f model/moses.ini < intest > out
~/mosesdecoder/scripts/generic/multi-bleu.perl ref < out
Contoh aplikasi :