From 7d1c9ea3140bc5c2f3f9bf252c745151c4b64a85 Mon Sep 17 00:00:00 2001 From: Vu Cong Duy Hoang Date: Thu, 5 Apr 2018 19:06:51 +0200 Subject: [PATCH] fixed minor bug in get_ende_bleu.sh (#685) --- tensor2tensor/utils/get_ende_bleu.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tensor2tensor/utils/get_ende_bleu.sh b/tensor2tensor/utils/get_ende_bleu.sh index 0de433e33..805347231 100755 --- a/tensor2tensor/utils/get_ende_bleu.sh +++ b/tensor2tensor/utils/get_ende_bleu.sh @@ -13,7 +13,7 @@ perl $mosesdecoder/scripts/tokenizer/tokenizer.perl -l de < $decodes_file > $dec # 'Also, for historical reasons, we split compound words, e.g., # "rich-text format" --> rich ##AT##-##AT## text format."' perl -ple 's{(\S)-(\S)}{$1 ##AT##-##AT## $2}g' < $tok_gold_targets > $tok_gold_targets.atat -perl -ple 's{(\S)-(\S)}{$1 ##AT##-##AT## $2}g' < $decodes_file.tok > $decodes_file.atat +perl -ple 's{(\S)-(\S)}{$1 ##AT##-##AT## $2}g' < $decodes_file.tok > $decodes_file.tok.atat # Get BLEU. perl $mosesdecoder/scripts/generic/multi-bleu.perl $tok_gold_targets.atat < $decodes_file.tok.atat