multilingual_fairseq_gen.sh 594 Bytes
Newer Older
Sugon_ldc's avatar
Sugon_ldc committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
#!/bin/bash
#
# Run fairseq-generate on the "test" subset of a multilingual dataset using a
# trained model and the translation_multi_simple_epoch task.
#
# Usage:
#   multilingual_fairseq_gen.sh <path_to_data> <lang_list> <model> \
#       [source_lang] [target_lang]
#
# Arguments:
#   $1  path to data
#   $2  path to a file which contains the list of languages separated by
#       new lines
#   $3  path to a trained model
#   $4  source language (optional, default: cs)
#   $5  target language (optional, default: en)
#
# Exit status:
#   2 if a required argument is missing or empty; otherwise the exit status
#   of fairseq-generate.

set -euo pipefail

# Print a short usage message to stderr.
usage() {
  printf 'Usage: %s <path_to_data> <lang_list> <model> [source_lang] [target_lang]\n' \
    "${0##*/}" >&2
}

# Fail fast with a clear message instead of handing empty strings to
# fairseq-generate and getting an unrelated error from deep inside it.
if (( $# < 3 )) || [[ -z "$1" || -z "$2" || -z "$3" ]]; then
  usage
  exit 2
fi

# Translation directions passed to --lang-pairs.
readonly lang_pairs="en-fr,en-cs,fr-en,cs-en"

path_2_data=$1 # <path to data>
lang_list=$2   # <path to a file which contains list of languages separated by new lines>
model=$3       # <path to a trained model>

# Direction to generate; defaults keep the original cs -> en behaviour.
# NOTE(review): presumably the chosen direction has to be one of the pairs in
# lang_pairs -- confirm against the fairseq multilingual task documentation.
source_lang=${4:-cs}
target_lang=${5:-en}

# NOTE(review): the language-token options (--encoder-langtok/--decoder-langtok)
# presumably need to match the settings the model was trained with -- confirm.
fairseq-generate "$path_2_data" \
  --path "$model" \
  --task translation_multi_simple_epoch \
  --gen-subset test \
  --source-lang "$source_lang" \
  --target-lang "$target_lang" \
  --sacrebleu --remove-bpe 'sentencepiece' \
  --batch-size 32 \
  --encoder-langtok "src" \
  --decoder-langtok \
  --lang-dict "$lang_list" \
  --lang-pairs "$lang_pairs"