Commit efa4a6cf, authored by Justas Zemgulys, committed by drpngx
Browse files

Fix vocabulary naming (input/output vocabulary no longer has same name) (#946)

parent 5723fcca
@@ -300,8 +300,8 @@ def prepare_data(data_dir, from_train_path, to_train_path, from_dev_path, to_dev
 (6) path to the "to language" vocabulary file.
 """
 # Create vocabularies of the appropriate sizes.
-to_vocab_path = os.path.join(data_dir, "vocab%d" % to_vocabulary_size)
-from_vocab_path = os.path.join(data_dir, "vocab%d" % from_vocabulary_size)
+to_vocab_path = os.path.join(data_dir, "vocab%d.to" % to_vocabulary_size)
+from_vocab_path = os.path.join(data_dir, "vocab%d.from" % from_vocabulary_size)
 create_vocabulary(to_vocab_path, to_train_path , to_vocabulary_size, tokenizer)
 create_vocabulary(from_vocab_path, from_train_path , from_vocabulary_size, tokenizer)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment.