Fixed the issue where strings converted from tensors had no spaces between tokens

Summary: Pull Request resolved: https://github.com/pytorch/fairseq/pull/548 Differential Revision: D14286021 Pulled By: myleott fbshipit-source-id: 7c725304185e63787220371a812ec860e178872c

Fixed the issue where strings converted from tensors had no spaces between tokens
Summary: Pull Request resolved: https://github.com/pytorch/fairseq/pull/548 Differential Revision: D14286021 Pulled By: myleott fbshipit-source-id: 7c725304185e63787220371a812ec860e178872c
88bf8b56 · James King · Facebook Github Bot · 66262a38 · 88bf8b56 · 88bf8b56
Commit 88bf8b56 authored Mar 01, 2019 by James King Committed by Facebook Github Bot Mar 01, 2019
Hide whitespace changes
Inline Side-by-side

Showing with 2 additions and 2 deletions

fairseq/data/data_utils.py fairseq/data/data_utils.py +1 -1

fairseq/data/dictionary.py fairseq/data/dictionary.py +1 -1

No files found.
--- a/fairseq/data/data_utils.py
+++ b/fairseq/data/data_utils.py
@@ -176,7 +176,7 @@ def batch_by_size(

 def process_bpe_symbol(sentence: str, bpe_symbol: str):
    if bpe_symbol == 'sentencepiece':
-        sentence = sentence.replace('\u2581', ' ').strip()
+        sentence = sentence.replace(' ','').replace('\u2581', ' ').strip()
    elif bpe_symbol is not None:
        sentence = (sentence + ' ').replace(bpe_symbol, '').rstrip()
    return sentence
--- a/fairseq/data/dictionary.py
+++ b/fairseq/data/dictionary.py
@@ -62,7 +62,7 @@ class Dictionary(object):
            else:
                return self[i]

-        sent = ''.join(token_string(i) for i in tensor if i != self.eos())
+        sent = ' '.join(token_string(i) for i in tensor if i != self.eos())
        return data_utils.process_bpe_symbol(sent, bpe_symbol)

    def unk_string(self, escape=False):