fix xlm lang_embeddings loading

160b5d60 · thomwolf · 26497d11 · 160b5d60
Commit 160b5d60 authored Sep 18, 2019 by thomwolf
Show whitespace changes
Inline Side-by-side

Showing with 7 additions and 4 deletions

pytorch_transformers/modeling_tf_xlm.py pytorch_transformers/modeling_tf_xlm.py +7 -4

No files found.
--- a/pytorch_transformers/modeling_tf_xlm.py
+++ b/pytorch_transformers/modeling_tf_xlm.py
@@ -47,10 +47,13 @@ TF_XLM_PRETRAINED_MODEL_ARCHIVE_MAP = {
 def load_xlm_pt_weights_in_tf2(tf_model, pytorch_checkpoint_path):
    # build the network
-    inputs_list = [[7, 6, 0, 0, 1], [1, 2, 3, 0, 0], [0, 0, 0, 4, 5]]
+    inputs_list = tf.constant([[7, 6, 0, 0, 1], [1, 2, 3, 0, 0], [0, 0, 0, 4, 5]])
-    attns_list = [[1, 1, 0, 0, 1], [1, 1, 1, 0, 0], [1, 0, 0, 1, 1]]
+    attns_list = tf.constant([[1, 1, 0, 0, 1], [1, 1, 1, 0, 0], [1, 0, 0, 1, 1]])
-    langs_list = [[1, 1, 0, 0, 1], [1, 1, 1, 0, 0], [1, 0, 0, 1, 1]]
+    if tf_model.config.use_lang_emb and tf_model.config.n_langs > 1:
-    tf_inputs = [tf.constant(inputs_list), tf.constant(attns_list), tf.constant(langs_list)]
+        langs_list = tf.constant([[1, 1, 0, 0, 1], [1, 1, 1, 0, 0], [1, 0, 0, 1, 1]])
+    else:
+        langs_list = None
+    tf_inputs = [inputs_list, attns_list), langs_list]
    tfo = tf_model(tf_inputs, training=False)
    return load_pytorch_checkpoint_in_tf2_model(tf_model, pytorch_checkpoint_path, tf_inputs=tf_inputs)