Clean up the PT <=> TF conversion a little bit

f8fb4335 · thomwolf · bebaa140 · f8fb4335 · f8fb4335
Commit f8fb4335 authored Dec 05, 2019 by thomwolf
Show whitespace changes
Inline Side-by-side

Showing with 7 additions and 5 deletions

transformers/convert_pytorch_checkpoint_to_tf2.py transformers/convert_pytorch_checkpoint_to_tf2.py +5 -4

transformers/modeling_utils.py transformers/modeling_utils.py +2 -1

No files found.
--- a/transformers/convert_pytorch_checkpoint_to_tf2.py
+++ b/transformers/convert_pytorch_checkpoint_to_tf2.py
@@ -119,10 +119,11 @@ def convert_pt_checkpoint_to_tf(model_type, pytorch_checkpoint_path, config_file
        tf_inputs = tf.constant(inputs_list)
        tfo = tf_model(tf_inputs, training=False)  # build the network
-        pt_model = pt_model_class.from_pretrained(None,
+        pt_model = pt_model_class(config)
-                                                  config=config,
+        pt_model.load_state_dict(torch.load(pytorch_checkpoint_path, map_location='cpu'),
-                                                  state_dict=torch.load(pytorch_checkpoint_path,
+                                 strict=False)
-                                                                        map_location='cpu'))
+        pt_model.eval()
        pt_inputs = torch.tensor(inputs_list)
        with torch.no_grad():
            pto = pt_model(pt_inputs)

--- a/transformers/modeling_utils.py
+++ b/transformers/modeling_utils.py
@@ -318,7 +318,8 @@ class PreTrainedModel(nn.Module):
            model = BertModel.from_pretrained('./tf_model/my_tf_checkpoint.ckpt.index', from_tf=True, config=config)
        """
-        if "albert" in pretrained_model_name_or_path and "v2" in pretrained_model_name_or_path:
+        if pretrained_model_name_or_path is not None and (
+                "albert" in pretrained_model_name_or_path and "v2" in pretrained_model_name_or_path):
            logger.warning("There is currently an upstream reproducibility issue with ALBERT v2 models. Please see " +
                           "https://github.com/google-research/google-research/issues/119 for more information.")