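Fix head-mask tests: create head_mask/decoder_head_mask on torch_device and exclude decoder_head_mask from nn.DataParallel scattering (#9669)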

12c1b5b8 · Patrick von Platen · GitHub · 357fb1c5 · 12c1b5b8 · 12c1b5b8
Unverified commit 12c1b5b8, authored Jan 19, 2021 by Patrick von Platen; committed by GitHub on Jan 19, 2021.
7 changed files
--- a/tests/test_modeling_bart.py
+++ b/tests/test_modeling_bart.py
@@ -61,9 +61,9 @@ def prepare_bart_inputs_dict(
    if decoder_attention_mask is None:
        decoder_attention_mask = decoder_input_ids.ne(config.pad_token_id)
    if head_mask is None:
-        head_mask = torch.ones(config.encoder_layers, config.encoder_attention_heads)
+        head_mask = torch.ones(config.encoder_layers, config.encoder_attention_heads, device=torch_device)
    if decoder_head_mask is None:
-        decoder_head_mask = torch.ones(config.decoder_layers, config.decoder_attention_heads)
+        decoder_head_mask = torch.ones(config.decoder_layers, config.decoder_attention_heads, device=torch_device)
    return {
        "input_ids": input_ids,
        "decoder_input_ids": decoder_input_ids,

--- a/tests/test_modeling_blenderbot.py
+++ b/tests/test_modeling_blenderbot.py
@@ -48,9 +48,9 @@ def prepare_blenderbot_inputs_dict(
    if decoder_attention_mask is None:
        decoder_attention_mask = decoder_input_ids.ne(config.pad_token_id)
    if head_mask is None:
-        head_mask = torch.ones(config.encoder_layers, config.encoder_attention_heads)
+        head_mask = torch.ones(config.encoder_layers, config.encoder_attention_heads, device=torch_device)
    if decoder_head_mask is None:
-        decoder_head_mask = torch.ones(config.decoder_layers, config.decoder_attention_heads)
+        decoder_head_mask = torch.ones(config.decoder_layers, config.decoder_attention_heads, device=torch_device)
    return {
        "input_ids": input_ids,
        "decoder_input_ids": decoder_input_ids,

--- a/tests/test_modeling_blenderbot_small.py
+++ b/tests/test_modeling_blenderbot_small.py
@@ -56,9 +56,9 @@ def prepare_blenderbot_small_inputs_dict(
    if decoder_attention_mask is None:
        decoder_attention_mask = decoder_input_ids.ne(config.pad_token_id)
    if head_mask is None:
-        head_mask = torch.ones(config.encoder_layers, config.encoder_attention_heads)
+        head_mask = torch.ones(config.encoder_layers, config.encoder_attention_heads, device=torch_device)
    if decoder_head_mask is None:
-        decoder_head_mask = torch.ones(config.decoder_layers, config.decoder_attention_heads)
+        decoder_head_mask = torch.ones(config.decoder_layers, config.decoder_attention_heads, device=torch_device)
    return {
        "input_ids": input_ids,
        "decoder_input_ids": decoder_input_ids,

--- a/tests/test_modeling_common.py
+++ b/tests/test_modeling_common.py
@@ -1073,7 +1073,7 @@ class ModelTesterMixin:

        # some params shouldn't be scattered by nn.DataParallel
        # so just remove them if they are present.
-        blacklist_non_batched_params = ["head_mask"]
+        blacklist_non_batched_params = ["head_mask", "decoder_head_mask"]
        for k in blacklist_non_batched_params:
            inputs_dict.pop(k, None)


--- a/tests/test_modeling_marian.py
+++ b/tests/test_modeling_marian.py
@@ -62,9 +62,9 @@ def prepare_marian_inputs_dict(
    if decoder_attention_mask is None:
        decoder_attention_mask = decoder_input_ids.ne(config.pad_token_id)
    if head_mask is None:
-        head_mask = torch.ones(config.encoder_layers, config.encoder_attention_heads)
+        head_mask = torch.ones(config.encoder_layers, config.encoder_attention_heads, device=torch_device)
    if decoder_head_mask is None:
-        decoder_head_mask = torch.ones(config.decoder_layers, config.decoder_attention_heads)
+        decoder_head_mask = torch.ones(config.decoder_layers, config.decoder_attention_heads, device=torch_device)
    return {
        "input_ids": input_ids,
        "decoder_input_ids": decoder_input_ids,

--- a/tests/test_modeling_mbart.py
+++ b/tests/test_modeling_mbart.py
@@ -57,9 +57,9 @@ def prepare_mbart_inputs_dict(
    if decoder_attention_mask is None:
        decoder_attention_mask = decoder_input_ids.ne(config.pad_token_id)
    if head_mask is None:
-        head_mask = torch.ones(config.encoder_layers, config.encoder_attention_heads)
+        head_mask = torch.ones(config.encoder_layers, config.encoder_attention_heads, device=torch_device)
    if decoder_head_mask is None:
-        decoder_head_mask = torch.ones(config.decoder_layers, config.decoder_attention_heads)
+        decoder_head_mask = torch.ones(config.decoder_layers, config.decoder_attention_heads, device=torch_device)
    return {
        "input_ids": input_ids,
        "decoder_input_ids": decoder_input_ids,

--- a/tests/test_modeling_pegasus.py
+++ b/tests/test_modeling_pegasus.py
@@ -49,9 +49,9 @@ def prepare_pegasus_inputs_dict(
    if decoder_attention_mask is None:
        decoder_attention_mask = decoder_input_ids.ne(config.pad_token_id)
    if head_mask is None:
-        head_mask = torch.ones(config.encoder_layers, config.encoder_attention_heads)
+        head_mask = torch.ones(config.encoder_layers, config.encoder_attention_heads, device=torch_device)
    if decoder_head_mask is None:
-        decoder_head_mask = torch.ones(config.decoder_layers, config.decoder_attention_heads)
+        decoder_head_mask = torch.ones(config.decoder_layers, config.decoder_attention_heads, device=torch_device)
    return {
        "input_ids": input_ids,
        "decoder_input_ids": decoder_input_ids,