Unverified commit 134caef3, authored by Matt, committed by GitHub
Browse files

Speed up TF tests by reducing hidden layer counts (#24595)

* hidden layers, huh, what are they good for (absolutely nothing)

* Some tests break with 1 hidden layer, use 2

* Use 1 hidden layer in a few slow models

* Use num_hidden_layers=2 everywhere

* Slightly higher tol for groupvit

* Slightly higher tol for groupvit
parent 3441ad7d
...@@ -56,7 +56,7 @@ class TFAlbertModelTester: ...@@ -56,7 +56,7 @@ class TFAlbertModelTester:
vocab_size=99, vocab_size=99,
embedding_size=16, embedding_size=16,
hidden_size=32, hidden_size=32,
num_hidden_layers=5, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
hidden_act="gelu", hidden_act="gelu",
...@@ -80,7 +80,7 @@ class TFAlbertModelTester: ...@@ -80,7 +80,7 @@ class TFAlbertModelTester:
self.vocab_size = 99 self.vocab_size = 99
self.embedding_size = 16 self.embedding_size = 16
self.hidden_size = 32 self.hidden_size = 32
self.num_hidden_layers = 5 self.num_hidden_layers = 2
self.num_attention_heads = 4 self.num_attention_heads = 4
self.intermediate_size = 37 self.intermediate_size = 37
self.hidden_act = "gelu" self.hidden_act = "gelu"
......
...@@ -52,7 +52,7 @@ class TFBartModelTester: ...@@ -52,7 +52,7 @@ class TFBartModelTester:
use_labels=False, use_labels=False,
vocab_size=99, vocab_size=99,
hidden_size=32, hidden_size=32,
num_hidden_layers=5, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
hidden_dropout_prob=0.1, hidden_dropout_prob=0.1,
......
...@@ -57,7 +57,7 @@ class TFBertModelTester: ...@@ -57,7 +57,7 @@ class TFBertModelTester:
use_labels=True, use_labels=True,
vocab_size=99, vocab_size=99,
hidden_size=32, hidden_size=32,
num_hidden_layers=5, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
hidden_act="gelu", hidden_act="gelu",
...@@ -80,7 +80,7 @@ class TFBertModelTester: ...@@ -80,7 +80,7 @@ class TFBertModelTester:
self.use_labels = True self.use_labels = True
self.vocab_size = 99 self.vocab_size = 99
self.hidden_size = 32 self.hidden_size = 32
self.num_hidden_layers = 5 self.num_hidden_layers = 2
self.num_attention_heads = 4 self.num_attention_heads = 4
self.intermediate_size = 37 self.intermediate_size = 37
self.hidden_act = "gelu" self.hidden_act = "gelu"
......
...@@ -48,7 +48,7 @@ class TFBlenderbotModelTester: ...@@ -48,7 +48,7 @@ class TFBlenderbotModelTester:
use_labels=False, use_labels=False,
vocab_size=99, vocab_size=99,
hidden_size=32, hidden_size=32,
num_hidden_layers=5, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
hidden_dropout_prob=0.1, hidden_dropout_prob=0.1,
......
...@@ -48,7 +48,7 @@ class TFBlenderbotSmallModelTester: ...@@ -48,7 +48,7 @@ class TFBlenderbotSmallModelTester:
use_labels=False, use_labels=False,
vocab_size=99, vocab_size=99,
hidden_size=32, hidden_size=32,
num_hidden_layers=5, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
hidden_dropout_prob=0.1, hidden_dropout_prob=0.1,
......
...@@ -64,7 +64,7 @@ class TFBlipVisionModelTester: ...@@ -64,7 +64,7 @@ class TFBlipVisionModelTester:
is_training=True, is_training=True,
hidden_size=32, hidden_size=32,
projection_dim=32, projection_dim=32,
num_hidden_layers=5, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
dropout=0.1, dropout=0.1,
...@@ -207,7 +207,7 @@ class TFBlipTextModelTester: ...@@ -207,7 +207,7 @@ class TFBlipTextModelTester:
vocab_size=99, vocab_size=99,
hidden_size=32, hidden_size=32,
projection_dim=32, projection_dim=32,
num_hidden_layers=5, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
dropout=0.1, dropout=0.1,
......
...@@ -46,7 +46,7 @@ class BlipTextModelTester: ...@@ -46,7 +46,7 @@ class BlipTextModelTester:
vocab_size=99, vocab_size=99,
hidden_size=32, hidden_size=32,
projection_dim=32, projection_dim=32,
num_hidden_layers=5, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
dropout=0.1, dropout=0.1,
......
...@@ -57,7 +57,7 @@ class TFCLIPVisionModelTester: ...@@ -57,7 +57,7 @@ class TFCLIPVisionModelTester:
num_channels=3, num_channels=3,
is_training=True, is_training=True,
hidden_size=32, hidden_size=32,
num_hidden_layers=5, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
dropout=0.1, dropout=0.1,
...@@ -328,7 +328,7 @@ class TFCLIPTextModelTester: ...@@ -328,7 +328,7 @@ class TFCLIPTextModelTester:
use_labels=True, use_labels=True,
vocab_size=99, vocab_size=99,
hidden_size=32, hidden_size=32,
num_hidden_layers=5, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
dropout=0.1, dropout=0.1,
......
...@@ -51,7 +51,7 @@ class TFConvBertModelTester: ...@@ -51,7 +51,7 @@ class TFConvBertModelTester:
use_labels=True, use_labels=True,
vocab_size=99, vocab_size=99,
hidden_size=32, hidden_size=32,
num_hidden_layers=5, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
hidden_act="gelu", hidden_act="gelu",
...@@ -74,7 +74,7 @@ class TFConvBertModelTester: ...@@ -74,7 +74,7 @@ class TFConvBertModelTester:
self.use_labels = True self.use_labels = True
self.vocab_size = 99 self.vocab_size = 99
self.hidden_size = 384 self.hidden_size = 384
self.num_hidden_layers = 5 self.num_hidden_layers = 2
self.num_attention_heads = 4 self.num_attention_heads = 4
self.intermediate_size = 37 self.intermediate_size = 37
self.hidden_act = "gelu" self.hidden_act = "gelu"
......
...@@ -52,7 +52,7 @@ class TFCTRLModelTester(object): ...@@ -52,7 +52,7 @@ class TFCTRLModelTester(object):
self.use_mc_token_ids = True self.use_mc_token_ids = True
self.vocab_size = 99 self.vocab_size = 99
self.hidden_size = 32 self.hidden_size = 32
self.num_hidden_layers = 5 self.num_hidden_layers = 2
self.num_attention_heads = 4 self.num_attention_heads = 4
self.intermediate_size = 37 self.intermediate_size = 37
self.hidden_act = "gelu" self.hidden_act = "gelu"
......
...@@ -61,7 +61,7 @@ class TFData2VecVisionModelTester: ...@@ -61,7 +61,7 @@ class TFData2VecVisionModelTester:
is_training=True, is_training=True,
use_labels=True, use_labels=True,
hidden_size=32, hidden_size=32,
num_hidden_layers=4, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
hidden_act="gelu", hidden_act="gelu",
......
...@@ -50,7 +50,7 @@ class TFDebertaModelTester: ...@@ -50,7 +50,7 @@ class TFDebertaModelTester:
use_labels=True, use_labels=True,
vocab_size=99, vocab_size=99,
hidden_size=32, hidden_size=32,
num_hidden_layers=5, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
hidden_act="gelu", hidden_act="gelu",
...@@ -73,7 +73,7 @@ class TFDebertaModelTester: ...@@ -73,7 +73,7 @@ class TFDebertaModelTester:
self.use_labels = True self.use_labels = True
self.vocab_size = 99 self.vocab_size = 99
self.hidden_size = 32 self.hidden_size = 32
self.num_hidden_layers = 5 self.num_hidden_layers = 2
self.num_attention_heads = 4 self.num_attention_heads = 4
self.intermediate_size = 37 self.intermediate_size = 37
self.hidden_act = "gelu" self.hidden_act = "gelu"
......
...@@ -50,7 +50,7 @@ class TFDebertaV2ModelTester: ...@@ -50,7 +50,7 @@ class TFDebertaV2ModelTester:
use_labels=True, use_labels=True,
vocab_size=99, vocab_size=99,
hidden_size=32, hidden_size=32,
num_hidden_layers=5, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
hidden_act="gelu", hidden_act="gelu",
......
...@@ -60,7 +60,7 @@ class TFDeiTModelTester: ...@@ -60,7 +60,7 @@ class TFDeiTModelTester:
is_training=True, is_training=True,
use_labels=True, use_labels=True,
hidden_size=32, hidden_size=32,
num_hidden_layers=5, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
hidden_act="gelu", hidden_act="gelu",
......
...@@ -54,7 +54,7 @@ class TFDistilBertModelTester: ...@@ -54,7 +54,7 @@ class TFDistilBertModelTester:
self.use_labels = True self.use_labels = True
self.vocab_size = 99 self.vocab_size = 99
self.hidden_size = 32 self.hidden_size = 32
self.num_hidden_layers = 5 self.num_hidden_layers = 2
self.num_attention_heads = 4 self.num_attention_heads = 4
self.intermediate_size = 37 self.intermediate_size = 37
self.hidden_act = "gelu" self.hidden_act = "gelu"
......
...@@ -53,7 +53,7 @@ class TFDPRModelTester: ...@@ -53,7 +53,7 @@ class TFDPRModelTester:
use_labels=True, use_labels=True,
vocab_size=99, vocab_size=99,
hidden_size=32, hidden_size=32,
num_hidden_layers=5, num_hidden_layers=2,
num_attention_heads=4, num_attention_heads=4,
intermediate_size=37, intermediate_size=37,
hidden_act="gelu", hidden_act="gelu",
......
...@@ -54,7 +54,7 @@ class TFElectraModelTester: ...@@ -54,7 +54,7 @@ class TFElectraModelTester:
self.use_labels = True self.use_labels = True
self.vocab_size = 99 self.vocab_size = 99
self.hidden_size = 32 self.hidden_size = 32
self.num_hidden_layers = 5 self.num_hidden_layers = 2
self.num_attention_heads = 4 self.num_attention_heads = 4
self.intermediate_size = 37 self.intermediate_size = 37
self.hidden_act = "gelu" self.hidden_act = "gelu"
......
...@@ -53,7 +53,7 @@ class TFEsmModelTester: ...@@ -53,7 +53,7 @@ class TFEsmModelTester:
self.use_labels = True self.use_labels = True
self.vocab_size = 99 self.vocab_size = 99
self.hidden_size = 32 self.hidden_size = 32
self.num_hidden_layers = 5 self.num_hidden_layers = 2
self.num_attention_heads = 4 self.num_attention_heads = 4
self.intermediate_size = 37 self.intermediate_size = 37
self.hidden_act = "gelu" self.hidden_act = "gelu"
......
...@@ -61,7 +61,7 @@ class TFFlaubertModelTester: ...@@ -61,7 +61,7 @@ class TFFlaubertModelTester:
self.vocab_size = 99 self.vocab_size = 99
self.n_special = 0 self.n_special = 0
self.hidden_size = 32 self.hidden_size = 32
self.num_hidden_layers = 5 self.num_hidden_layers = 2
self.num_attention_heads = 4 self.num_attention_heads = 4
self.hidden_dropout_prob = 0.1 self.hidden_dropout_prob = 0.1
self.attention_probs_dropout_prob = 0.1 self.attention_probs_dropout_prob = 0.1
......
...@@ -55,7 +55,7 @@ class TFGPT2ModelTester: ...@@ -55,7 +55,7 @@ class TFGPT2ModelTester:
self.use_mc_token_ids = True self.use_mc_token_ids = True
self.vocab_size = 99 self.vocab_size = 99
self.hidden_size = 32 self.hidden_size = 32
self.num_hidden_layers = 5 self.num_hidden_layers = 2
self.num_attention_heads = 4 self.num_attention_heads = 4
self.intermediate_size = 37 self.intermediate_size = 37
self.hidden_act = "gelu" self.hidden_act = "gelu"
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment