Skip to content

Commit 46ea7e6

Browse files
authored
[testing] test num_hidden_layers being small in model tester (#40992)
fix

Co-authored-by: ydshieh <ydshieh@users.noreply.github.com>
1 parent ebdc17b commit 46ea7e6

32 files changed

+74 -35 lines changed (74 additions, 35 deletions)

tests/models/aya_vision/test_modeling_aya_vision.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -71,7 +71,7 @@ def __init__(
7171
"vocab_size": 99,
7272
"hidden_size": 128,
7373
"intermediate_size": 37,
74-
"num_hidden_layers": 4,
74+
"num_hidden_layers": 2,
7575
"num_attention_heads": 4,
7676
"output_channels": 64,
7777
"hidden_act": "silu",

tests/models/bamba/test_modeling_bamba.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -73,7 +73,7 @@ def __init__(
7373
use_labels=True,
7474
vocab_size=99,
7575
hidden_size=32,
76-
num_hidden_layers=4,
76+
num_hidden_layers=2,
7777
num_attention_heads=4,
7878
num_key_value_heads=2,
7979
intermediate_size=64,

tests/models/bitnet/test_modeling_bitnet.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -49,7 +49,7 @@ def __init__(
4949
use_input_mask=True,
5050
vocab_size=99,
5151
hidden_size=64,
52-
num_hidden_layers=5,
52+
num_hidden_layers=2,
5353
num_attention_heads=4,
5454
num_key_value_heads=2,
5555
intermediate_size=37,

tests/models/bros/test_modeling_bros.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -49,7 +49,7 @@ def __init__(
4949
use_labels=True,
5050
vocab_size=99,
5151
hidden_size=64,
52-
num_hidden_layers=5,
52+
num_hidden_layers=2,
5353
num_attention_heads=4,
5454
intermediate_size=37,
5555
hidden_act="gelu",

tests/models/cohere/test_modeling_cohere.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -54,7 +54,7 @@ def __init__(
5454
use_labels=True,
5555
vocab_size=99,
5656
hidden_size=32,
57-
num_hidden_layers=4,
57+
num_hidden_layers=2,
5858
num_attention_heads=4,
5959
intermediate_size=37,
6060
hidden_act="gelu",

tests/models/cohere2_vision/test_modeling_cohere2_vision.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -65,7 +65,7 @@ def __init__(
6565
"vocab_size": 99,
6666
"hidden_size": 128,
6767
"intermediate_size": 37,
68-
"num_hidden_layers": 4,
68+
"num_hidden_layers": 2,
6969
"num_attention_heads": 4,
7070
"output_channels": 64,
7171
"hidden_act": "silu",

tests/models/deepseek_v3/test_modeling_deepseek_v3.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -65,7 +65,7 @@ def __init__(
6565
hidden_size=32,
6666
intermediate_size=37,
6767
moe_intermediate_size=12,
68-
num_hidden_layers=5,
68+
num_hidden_layers=2,
6969
num_attention_heads=4,
7070
num_key_value_heads=4,
7171
n_shared_experts=1,

tests/models/eomt/test_modeling_eomt.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -47,7 +47,7 @@ def __init__(
4747
num_labels=4,
4848
hidden_size=8,
4949
num_attention_heads=2,
50-
num_hidden_layers=4,
50+
num_hidden_layers=2,
5151
):
5252
self.parent = parent
5353
self.batch_size = batch_size

tests/models/falcon/test_modeling_falcon.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -208,7 +208,7 @@ def test_falcon_alibi_sdpa_matches_eager(self):
208208
config = FalconConfig(
209209
vocab_size=1000,
210210
hidden_size=64,
211-
num_hidden_layers=3,
211+
num_hidden_layers=2,
212212
num_attention_heads=4,
213213
new_decoder_architecture=True,
214214
alibi=True,

tests/models/falcon_h1/test_modeling_falcon_h1.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -55,7 +55,7 @@ def __init__(
5555
use_labels=True,
5656
vocab_size=99,
5757
hidden_size=32,
58-
num_hidden_layers=4,
58+
num_hidden_layers=2,
5959
num_attention_heads=4,
6060
num_key_value_heads=2,
6161
intermediate_size=64,

0 commit comments

Comments
 (0)