diff --git a/tests/test_model.py b/tests/test_model.py index 2ddaec0576..df1c9ab0b0 100644 --- a/tests/test_model.py +++ b/tests/test_model.py @@ -645,6 +645,7 @@ def test_against_olmo2(model_name, device, dtype): n_layer=2, n_head=8, n_embd=32, + n_query_groups=2, intermediate_size=86, ) T = 5