@@ -94,7 +94,7 @@ def test_batching(
94
94
)
95
95
96
96
97
- @pytest .mark .parametrize ("model" , SSM_MODELS [0 : 1 ] + HYBRID_MODELS [0 : 2 ])
97
+ @pytest .mark .parametrize ("model" , [ SSM_MODELS [0 ], HYBRID_MODELS [0 ] ])
98
98
@pytest .mark .parametrize ("max_tokens" , [32 ])
99
99
@pytest .mark .parametrize ("num_logprobs" , [5 ])
100
100
@pytest .mark .parametrize ("chunked_prefill_token_size" , [1 , 4 , 16 ])
@@ -130,7 +130,7 @@ def test_chunked_prefill(
130
130
)
131
131
132
132
133
- @pytest .mark .parametrize ("model" , SSM_MODELS [0 : 1 ] + HYBRID_MODELS [0 : 2 ])
133
+ @pytest .mark .parametrize ("model" , [ SSM_MODELS [0 ], HYBRID_MODELS [0 ] ])
134
134
@pytest .mark .parametrize ("max_tokens" , [10 ])
135
135
def test_chunked_prefill_with_parallel_sampling (
136
136
vllm_runner ,
@@ -162,7 +162,7 @@ def test_chunked_prefill_with_parallel_sampling(
162
162
vllm_model .generate (example_prompts , sampling_params )
163
163
164
164
165
- @pytest .mark .parametrize ("model" , SSM_MODELS [0 : 1 ] + HYBRID_MODELS [0 : 2 ])
165
+ @pytest .mark .parametrize ("model" , [ SSM_MODELS [0 ], HYBRID_MODELS [0 ] ])
166
166
@pytest .mark .parametrize ("max_tokens" , [20 ])
167
167
def test_mamba_cache_cg_padding (
168
168
vllm_runner ,
@@ -191,7 +191,7 @@ def test_mamba_cache_cg_padding(
191
191
"Could be related to mamba cache not padded correctly" )
192
192
193
193
194
- @pytest .mark .parametrize ("model" , SSM_MODELS [0 : 1 ] + HYBRID_MODELS [0 : 2 ])
194
+ @pytest .mark .parametrize ("model" , [ SSM_MODELS [0 ], HYBRID_MODELS [0 ] ])
195
195
@pytest .mark .parametrize ("max_tokens" , [20 ])
196
196
def test_models_preemption_recompute (
197
197
vllm_runner ,
@@ -219,7 +219,7 @@ def test_models_preemption_recompute(
219
219
)
220
220
221
221
222
- @pytest .mark .parametrize ("model" , SSM_MODELS [0 : 1 ] + HYBRID_MODELS [0 : 2 ])
222
+ @pytest .mark .parametrize ("model" , [ SSM_MODELS [0 ], HYBRID_MODELS [0 ] ])
223
223
def test_fail_upon_inc_requests_and_finished_requests_lt_available_blocks (
224
224
vllm_runner ,
225
225
example_prompts ,
@@ -242,7 +242,7 @@ def test_fail_upon_inc_requests_and_finished_requests_lt_available_blocks(
242
242
"steps finished requests registered unnecessarily " )
243
243
244
244
245
- @pytest .mark .parametrize ("model" , SSM_MODELS [0 : 1 ] + HYBRID_MODELS [0 : 2 ])
245
+ @pytest .mark .parametrize ("model" , [ SSM_MODELS [0 ], HYBRID_MODELS [0 ] ])
246
246
def test_state_cleanup (
247
247
vllm_runner ,
248
248
example_prompts ,
@@ -263,7 +263,7 @@ def test_state_cleanup(
263
263
"could be related to finished_requests_ids" )
264
264
265
265
266
- @pytest .mark .parametrize ("model" , SSM_MODELS [0 : 1 ] + HYBRID_MODELS [0 : 2 ])
266
+ @pytest .mark .parametrize ("model" , [ SSM_MODELS [0 ], HYBRID_MODELS [0 ] ])
267
267
@pytest .mark .parametrize ("max_tokens" , [64 ])
268
268
def test_multistep_correctness (
269
269
vllm_runner ,
@@ -290,7 +290,7 @@ def test_multistep_correctness(
290
290
291
291
292
292
@multi_gpu_test (num_gpus = 2 )
293
- @pytest .mark .parametrize ("model" , SSM_MODELS [0 : 1 ] + HYBRID_MODELS [0 : 2 ])
293
+ @pytest .mark .parametrize ("model" , [ SSM_MODELS [0 ], HYBRID_MODELS [0 ] ])
294
294
@pytest .mark .parametrize ("max_tokens" , [64 ])
295
295
def test_hybrid_distributed_produces_identical_generation (
296
296
vllm_runner ,
0 commit comments