File tree Expand file tree Collapse file tree 2 files changed +3
-54
lines changed
tests/models/decoder_only/language Expand file tree Collapse file tree 2 files changed +3
-54
lines changed Original file line number Diff line number Diff line change 17
17
"EleutherAI/gpt-j-6b" ,
18
18
# "mosaicml/mpt-7b", # Broken
19
19
# "Qwen/Qwen1.5-0.5B" # Broken,
20
+ "openbmb/MiniCPM3-4B" ,
20
21
]
21
22
22
23
#TODO: remove this after CPU float16 support ready
@@ -39,7 +40,7 @@ def test_models(
39
40
with hf_runner (model , dtype = dtype ) as hf_model :
40
41
hf_outputs = hf_model .generate_greedy (example_prompts , max_tokens )
41
42
42
- with vllm_runner (model , dtype = dtype ) as vllm_model :
43
+ with vllm_runner (model , dtype = dtype , enforce_eager = True ) as vllm_model :
43
44
vllm_outputs = vllm_model .generate_greedy (example_prompts , max_tokens )
44
45
45
46
check_outputs_equal (
@@ -57,7 +58,7 @@ def test_model_print(
57
58
model : str ,
58
59
dtype : str ,
59
60
) -> None :
60
- with vllm_runner (model , dtype = dtype ) as vllm_model :
61
+ with vllm_runner (model , dtype = dtype , enforce_eager = True ) as vllm_model :
61
62
# This test is for verifying whether the model's extra_repr
62
63
# can be printed correctly.
63
64
print (vllm_model .model .llm_engine .model_executor .driver_worker .
Load Diff This file was deleted.
You can’t perform that action at this time.
0 commit comments