File tree 2 files changed +2
-6
lines changed 2 files changed +2
-6
lines changed Original file line number Diff line number Diff line change 13
13
/vllm /model_executor /guided_decoding @ mgoin @ russellb
14
14
/vllm /multimodal @ DarkLight1337 @ ywang96
15
15
/vllm /vllm_flash_attn @ LucasWilkinson
16
+ /vllm /lora @ jeejeelee
16
17
CMakeLists.txt @ tlrmchlsmth
17
18
18
19
# vLLM V1
@@ -40,3 +41,4 @@ CMakeLists.txt @tlrmchlsmth
40
41
/tests /v1 /entrypoints /llm /test_struct_output_generate.py @ mgoin @ russellb
41
42
/tests /v1 /structured_output @ mgoin @ russellb
42
43
/tests /weight_loading @ mgoin @ youkaichao
44
+ /tests /lora @ jeejeelee
Original file line number Diff line number Diff line change 37
37
("yec019/fbopt-350m-8bit" , "read pre-quantized 8-bit opt model" ),
38
38
]
39
39
40
- models_pre_quant_8bit_to_test = [
41
- ('meta-llama/Llama-Guard-3-8B-INT8' ,
42
- 'read pre-quantized llama 8-bit model' ),
43
- ("yec019/fbopt-350m-8bit" , "read pre-quantized 8-bit opt model" ),
44
- ]
45
-
46
40
47
41
@pytest .mark .skipif (not is_quant_method_supported ("bitsandbytes" ),
48
42
reason = 'bitsandbytes is not supported on this GPU type.' )
You can’t perform that action at this time.
0 commit comments