We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 172d1cd, commit c5d5535 (Copy full SHA for c5d5535)
vllm/model_executor/layers/quantization/kernels/marlin.py
@@ -38,10 +38,11 @@ def can_implement(cls,
38
"Marlin, supported group sizes are: "\
39
f"{MARLIN_SUPPORTED_GROUP_SIZES}"
40
41
- return check_marlin_supports_shape(c.partition_weight_shape[0],
42
- c.partition_weight_shape[1],
43
- c.full_weight_shape[1],
44
- c.group_size)
+ return check_marlin_supports_shape(
+ c.partition_weight_shape[1], # out_features
+ c.partition_weight_shape[0], # in_features
+ c.full_weight_shape[0], # in_features
45
+ c.group_size)
46
47
# note assumes that
48
# `weight_packed` is: {input_dim = 0, output_dim = 1, packed_dim = 0}
0 commit comments