We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 21e3943 commit 0fc8fa7 (Copy full SHA for 0fc8fa7)
vllm/model_executor/layers/quantization/gptq_marlin.py
@@ -56,7 +56,7 @@ def get_moe_quant_method(
56
# Dynamic per module/layer rules may override base config
57
override_config(cloned_config, prefix=prefix)
58
59
- return moe_method_cls(cloned_config)
+ return moe_method_cls(cloned_config, layer.moe_config)
60
return None
61
62
0 commit comments