fix: gptq marlin weight loading failure (#23066)

This commit is contained in:
Simon Mo
2025-08-17 15:56:07 -07:00
committed by GitHub
parent 21e39436c8
commit 0fc8fa751a

View File

@@ -56,7 +56,7 @@ def get_moe_quant_method(
# Dynamic per module/layer rules may override base config
override_config(cloned_config, prefix=prefix)
-return moe_method_cls(cloned_config)
+return moe_method_cls(cloned_config, layer.moe_config)
return None