Mirror of https://github.com/vllm-project/vllm.git (synced 2025-10-20 14:53:52 +08:00)
[rocm] enable torchao quantization for rocm (#24400)
Signed-off-by: Lifan Shen <lifans@meta.com>
This commit is contained in:
@@ -171,7 +171,7 @@ class RocmPlatform(Platform):
 
     supported_quantization: list[str] = [
         "awq", "gptq", "fp8", "compressed-tensors", "fbgemm_fp8", "gguf",
-        "quark", "ptpc_fp8", "mxfp4", "petit_nvfp4"
+        "quark", "ptpc_fp8", "mxfp4", "petit_nvfp4", "torchao"
     ]
 
     @classmethod
Reference in New Issue
Block a user