mirror of
https://github.com/vllm-project/vllm.git
synced 2025-10-20 14:53:52 +08:00
[ROCm][Bugfix] Only enable +rms_norm based on aiter if not explicitly disabled (#25275)
Signed-off-by: Gregory Shtrasberg <Gregory.Shtrasberg@amd.com>
This commit is contained in:
committed by
GitHub
parent
9313be5017
commit
487745ff49
@@ -340,7 +340,8 @@ class RocmPlatform(Platform):
|
||||
else:
|
||||
parallel_config.worker_cls = "vllm.worker.worker.Worker"
|
||||
# Aiter rms norm performs best when CUDA Graph capture is enabled.
|
||||
if use_v1 and use_aiter_rms_norm and not is_eager_execution:
|
||||
if (use_v1 and use_aiter_rms_norm and not is_eager_execution
|
||||
and "-rms_norm" not in compilation_config.custom_ops):
|
||||
compilation_config.custom_ops.append("+rms_norm")
|
||||
|
||||
@classmethod
|
||||
|
Reference in New Issue
Block a user