[ROCm][Bugfix] Only enable +rms_norm based on aiter if not explicitly disabled (#25275)

Signed-off-by: Gregory Shtrasberg <Gregory.Shtrasberg@amd.com>
This commit is contained in:
Gregory Shtrasberg
2025-09-24 11:24:39 -04:00
committed by GitHub
parent 9313be5017
commit 487745ff49

View File

@@ -340,7 +340,8 @@ class RocmPlatform(Platform):
else:
parallel_config.worker_cls = "vllm.worker.worker.Worker"
# Aiter rms norm perform best when CUDA Graph capture is enabled.
-if use_v1 and use_aiter_rms_norm and not is_eager_execution:
+if (use_v1 and use_aiter_rms_norm and not is_eager_execution
+and "-rms_norm" not in compilation_config.custom_ops):
compilation_config.custom_ops.append("+rms_norm")
@classmethod