mirror of https://github.com/vllm-project/vllm.git
[Llama4] Update attn_temperature_tuning (#19997)
Signed-off-by: Brayden Zhong <b8zhong@uwaterloo.ca>
@@ -148,9 +148,8 @@ class Llama4Attention(nn.Module):
         self.q_size = self.num_heads * self.head_dim
         self.kv_size = self.num_kv_heads * self.head_dim
         self.scaling = self.head_dim**-0.5
-        # TODO: attn_temperature_tuning should be a bool in huggingface
         self.attn_temperature_tuning = self.nope and \
-            config.attn_temperature_tuning > 0
+            config.attn_temperature_tuning

         self.floor_scale = getattr(config, "floor_scale", 8192.0)
         self.attn_scale = getattr(config, "attn_scale", 0.1)