[Bugfix]: Fix is_embedding_layer condition in VocabParallelEmbedding (#15824)

Signed-off-by: alexwl <alexey.a.kiryushin@gmail.com>
2025-10-20 14:53:52 +08:00 · 2025-04-01 05:57:59 +00:00
parent e830b01383
commit 63d8eabed0
1 changed files with 1 additions and 1 deletions
--- a/vllm/model_executor/layers/vocab_parallel_embedding.py
+++ b/vllm/model_executor/layers/vocab_parallel_embedding.py
@@ -235,7 +235,7 @@ class VocabParallelEmbedding(torch.nn.Module):
        # If we are making an embedding layer, then our quantization linear
        # method must implement the embedding operation. If we are another
        # layer type like ParallelLMHead, this is not important.
-        is_embedding_layer = type(self.__class__) is VocabParallelEmbedding
+        is_embedding_layer = type(self) is VocabParallelEmbedding
        quant_method_implements_embedding = method_has_implemented_embedding(
            type(quant_method))
        if is_embedding_layer and not quant_method_implements_embedding: