Refine comments for the Gemma lm_head weight-loading error fix

vllm-project · Mar 21, 2024 · 8c2b7b4
1 parent 959ceb9
commit 8c2b7b4
Showing 1 changed file with 2 additions and 3 deletions.
diff --git a/vllm/model_executor/models/gemma.py b/vllm/model_executor/models/gemma.py
@@ -340,9 +340,8 @@ def load_weights(self,
                 weight_loader(param, loaded_weight, shard_id)
                 break
             else:
-                # lm_head is not used in vllm as it is tied weight with embed_token.
-                # Sometimes duplicate lm_head layers are added when the structure of the model is newly created by quantization, LORA, etc.
-                # To avoid the error that occurs, skip loading lm_head.weight.
+                # lm_head is not used in vllm as it is tied with embed_token.
+                # To prevent errors, skip loading lm_head.weight.
                 if "lm_head.weight" in name:
                     continue
                 # Skip loading extra bias for GPTQ models.