expand coverage of gpt2 model loading (#271)
twaka authored Jun 27, 2023
1 parent 43710e8 commit 4026a04
1 changed file: vllm/model_executor/models/gpt2.py (4 additions, 2 deletions)
@@ -228,11 +228,13 @@ def load_weights(self, model_name_or_path: str,
                 # GPT-2 ties the weights of the embedding layer and the final
                 # linear layer.
                 continue
-            if ".attn.bias" in name:
+            if ".attn.bias" in name or ".attn.masked_bias" in name:
                 # Skip attention mask.
                 # NOTE: "c_attn.bias" should not be skipped.
                 continue
-            name = "transformer." + name
+
+            if not name.startswith("transformer."):
+                name = "transformer." + name
+
             # The HF's GPT-2 implementation uses Conv1D instead of Linear.
             # Because of this, we need to transpose the weights.
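For context, the checkpoint-name handling that this commit extends can be sketched as a standalone function. This is a minimal illustration of the diff's logic, not vLLM's actual code: the helper name `normalize_gpt2_name` is hypothetical, and in vLLM this logic is inlined inside the model's `load_weights` loop.

```python
def normalize_gpt2_name(name: str):
    """Map an HF GPT-2 checkpoint parameter name to the internal name,
    or return None when the parameter should be skipped entirely.
    Hypothetical helper illustrating the diff above."""
    if "lm_head.weight" in name:
        # GPT-2 ties the embedding and final linear layer weights,
        # so the lm_head copy is redundant.
        return None
    if ".attn.bias" in name or ".attn.masked_bias" in name:
        # Skip the causal attention-mask buffers. Note the leading dot:
        # "c_attn.bias" is a real parameter (underscore, not dot, before
        # "attn") and must not be skipped.
        return None
    if not name.startswith("transformer."):
        # Some checkpoints already carry the "transformer." prefix;
        # only prepend it when it is missing (the point of this commit).
        name = "transformer." + name
    return name
```

The `startswith` guard is what the commit adds: before it, names that already began with `transformer.` would have been double-prefixed and failed to match any model parameter.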