Browse Source

Ignore missing qkv_proj.weight when loading a checkpoint

Max Ryabinin 1 year ago
parent
commit
4644131086
1 changed files with 1 additions and 0 deletions
  1. 1 0
      src/petals/server/from_pretrained.py

+ 1 - 0
src/petals/server/from_pretrained.py

@@ -65,6 +65,7 @@ def load_pretrained_block(
 
     # dummy load, check that keys match
     report = block.load_state_dict(state_dict, strict=False)
+    report.missing_keys.pop("self_attn.qkv_proj.weight", None) # will be filled later
     assert not report.missing_keys, f"Some block weights are missing: {report.missing_keys}"
 
     for param_name, _ in block.named_parameters():