Merge pull request #19 from nat/patch-1

Strip unwanted prefix from state keys when loading model in sample.py
2025-11-08 19:23:02 +00:00 · 2023-01-04 16:46:32 -08:00
parent d562b3e550 2b9e168736
commit 529c967a65
1 changed files with 6 additions and 1 deletions
--- a/sample.py
+++ b/sample.py
@@ -29,7 +29,12 @@ ckpt_path = os.path.join(out_dir, 'ckpt.pt')
 checkpoint = torch.load(ckpt_path, map_location=device)
 gptconf = GPTConfig(**checkpoint['model_args'])
 model = GPT(gptconf)
-model.load_state_dict(checkpoint['model'])
+state_dict = checkpoint['model']
+unwanted_prefix = '_orig_mod.'
+for k,v in list(state_dict.items()):
+    if k.startswith(unwanted_prefix):
+        state_dict[k[len(unwanted_prefix):]] = state_dict.pop(k)
+model.load_state_dict(state_dict)
 model.eval()
 model.to(device)
 if compile: