1
0
mirror of https://github.com/osmarks/nanogpt-experiments.git synced 2024-11-11 04:19:57 +00:00

rename compile_model to compile, shorter, version 2 stragglers

This commit is contained in:
Andrej Karpathy 2023-01-02 01:15:55 +00:00
parent 35f51974c4
commit 41184a27f5
2 changed files with 3 additions and 3 deletions

View File

@@ -15,7 +15,7 @@ torch.manual_seed(1337)
batch_size = 8 batch_size = 8
block_size = 1024 block_size = 1024
dtype = torch.bfloat16 dtype = torch.bfloat16
compile_model = True compile = True
# data loading init # data loading init
real_data = True real_data = True
@@ -47,7 +47,7 @@ model.to(device)
optimizer = model.configure_optimizers(weight_decay=1e-2, learning_rate=1e-4, betas=(0.9, 0.95)) optimizer = model.configure_optimizers(weight_decay=1e-2, learning_rate=1e-4, betas=(0.9, 0.95))
if compile_model: if compile:
print("Compiling model...") print("Compiling model...")
model = torch.compile(model) # pytorch 2.0 model = torch.compile(model) # pytorch 2.0

View File

@@ -5,7 +5,7 @@ eval_interval = 200
wandb_log = False # feel free to turn on wandb_log = False # feel free to turn on
wandb_project = 'shakespeare' wandb_project = 'shakespeare'
wandb_run_name = 'ft-' + str(time.time()) wandb_run_name = 'ft-' + str(time.time())
compile_model = False # takes too little time to finetune, not worth it compile = False # takes too little time to finetune, not worth it
# save a nice and overfit checkpoint that # save a nice and overfit checkpoint that
# will only speak Shakespeare and forgets # will only speak Shakespeare and forgets