mirror of
https://github.com/osmarks/nanogpt-experiments.git
synced 2024-12-18 14:10:28 +00:00
rename compile_model to compile, shorter, version 2 stragglers
This commit is contained in:
parent
35f51974c4
commit
41184a27f5
4
bench.py
4
bench.py
@@ -15,7 +15,7 @@ torch.manual_seed(1337)
|
||||
batch_size = 8
|
||||
block_size = 1024
|
||||
dtype = torch.bfloat16
|
||||
compile_model = True
|
||||
compile = True
|
||||
|
||||
# data loading init
|
||||
real_data = True
|
||||
@@ -47,7 +47,7 @@ model.to(device)
|
||||
|
||||
optimizer = model.configure_optimizers(weight_decay=1e-2, learning_rate=1e-4, betas=(0.9, 0.95))
|
||||
|
||||
if compile_model:
|
||||
if compile:
|
||||
print("Compiling model...")
|
||||
model = torch.compile(model) # pytorch 2.0
|
||||
|
||||
|
@@ -5,7 +5,7 @@ eval_interval = 200
|
||||
wandb_log = False # feel free to turn on
|
||||
wandb_project = 'shakespeare'
|
||||
wandb_run_name = 'ft-' + str(time.time())
|
||||
compile_model = False # takes too little time to finetune, not worth it
|
||||
compile = False # takes too little time to finetune, not worth it
|
||||
|
||||
# save a nice and overfit checkpoint that
|
||||
# will only speak Shakespeare and forgets
|
||||
|
Loading…
Reference in New Issue
Block a user