mirror of
https://github.com/osmarks/nanogpt-experiments.git
synced 2024-12-18 14:10:28 +00:00
rename compile_model to compile, shorter, version 2 stragglers
This commit is contained in:
parent
35f51974c4
commit
41184a27f5
4
bench.py
4
bench.py
@ -15,7 +15,7 @@ torch.manual_seed(1337)
|
|||||||
batch_size = 8
|
batch_size = 8
|
||||||
block_size = 1024
|
block_size = 1024
|
||||||
dtype = torch.bfloat16
|
dtype = torch.bfloat16
|
||||||
compile_model = True
|
compile = True
|
||||||
|
|
||||||
# data loading init
|
# data loading init
|
||||||
real_data = True
|
real_data = True
|
||||||
@ -47,7 +47,7 @@ model.to(device)
|
|||||||
|
|
||||||
optimizer = model.configure_optimizers(weight_decay=1e-2, learning_rate=1e-4, betas=(0.9, 0.95))
|
optimizer = model.configure_optimizers(weight_decay=1e-2, learning_rate=1e-4, betas=(0.9, 0.95))
|
||||||
|
|
||||||
if compile_model:
|
if compile:
|
||||||
print("Compiling model...")
|
print("Compiling model...")
|
||||||
model = torch.compile(model) # pytorch 2.0
|
model = torch.compile(model) # pytorch 2.0
|
||||||
|
|
||||||
|
@ -5,7 +5,7 @@ eval_interval = 200
|
|||||||
wandb_log = False # feel free to turn on
|
wandb_log = False # feel free to turn on
|
||||||
wandb_project = 'shakespeare'
|
wandb_project = 'shakespeare'
|
||||||
wandb_run_name = 'ft-' + str(time.time())
|
wandb_run_name = 'ft-' + str(time.time())
|
||||||
compile_model = False # takes too little time to finetune, not worth it
|
compile = False # takes too little time to finetune, not worth it
|
||||||
|
|
||||||
# save a nice and overfit checkpoint that
|
# save a nice and overfit checkpoint that
|
||||||
# will only speak Shakespeare and forgets
|
# will only speak Shakespeare and forgets
|
||||||
|
Loading…
Reference in New Issue
Block a user