mirror of
https://github.com/osmarks/nanogpt-experiments.git
synced 2025-09-13 08:16:01 +00:00
experiments
This commit is contained in:
@@ -2,7 +2,7 @@
|
||||
# launch as the following (e.g. in a screen session) and wait ~5 days:
|
||||
# $ torchrun --standalone --nproc_per_node=8 train.py config/train_gpt2.py
|
||||
|
||||
wandb_log = True
|
||||
wandb_log = False
|
||||
wandb_project = 'owt'
|
||||
wandb_run_name='gpt2-124M'
|
||||
|
||||
|
@@ -35,3 +35,4 @@ warmup_iters = 100 # not super necessary potentially
|
||||
# on macbook also add
|
||||
# device = 'cpu' # run on cpu only
|
||||
# compile = False # do not torch compile the model
|
||||
compile = False
|
||||
|
Reference in New Issue
Block a user