1
0
mirror of https://github.com/osmarks/nanogpt-experiments.git synced 2025-09-13 08:16:01 +00:00

experiments

This commit is contained in:
2024-06-24 19:10:15 +00:00
parent 9755682b98
commit 0194d45e43
17 changed files with 184 additions and 39 deletions

View File

@@ -2,7 +2,7 @@
# launch as the following (e.g. in a screen session) and wait ~5 days:
# $ torchrun --standalone --nproc_per_node=8 train.py config/train_gpt2.py
-wandb_log = True
+wandb_log = False
wandb_project = 'owt'
wandb_run_name='gpt2-124M'

View File

@@ -35,3 +35,4 @@ warmup_iters = 100 # not super necessary potentially
# on macbook also add
# device = 'cpu' # run on cpu only
# compile = False # do not torch compile the model
+compile = False