mirror of
https://github.com/osmarks/nanogpt-experiments.git
synced 2025-10-25 20:37:42 +00:00
Shuttling the poor man's configurator aside into its own file and adding it to all of train, sample, and bench. Because I am leaving args in globals() so I can avoid having to prepend every single variable with `args.`, I have to exec the configurator and the optional configs. So we're left with something very gross by standard convention but also quite simple and functional. *ducks*
This commit is contained in:
35
train.py
35
train.py
@@ -13,7 +13,6 @@ import os
|
||||
import sys
|
||||
import time
|
||||
import math
|
||||
from ast import literal_eval
|
||||
|
||||
import wandb
|
||||
import numpy as np
|
||||
@@ -24,7 +23,7 @@ from torch.distributed import init_process_group, destroy_process_group
|
||||
from model import GPTConfig, GPT
|
||||
|
||||
# -----------------------------------------------------------------------------
|
||||
# default config values
|
||||
# default config values designed to train a gpt2 (124M) on OpenWebText
|
||||
# I/O
|
||||
out_dir = 'out'
|
||||
eval_interval = 2000
|
||||
@@ -62,37 +61,7 @@ min_lr = 6e-5 # minimum learning rate, should be ~= learning_rate/10 per Chinchi
|
||||
backend = 'nccl' # 'nccl', 'gloo', etc.
|
||||
compile = True # use PyTorch 2.0 to compile the model to be faster
|
||||
# -----------------------------------------------------------------------------
|
||||
# poor man's Configurator. Potentially a bad idea. Example usage:
|
||||
# $ python train.py override_file --batch_size=32
|
||||
# this will first run config/override_file.py, then override batch_size to 32
|
||||
for arg in sys.argv[1:]:
|
||||
if '=' not in arg:
|
||||
# assume it's the name of a config file
|
||||
assert not arg.startswith('--')
|
||||
config_file = os.path.join('config', arg + '.py')
|
||||
print(f"Overriding config with {config_file}:")
|
||||
with open(config_file) as f:
|
||||
print(f.read())
|
||||
exec(open(config_file).read())
|
||||
else:
|
||||
# assume it's a --key=value argument
|
||||
assert arg.startswith('--')
|
||||
key, val = arg.split('=')
|
||||
key = key[2:]
|
||||
if key in globals():
|
||||
try:
|
||||
# attempt to eval it (e.g. if bool, number, etc.)
|
||||
attempt = literal_eval(val)
|
||||
except (SyntaxError, ValueError):
|
||||
# if that goes wrong, just use the string
|
||||
attempt = val
|
||||
# ensure the types match ok
|
||||
assert type(attempt) == type(globals()[key])
|
||||
# cross fingers
|
||||
print(f"Overriding: {key} = {attempt}")
|
||||
globals()[key] = attempt
|
||||
else:
|
||||
raise ValueError(f"Unknown config key: {key}")
|
||||
exec(open('configurator.py').read()) # overrides from command line or config file
|
||||
# -----------------------------------------------------------------------------
|
||||
ddp = int(os.environ.get('LOCAL_RANK', -1)) != -1 # is this a ddp run?
|
||||
if ddp:
|
||||
|
||||
Reference in New Issue
Block a user