mirror of
				https://github.com/osmarks/nanogpt-experiments.git
				synced 2025-10-31 07:13:01 +00:00 
			
		
		
		
	candidate changes to apis, have to think through more
This commit is contained in:
		
							
								
								
									
										22
									
								
								config/finetune_shakespeare.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										22
									
								
								config/finetune_shakespeare.py
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,22 @@ | ||||
| import time | ||||
| # Settings for fine-tuning on the 'shakespeare' dataset, initialised from 'gpt2-xl'. | ||||
| out_dir = 'out-shakespeare' | ||||
| eval_interval = 200 # NOTE(review): presumably counted in training iterations - confirm against the training loop | ||||
| wandb_log = False # feel free to turn on | ||||
| wandb_project = 'shakespeare' | ||||
| wandb_run_name = 'ft-' + str(time.time()) # 'ft-' + current Unix time in seconds, so each launch gets a distinct name | ||||
| compile_model = False # takes too little time to finetune, not worth it | ||||
|  | ||||
| # save a nice and overfit checkpoint that | ||||
| # will only speak Shakespeare and forgets | ||||
| # everything else about the world #dark | ||||
| always_save_checkpoint = True | ||||
|  | ||||
| dataset = 'shakespeare' | ||||
| init_from = 'gpt2-xl' # NOTE(review): presumably selects pretrained GPT-2 XL weights - confirm against the training script | ||||
| batch_size = 1 | ||||
| block_size = 512 # NOTE(review): presumably the context length in tokens - confirm | ||||
|  | ||||
| learning_rate = 1e-5 | ||||
| max_iters = 1000 | ||||
| decay_lr = False # NOTE(review): presumably keeps learning_rate constant for the whole run - confirm | ||||
		Reference in New Issue
	
	Block a user
	 Andrej Karpathy
					Andrej Karpathy