mirror of
				https://github.com/osmarks/nanogpt-experiments.git
				synced 2025-10-30 14:53:01 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			9 lines
		
	
	
		
			208 B
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			9 lines
		
	
	
		
			208 B
		
	
	
	
		
			Python
		
	
	
	
	
	
# evaluate the base gpt2
# n_layer=12, n_head=12, n_embd=768
# 124M parameters
#
# This file only defines plain module-level settings. How they are consumed
# is decided by code that is not visible here.
# NOTE(review): presumably loaded as overrides by the training/eval script;
# confirm against the caller.

batch_size = 8
eval_iters = 500  # use more iterations to get good estimate
eval_only = True  # NOTE(review): presumably evaluate and exit without training; confirm
wandb_log = False  # NOTE(review): presumably turns off Weights & Biases logging; confirm
init_from = 'gpt2'  # the base gpt2 model described in the header above
