diff --git a/sample.py b/sample.py
index 6ff0ea2..f02308e 100644
--- a/sample.py
+++ b/sample.py
@@ -13,7 +13,7 @@ out_dir = 'out'
 start = "\n" # or "<|endoftext|>" or whatever you like
 num_samples = 10 # number of samples to draw
 max_new_tokens = 500 # number of tokens generated in each sample
-temperature = 0.8 # higher temperature (up to 1) is more random, lower (down to 0) means more greedy
+temperature = 0.8 # 1.0 = no change, < 1.0 = less random, > 1.0 = more random, in predictions
 top_k = 200 # retain only the top_k most likely tokens, clamp others to have 0 probability
 seed = 1337
 device = 'cuda' # examples: 'cpu', 'cuda', 'cuda:0', 'cuda:1', etc.