# Text-sampling configuration, expressed as plain Python assignments.
# NOTE(review): presumably these names override defaults in a sampling
# script that executes this file -- confirm against the consumer.

# Model/config identifier and the directory the run is associated with.
model_config = 'reflow'
out_dir = 'out/reflow-1'
# NOTE(review): 'resume' presumably means "load a checkpoint from out_dir" --
# confirm against the consumer.
init_from = 'resume'

# Few-shot prompt: two answered "capital of ..." Q/A pairs followed by a third
# question whose answer is left open ("A:") for the model to complete.
start = "Q: What is the capital of China?\nA: Beijing\nQ: What is the capital of Japan?\nA: Tokyo\nQ: What is the capital of France?\nA:"

# Generation settings.
num_samples = 10
max_new_tokens = 50
# NOTE(review): with a temperature this close to zero the 10 samples will
# likely be near-identical -- confirm that is intended.
temperature = 0.01
top_k = 20
seed = 1337

# Runtime settings.
device = 'cuda'
dtype = 'float16'
# This name shadows Python's builtin `compile` inside this module's namespace;
# it is kept as-is because the consumer presumably looks it up by this name.
compile = False