| { | |
| "epoch": 1.0, | |
| "eval_loss": 1.8534812927246094, | |
| "eval_runtime": 31.7929, | |
| "eval_samples_per_second": 13.745, | |
| "eval_steps_per_second": 1.73, | |
| "perplexity": 6.381998499391311, | |
| "total_flos": 4.13804323012608e+16, | |
| "train_loss": 2.0515993006877538, | |
| "train_runtime": 708.674, | |
| "train_samples_per_second": 6.426, | |
| "train_steps_per_second": 3.213 | |
| } |