| { | |
| "epoch": 1.0, | |
| "eval_loss": 1.8621082305908203, | |
| "eval_runtime": 31.9078, | |
| "eval_samples_per_second": 13.758, | |
| "eval_steps_per_second": 1.724, | |
| "perplexity": 6.437293775421979, | |
| "total_flos": 4.00628735213568e+16, | |
| "train_loss": 2.065633855547224, | |
| "train_runtime": 693.7957, | |
| "train_samples_per_second": 6.355, | |
| "train_steps_per_second": 3.178 | |
| } |