{ "epoch": 1.0, "eval_loss": 2.0968925952911377, "eval_runtime": 9.7787, "eval_samples_per_second": 22.293, "eval_steps_per_second": 2.863, "perplexity": 8.140833703043482, "total_flos": 2.432579616768e+16, "train_loss": 2.2809645715587865, "train_runtime": 351.6588, "train_samples_per_second": 7.595, "train_steps_per_second": 3.799 }