{ "epoch": 1.0, "eval_loss": 1.9502463340759277, "eval_runtime": 68.5306, "eval_samples_per_second": 13.76, "eval_steps_per_second": 1.722, "perplexity": 7.030419199119011, "total_flos": 7.49645512704e+16, "train_loss": 2.070154784231475, "train_runtime": 1281.9871, "train_samples_per_second": 6.435, "train_steps_per_second": 3.218 }