GENOME-gemma-2b-it / oasst1 /trainer_log.jsonl
Estwld's picture
Upload 15 files
41f7b93 verified
{"current_steps": 10, "total_steps": 1090, "loss": 1.8499, "learning_rate": 1.834862385321101e-05, "epoch": 0.045871559633027525, "percentage": 0.92, "elapsed_time": "0:00:09", "remaining_time": "0:17:08"}
{"current_steps": 20, "total_steps": 1090, "loss": 1.7448, "learning_rate": 3.669724770642202e-05, "epoch": 0.09174311926605505, "percentage": 1.83, "elapsed_time": "0:00:16", "remaining_time": "0:15:03"}
{"current_steps": 30, "total_steps": 1090, "loss": 1.5686, "learning_rate": 5.504587155963303e-05, "epoch": 0.13761467889908258, "percentage": 2.75, "elapsed_time": "0:00:24", "remaining_time": "0:14:30"}
{"current_steps": 40, "total_steps": 1090, "loss": 1.4637, "learning_rate": 7.339449541284404e-05, "epoch": 0.1834862385321101, "percentage": 3.67, "elapsed_time": "0:00:33", "remaining_time": "0:14:30"}
{"current_steps": 50, "total_steps": 1090, "loss": 1.4793, "learning_rate": 9.174311926605506e-05, "epoch": 0.22935779816513763, "percentage": 4.59, "elapsed_time": "0:00:41", "remaining_time": "0:14:14"}
{"current_steps": 60, "total_steps": 1090, "loss": 1.3845, "learning_rate": 0.00011009174311926606, "epoch": 0.27522935779816515, "percentage": 5.5, "elapsed_time": "0:00:49", "remaining_time": "0:14:08"}
{"current_steps": 70, "total_steps": 1090, "loss": 1.4139, "learning_rate": 0.00012844036697247707, "epoch": 0.3211009174311927, "percentage": 6.42, "elapsed_time": "0:00:56", "remaining_time": "0:13:48"}
{"current_steps": 80, "total_steps": 1090, "loss": 1.3459, "learning_rate": 0.0001467889908256881, "epoch": 0.3669724770642202, "percentage": 7.34, "elapsed_time": "0:01:04", "remaining_time": "0:13:28"}
{"current_steps": 90, "total_steps": 1090, "loss": 1.4618, "learning_rate": 0.0001651376146788991, "epoch": 0.41284403669724773, "percentage": 8.26, "elapsed_time": "0:01:11", "remaining_time": "0:13:10"}
{"current_steps": 100, "total_steps": 1090, "loss": 1.4328, "learning_rate": 0.00018348623853211012, "epoch": 0.45871559633027525, "percentage": 9.17, "elapsed_time": "0:01:20", "remaining_time": "0:13:13"}
{"current_steps": 110, "total_steps": 1090, "loss": 1.3412, "learning_rate": 0.00019999948721966259, "epoch": 0.5045871559633027, "percentage": 10.09, "elapsed_time": "0:01:28", "remaining_time": "0:13:04"}
{"current_steps": 120, "total_steps": 1090, "loss": 1.3702, "learning_rate": 0.0001999379599421534, "epoch": 0.5504587155963303, "percentage": 11.01, "elapsed_time": "0:01:36", "remaining_time": "0:12:56"}
{"current_steps": 130, "total_steps": 1090, "loss": 1.4099, "learning_rate": 0.00019977394889447524, "epoch": 0.5963302752293578, "percentage": 11.93, "elapsed_time": "0:01:44", "remaining_time": "0:12:52"}
{"current_steps": 140, "total_steps": 1090, "loss": 1.323, "learning_rate": 0.00019950762226567781, "epoch": 0.6422018348623854, "percentage": 12.84, "elapsed_time": "0:01:52", "remaining_time": "0:12:41"}
{"current_steps": 150, "total_steps": 1090, "loss": 1.3934, "learning_rate": 0.00019913925316676945, "epoch": 0.6880733944954128, "percentage": 13.76, "elapsed_time": "0:02:00", "remaining_time": "0:12:37"}
{"current_steps": 160, "total_steps": 1090, "loss": 1.3618, "learning_rate": 0.00019866921935064906, "epoch": 0.7339449541284404, "percentage": 14.68, "elapsed_time": "0:02:08", "remaining_time": "0:12:25"}
{"current_steps": 170, "total_steps": 1090, "loss": 1.3534, "learning_rate": 0.00019809800282473013, "epoch": 0.7798165137614679, "percentage": 15.6, "elapsed_time": "0:02:15", "remaining_time": "0:12:15"}
{"current_steps": 180, "total_steps": 1090, "loss": 1.3299, "learning_rate": 0.00019742618935665476, "epoch": 0.8256880733944955, "percentage": 16.51, "elapsed_time": "0:02:23", "remaining_time": "0:12:05"}
{"current_steps": 190, "total_steps": 1090, "loss": 1.4378, "learning_rate": 0.0001966544678736044, "epoch": 0.8715596330275229, "percentage": 17.43, "elapsed_time": "0:02:30", "remaining_time": "0:11:54"}
{"current_steps": 200, "total_steps": 1090, "loss": 1.3573, "learning_rate": 0.00019578362975582292, "epoch": 0.9174311926605505, "percentage": 18.35, "elapsed_time": "0:02:38", "remaining_time": "0:11:46"}
{"current_steps": 210, "total_steps": 1090, "loss": 1.3869, "learning_rate": 0.0001948145680250766, "epoch": 0.963302752293578, "percentage": 19.27, "elapsed_time": "0:02:45", "remaining_time": "0:11:35"}
{"current_steps": 220, "total_steps": 1090, "loss": 1.3637, "learning_rate": 0.00019374827642888398, "epoch": 1.0091743119266054, "percentage": 20.18, "elapsed_time": "0:02:52", "remaining_time": "0:11:23"}
{"current_steps": 230, "total_steps": 1090, "loss": 1.2397, "learning_rate": 0.00019258584842145343, "epoch": 1.0550458715596331, "percentage": 21.1, "elapsed_time": "0:03:00", "remaining_time": "0:11:13"}
{"current_steps": 240, "total_steps": 1090, "loss": 1.3243, "learning_rate": 0.0001913284760423745, "epoch": 1.1009174311926606, "percentage": 22.02, "elapsed_time": "0:03:07", "remaining_time": "0:11:04"}
{"current_steps": 250, "total_steps": 1090, "loss": 1.4041, "learning_rate": 0.00018997744869421246, "epoch": 1.146788990825688, "percentage": 22.94, "elapsed_time": "0:03:15", "remaining_time": "0:10:55"}
{"current_steps": 260, "total_steps": 1090, "loss": 1.2698, "learning_rate": 0.0001885341518202595, "epoch": 1.1926605504587156, "percentage": 23.85, "elapsed_time": "0:03:22", "remaining_time": "0:10:47"}
{"current_steps": 270, "total_steps": 1090, "loss": 1.2547, "learning_rate": 0.00018700006548379898, "epoch": 1.238532110091743, "percentage": 24.77, "elapsed_time": "0:03:30", "remaining_time": "0:10:39"}
{"current_steps": 280, "total_steps": 1090, "loss": 1.2601, "learning_rate": 0.00018537676285033887, "epoch": 1.2844036697247707, "percentage": 25.69, "elapsed_time": "0:03:38", "remaining_time": "0:10:32"}
{"current_steps": 290, "total_steps": 1090, "loss": 1.3409, "learning_rate": 0.00018366590857437184, "epoch": 1.3302752293577982, "percentage": 26.61, "elapsed_time": "0:03:46", "remaining_time": "0:10:23"}
{"current_steps": 300, "total_steps": 1090, "loss": 1.2916, "learning_rate": 0.00018186925709231532, "epoch": 1.3761467889908257, "percentage": 27.52, "elapsed_time": "0:03:54", "remaining_time": "0:10:17"}
{"current_steps": 310, "total_steps": 1090, "loss": 1.2679, "learning_rate": 0.0001799886508233829, "epoch": 1.4220183486238533, "percentage": 28.44, "elapsed_time": "0:04:02", "remaining_time": "0:10:09"}
{"current_steps": 320, "total_steps": 1090, "loss": 1.3653, "learning_rate": 0.00017802601828023138, "epoch": 1.4678899082568808, "percentage": 29.36, "elapsed_time": "0:04:09", "remaining_time": "0:10:00"}
{"current_steps": 330, "total_steps": 1090, "loss": 1.2496, "learning_rate": 0.0001759833720913214, "epoch": 1.5137614678899083, "percentage": 30.28, "elapsed_time": "0:04:16", "remaining_time": "0:09:51"}
{"current_steps": 340, "total_steps": 1090, "loss": 1.2645, "learning_rate": 0.0001738628069370195, "epoch": 1.5596330275229358, "percentage": 31.19, "elapsed_time": "0:04:24", "remaining_time": "0:09:42"}
{"current_steps": 350, "total_steps": 1090, "loss": 1.2868, "learning_rate": 0.000171666497401558, "epoch": 1.6055045871559632, "percentage": 32.11, "elapsed_time": "0:04:31", "remaining_time": "0:09:33"}
{"current_steps": 360, "total_steps": 1090, "loss": 1.249, "learning_rate": 0.00016939669574305566, "epoch": 1.6513761467889907, "percentage": 33.03, "elapsed_time": "0:04:39", "remaining_time": "0:09:25"}
{"current_steps": 370, "total_steps": 1090, "loss": 1.2305, "learning_rate": 0.00016705572958388576, "epoch": 1.6972477064220184, "percentage": 33.94, "elapsed_time": "0:04:50", "remaining_time": "0:09:25"}
{"current_steps": 380, "total_steps": 1090, "loss": 1.3317, "learning_rate": 0.00016464599952375998, "epoch": 1.7431192660550459, "percentage": 34.86, "elapsed_time": "0:05:01", "remaining_time": "0:09:22"}
{"current_steps": 390, "total_steps": 1090, "loss": 1.3069, "learning_rate": 0.0001621699766779763, "epoch": 1.7889908256880735, "percentage": 35.78, "elapsed_time": "0:05:09", "remaining_time": "0:09:15"}
{"current_steps": 400, "total_steps": 1090, "loss": 1.3093, "learning_rate": 0.00015963020014335438, "epoch": 1.834862385321101, "percentage": 36.7, "elapsed_time": "0:05:17", "remaining_time": "0:09:07"}
{"current_steps": 410, "total_steps": 1090, "loss": 1.2472, "learning_rate": 0.00015702927439445826, "epoch": 1.8807339449541285, "percentage": 37.61, "elapsed_time": "0:05:24", "remaining_time": "0:08:58"}
{"current_steps": 420, "total_steps": 1090, "loss": 1.3159, "learning_rate": 0.00015436986661277577, "epoch": 1.926605504587156, "percentage": 38.53, "elapsed_time": "0:05:32", "remaining_time": "0:08:50"}
{"current_steps": 430, "total_steps": 1090, "loss": 1.3643, "learning_rate": 0.00015165470395159313, "epoch": 1.9724770642201834, "percentage": 39.45, "elapsed_time": "0:05:42", "remaining_time": "0:08:45"}
{"current_steps": 440, "total_steps": 1090, "loss": 1.2591, "learning_rate": 0.00014888657073937076, "epoch": 2.018348623853211, "percentage": 40.37, "elapsed_time": "0:05:49", "remaining_time": "0:08:36"}
{"current_steps": 450, "total_steps": 1090, "loss": 1.1217, "learning_rate": 0.0001460683056244869, "epoch": 2.0642201834862384, "percentage": 41.28, "elapsed_time": "0:05:57", "remaining_time": "0:08:27"}
{"current_steps": 460, "total_steps": 1090, "loss": 1.1943, "learning_rate": 0.00014320279866427796, "epoch": 2.1100917431192663, "percentage": 42.2, "elapsed_time": "0:06:05", "remaining_time": "0:08:20"}
{"current_steps": 470, "total_steps": 1090, "loss": 1.1619, "learning_rate": 0.00014029298836135988, "epoch": 2.1559633027522938, "percentage": 43.12, "elapsed_time": "0:06:13", "remaining_time": "0:08:12"}
{"current_steps": 480, "total_steps": 1090, "loss": 1.127, "learning_rate": 0.0001373418586502706, "epoch": 2.2018348623853212, "percentage": 44.04, "elapsed_time": "0:06:20", "remaining_time": "0:08:03"}
{"current_steps": 490, "total_steps": 1090, "loss": 1.1109, "learning_rate": 0.00013435243583752294, "epoch": 2.2477064220183487, "percentage": 44.95, "elapsed_time": "0:06:29", "remaining_time": "0:07:56"}
{"current_steps": 500, "total_steps": 1090, "loss": 1.2006, "learning_rate": 0.00013132778549820618, "epoch": 2.293577981651376, "percentage": 45.87, "elapsed_time": "0:06:36", "remaining_time": "0:07:47"}
{"current_steps": 510, "total_steps": 1090, "loss": 1.1483, "learning_rate": 0.00012827100933231905, "epoch": 2.3394495412844036, "percentage": 46.79, "elapsed_time": "0:06:43", "remaining_time": "0:07:38"}
{"current_steps": 520, "total_steps": 1090, "loss": 1.1057, "learning_rate": 0.000125185241984057, "epoch": 2.385321100917431, "percentage": 47.71, "elapsed_time": "0:06:50", "remaining_time": "0:07:29"}
{"current_steps": 530, "total_steps": 1090, "loss": 1.2038, "learning_rate": 0.00012207364782731655, "epoch": 2.4311926605504586, "percentage": 48.62, "elapsed_time": "0:06:57", "remaining_time": "0:07:21"}
{"current_steps": 540, "total_steps": 1090, "loss": 1.1714, "learning_rate": 0.00011893941772071249, "epoch": 2.477064220183486, "percentage": 49.54, "elapsed_time": "0:07:06", "remaining_time": "0:07:14"}
{"current_steps": 550, "total_steps": 1090, "loss": 1.1229, "learning_rate": 0.0001157857657354354, "epoch": 2.522935779816514, "percentage": 50.46, "elapsed_time": "0:07:13", "remaining_time": "0:07:05"}
{"current_steps": 560, "total_steps": 1090, "loss": 1.1389, "learning_rate": 0.00011261592585930576, "epoch": 2.5688073394495414, "percentage": 51.38, "elapsed_time": "0:07:21", "remaining_time": "0:06:57"}
{"current_steps": 570, "total_steps": 1090, "loss": 1.1349, "learning_rate": 0.00010943314868040364, "epoch": 2.614678899082569, "percentage": 52.29, "elapsed_time": "0:07:29", "remaining_time": "0:06:50"}
{"current_steps": 580, "total_steps": 1090, "loss": 1.1317, "learning_rate": 0.00010624069805367559, "epoch": 2.6605504587155964, "percentage": 53.21, "elapsed_time": "0:07:36", "remaining_time": "0:06:41"}
{"current_steps": 590, "total_steps": 1090, "loss": 1.1364, "learning_rate": 0.00010304184775393642, "epoch": 2.706422018348624, "percentage": 54.13, "elapsed_time": "0:07:44", "remaining_time": "0:06:33"}
{"current_steps": 600, "total_steps": 1090, "loss": 1.1107, "learning_rate": 9.983987811869862e-05, "epoch": 2.7522935779816513, "percentage": 55.05, "elapsed_time": "0:07:51", "remaining_time": "0:06:25"}
{"current_steps": 610, "total_steps": 1090, "loss": 1.1161, "learning_rate": 9.663807268427198e-05, "epoch": 2.7981651376146788, "percentage": 55.96, "elapsed_time": "0:07:58", "remaining_time": "0:06:16"}
{"current_steps": 620, "total_steps": 1090, "loss": 1.1981, "learning_rate": 9.343971481858246e-05, "epoch": 2.8440366972477067, "percentage": 56.88, "elapsed_time": "0:08:06", "remaining_time": "0:06:09"}
{"current_steps": 630, "total_steps": 1090, "loss": 1.1386, "learning_rate": 9.024808435416434e-05, "epoch": 2.8899082568807337, "percentage": 57.8, "elapsed_time": "0:08:14", "remaining_time": "0:06:00"}
{"current_steps": 640, "total_steps": 1090, "loss": 1.1681, "learning_rate": 8.706645422477739e-05, "epoch": 2.9357798165137616, "percentage": 58.72, "elapsed_time": "0:08:24", "remaining_time": "0:05:54"}
{"current_steps": 650, "total_steps": 1090, "loss": 1.1531, "learning_rate": 8.389808710909881e-05, "epoch": 2.981651376146789, "percentage": 59.63, "elapsed_time": "0:08:31", "remaining_time": "0:05:46"}
{"current_steps": 660, "total_steps": 1090, "loss": 1.1137, "learning_rate": 8.07462320849313e-05, "epoch": 3.0275229357798166, "percentage": 60.55, "elapsed_time": "0:08:38", "remaining_time": "0:05:37"}
{"current_steps": 670, "total_steps": 1090, "loss": 1.0204, "learning_rate": 7.761412129735852e-05, "epoch": 3.073394495412844, "percentage": 61.47, "elapsed_time": "0:08:45", "remaining_time": "0:05:29"}
{"current_steps": 680, "total_steps": 1090, "loss": 1.0303, "learning_rate": 7.450496664426477e-05, "epoch": 3.1192660550458715, "percentage": 62.39, "elapsed_time": "0:08:53", "remaining_time": "0:05:21"}
{"current_steps": 690, "total_steps": 1090, "loss": 1.0359, "learning_rate": 7.142195648261747e-05, "epoch": 3.165137614678899, "percentage": 63.3, "elapsed_time": "0:09:01", "remaining_time": "0:05:13"}
{"current_steps": 700, "total_steps": 1090, "loss": 0.9762, "learning_rate": 6.83682523588902e-05, "epoch": 3.2110091743119265, "percentage": 64.22, "elapsed_time": "0:09:09", "remaining_time": "0:05:05"}
{"current_steps": 710, "total_steps": 1090, "loss": 1.06, "learning_rate": 6.534698576697939e-05, "epoch": 3.2568807339449544, "percentage": 65.14, "elapsed_time": "0:09:16", "remaining_time": "0:04:57"}
{"current_steps": 720, "total_steps": 1090, "loss": 0.9795, "learning_rate": 6.2361254936939e-05, "epoch": 3.302752293577982, "percentage": 66.06, "elapsed_time": "0:09:24", "remaining_time": "0:04:50"}
{"current_steps": 730, "total_steps": 1090, "loss": 1.0335, "learning_rate": 5.941412165782645e-05, "epoch": 3.3486238532110093, "percentage": 66.97, "elapsed_time": "0:09:32", "remaining_time": "0:04:42"}
{"current_steps": 740, "total_steps": 1090, "loss": 0.9486, "learning_rate": 5.650860813791785e-05, "epoch": 3.3944954128440368, "percentage": 67.89, "elapsed_time": "0:09:39", "remaining_time": "0:04:34"}
{"current_steps": 750, "total_steps": 1090, "loss": 0.9524, "learning_rate": 5.364769390551225e-05, "epoch": 3.4403669724770642, "percentage": 68.81, "elapsed_time": "0:09:47", "remaining_time": "0:04:26"}
{"current_steps": 760, "total_steps": 1090, "loss": 0.9839, "learning_rate": 5.0834312753503124e-05, "epoch": 3.4862385321100917, "percentage": 69.72, "elapsed_time": "0:09:55", "remaining_time": "0:04:18"}
{"current_steps": 770, "total_steps": 1090, "loss": 1.0241, "learning_rate": 4.807134973085036e-05, "epoch": 3.532110091743119, "percentage": 70.64, "elapsed_time": "0:10:02", "remaining_time": "0:04:10"}
{"current_steps": 780, "total_steps": 1090, "loss": 0.9814, "learning_rate": 4.53616381840377e-05, "epoch": 3.5779816513761467, "percentage": 71.56, "elapsed_time": "0:10:09", "remaining_time": "0:04:02"}
{"current_steps": 790, "total_steps": 1090, "loss": 0.9867, "learning_rate": 4.2707956851550016e-05, "epoch": 3.623853211009174, "percentage": 72.48, "elapsed_time": "0:10:17", "remaining_time": "0:03:54"}
{"current_steps": 800, "total_steps": 1090, "loss": 0.9978, "learning_rate": 4.011302701434937e-05, "epoch": 3.669724770642202, "percentage": 73.39, "elapsed_time": "0:10:27", "remaining_time": "0:03:47"}
{"current_steps": 810, "total_steps": 1090, "loss": 1.0039, "learning_rate": 3.757950970527249e-05, "epoch": 3.7155963302752295, "percentage": 74.31, "elapsed_time": "0:10:36", "remaining_time": "0:03:39"}
{"current_steps": 820, "total_steps": 1090, "loss": 1.014, "learning_rate": 3.5110002980210975e-05, "epoch": 3.761467889908257, "percentage": 75.23, "elapsed_time": "0:10:44", "remaining_time": "0:03:32"}
{"current_steps": 830, "total_steps": 1090, "loss": 0.9395, "learning_rate": 3.270703925387279e-05, "epoch": 3.8073394495412844, "percentage": 76.15, "elapsed_time": "0:10:52", "remaining_time": "0:03:24"}
{"current_steps": 840, "total_steps": 1090, "loss": 0.9852, "learning_rate": 3.037308270285709e-05, "epoch": 3.853211009174312, "percentage": 77.06, "elapsed_time": "0:11:01", "remaining_time": "0:03:16"}
{"current_steps": 850, "total_steps": 1090, "loss": 0.9882, "learning_rate": 2.8110526738705344e-05, "epoch": 3.8990825688073394, "percentage": 77.98, "elapsed_time": "0:11:09", "remaining_time": "0:03:08"}
{"current_steps": 860, "total_steps": 1090, "loss": 1.0302, "learning_rate": 2.592169155352031e-05, "epoch": 3.944954128440367, "percentage": 78.9, "elapsed_time": "0:11:16", "remaining_time": "0:03:00"}
{"current_steps": 870, "total_steps": 1090, "loss": 1.024, "learning_rate": 2.3808821740669606e-05, "epoch": 3.9908256880733948, "percentage": 79.82, "elapsed_time": "0:11:24", "remaining_time": "0:02:53"}
{"current_steps": 880, "total_steps": 1090, "loss": 0.9714, "learning_rate": 2.1774083993013718e-05, "epoch": 4.036697247706422, "percentage": 80.73, "elapsed_time": "0:11:31", "remaining_time": "0:02:45"}
{"current_steps": 890, "total_steps": 1090, "loss": 0.9184, "learning_rate": 1.9819564881018983e-05, "epoch": 4.08256880733945, "percentage": 81.65, "elapsed_time": "0:11:39", "remaining_time": "0:02:37"}
{"current_steps": 900, "total_steps": 1090, "loss": 0.9778, "learning_rate": 1.7947268713034127e-05, "epoch": 4.128440366972477, "percentage": 82.57, "elapsed_time": "0:11:47", "remaining_time": "0:02:29"}
{"current_steps": 910, "total_steps": 1090, "loss": 0.9174, "learning_rate": 1.6159115479924257e-05, "epoch": 4.174311926605505, "percentage": 83.49, "elapsed_time": "0:11:54", "remaining_time": "0:02:21"}
{"current_steps": 920, "total_steps": 1090, "loss": 0.872, "learning_rate": 1.4456938886170412e-05, "epoch": 4.220183486238533, "percentage": 84.4, "elapsed_time": "0:12:04", "remaining_time": "0:02:13"}
{"current_steps": 930, "total_steps": 1090, "loss": 0.9987, "learning_rate": 1.2842484469453365e-05, "epoch": 4.26605504587156, "percentage": 85.32, "elapsed_time": "0:12:12", "remaining_time": "0:02:06"}
{"current_steps": 940, "total_steps": 1090, "loss": 0.9002, "learning_rate": 1.1317407810650372e-05, "epoch": 4.3119266055045875, "percentage": 86.24, "elapsed_time": "0:12:20", "remaining_time": "0:01:58"}
{"current_steps": 950, "total_steps": 1090, "loss": 0.8614, "learning_rate": 9.883272836080116e-06, "epoch": 4.3577981651376145, "percentage": 87.16, "elapsed_time": "0:12:28", "remaining_time": "0:01:50"}
{"current_steps": 960, "total_steps": 1090, "loss": 0.891, "learning_rate": 8.541550213737171e-06, "epoch": 4.4036697247706424, "percentage": 88.07, "elapsed_time": "0:12:36", "remaining_time": "0:01:42"}
{"current_steps": 970, "total_steps": 1090, "loss": 0.9344, "learning_rate": 7.293615845160196e-06, "epoch": 4.4495412844036695, "percentage": 88.99, "elapsed_time": "0:12:43", "remaining_time": "0:01:34"}
{"current_steps": 980, "total_steps": 1090, "loss": 0.8811, "learning_rate": 6.140749454480932e-06, "epoch": 4.495412844036697, "percentage": 89.91, "elapsed_time": "0:12:51", "remaining_time": "0:01:26"}
{"current_steps": 990, "total_steps": 1090, "loss": 0.873, "learning_rate": 5.0841332761005e-06, "epoch": 4.541284403669724, "percentage": 90.83, "elapsed_time": "0:13:00", "remaining_time": "0:01:18"}
{"current_steps": 1000, "total_steps": 1090, "loss": 0.9262, "learning_rate": 4.124850842338779e-06, "epoch": 4.587155963302752, "percentage": 91.74, "elapsed_time": "0:13:08", "remaining_time": "0:01:11"}
{"current_steps": 1000, "total_steps": 1090, "eval_loss": 1.6428269147872925, "epoch": 4.587155963302752, "percentage": 91.74, "elapsed_time": "0:13:12", "remaining_time": "0:01:11"}
{"current_steps": 1010, "total_steps": 1090, "loss": 0.8827, "learning_rate": 3.263885872300343e-06, "epoch": 4.63302752293578, "percentage": 92.66, "elapsed_time": "0:13:21", "remaining_time": "0:01:03"}
{"current_steps": 1020, "total_steps": 1090, "loss": 0.9605, "learning_rate": 2.502121263096224e-06, "epoch": 4.678899082568807, "percentage": 93.58, "elapsed_time": "0:13:28", "remaining_time": "0:00:55"}
{"current_steps": 1030, "total_steps": 1090, "loss": 0.8472, "learning_rate": 1.840338184455881e-06, "epoch": 4.724770642201835, "percentage": 94.5, "elapsed_time": "0:13:36", "remaining_time": "0:00:47"}
{"current_steps": 1040, "total_steps": 1090, "loss": 0.8823, "learning_rate": 1.2792152776580968e-06, "epoch": 4.770642201834862, "percentage": 95.41, "elapsed_time": "0:13:43", "remaining_time": "0:00:39"}
{"current_steps": 1050, "total_steps": 1090, "loss": 0.9049, "learning_rate": 8.193279596020121e-07, "epoch": 4.81651376146789, "percentage": 96.33, "elapsed_time": "0:13:50", "remaining_time": "0:00:31"}
{"current_steps": 1060, "total_steps": 1090, "loss": 0.9058, "learning_rate": 4.6114783273213393e-07, "epoch": 4.862385321100917, "percentage": 97.25, "elapsed_time": "0:13:59", "remaining_time": "0:00:23"}
{"current_steps": 1070, "total_steps": 1090, "loss": 0.8932, "learning_rate": 2.05042201422323e-07, "epoch": 4.908256880733945, "percentage": 98.17, "elapsed_time": "0:14:07", "remaining_time": "0:00:15"}
{"current_steps": 1080, "total_steps": 1090, "loss": 0.8812, "learning_rate": 5.127369531473525e-08, "epoch": 4.954128440366972, "percentage": 99.08, "elapsed_time": "0:14:14", "remaining_time": "0:00:07"}
{"current_steps": 1090, "total_steps": 1090, "loss": 0.8824, "learning_rate": 0.0, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:14:22", "remaining_time": "0:00:00"}
{"current_steps": 1090, "total_steps": 1090, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:14:22", "remaining_time": "0:00:00"}