Training in progress, step 939
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11feec52a42068064cfc95c752196d7fbce9c6759006d7d481936d3ad1cf2793
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:895982d9591e5252500e99994b452ac4777b2b8e8e9635e3fbb1e79867130c06
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c037d9b5996d07f5283d82f6a35b3e4fd7bb818a3f6048599f3f7b6be4da59d
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4783c190695b8110380a58de536f58b92082ba8fce3bde4e1191f4d90f0c54a4
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -78,3 +78,17 @@
|
|
| 78 |
{"current_steps": 780, "total_steps": 939, "loss": 0.206, "lr": 8.58858971477457e-07, "epoch": 2.4928, "percentage": 83.07, "elapsed_time": "0:14:53", "remaining_time": "0:03:02"}
|
| 79 |
{"current_steps": 790, "total_steps": 939, "loss": 0.2173, "lr": 7.575718930512516e-07, "epoch": 2.5248, "percentage": 84.13, "elapsed_time": "0:15:04", "remaining_time": "0:02:50"}
|
| 80 |
{"current_steps": 800, "total_steps": 939, "loss": 0.2037, "lr": 6.621482317764105e-07, "epoch": 2.5568, "percentage": 85.2, "elapsed_time": "0:15:15", "remaining_time": "0:02:38"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 78 |
{"current_steps": 780, "total_steps": 939, "loss": 0.206, "lr": 8.58858971477457e-07, "epoch": 2.4928, "percentage": 83.07, "elapsed_time": "0:14:53", "remaining_time": "0:03:02"}
|
| 79 |
{"current_steps": 790, "total_steps": 939, "loss": 0.2173, "lr": 7.575718930512516e-07, "epoch": 2.5248, "percentage": 84.13, "elapsed_time": "0:15:04", "remaining_time": "0:02:50"}
|
| 80 |
{"current_steps": 800, "total_steps": 939, "loss": 0.2037, "lr": 6.621482317764105e-07, "epoch": 2.5568, "percentage": 85.2, "elapsed_time": "0:15:15", "remaining_time": "0:02:38"}
|
| 81 |
+
{"current_steps": 810, "total_steps": 939, "loss": 0.2314, "lr": 5.727198717339511e-07, "epoch": 2.5888, "percentage": 86.26, "elapsed_time": "0:15:25", "remaining_time": "0:02:27"}
|
| 82 |
+
{"current_steps": 820, "total_steps": 939, "loss": 0.2208, "lr": 4.894104109594466e-07, "epoch": 2.6208, "percentage": 87.33, "elapsed_time": "0:15:36", "remaining_time": "0:02:15"}
|
| 83 |
+
{"current_steps": 830, "total_steps": 939, "loss": 0.2099, "lr": 4.123349906194357e-07, "epoch": 2.6528, "percentage": 88.39, "elapsed_time": "0:15:46", "remaining_time": "0:02:04"}
|
| 84 |
+
{"current_steps": 840, "total_steps": 939, "loss": 0.2293, "lr": 3.416001358759635e-07, "epoch": 2.6848, "percentage": 89.46, "elapsed_time": "0:15:57", "remaining_time": "0:01:52"}
|
| 85 |
+
{"current_steps": 850, "total_steps": 939, "loss": 0.2014, "lr": 2.7730360865923954e-07, "epoch": 2.7168, "percentage": 90.52, "elapsed_time": "0:16:07", "remaining_time": "0:01:41"}
|
| 86 |
+
{"current_steps": 860, "total_steps": 939, "loss": 0.2449, "lr": 2.1953427255185122e-07, "epoch": 2.7488, "percentage": 91.59, "elapsed_time": "0:16:18", "remaining_time": "0:01:29"}
|
| 87 |
+
{"current_steps": 870, "total_steps": 939, "loss": 0.2224, "lr": 1.6837196997130434e-07, "epoch": 2.7808, "percentage": 92.65, "elapsed_time": "0:16:28", "remaining_time": "0:01:18"}
|
| 88 |
+
{"current_steps": 880, "total_steps": 939, "loss": 0.1969, "lr": 1.2388741182062348e-07, "epoch": 2.8128, "percentage": 93.72, "elapsed_time": "0:16:39", "remaining_time": "0:01:06"}
|
| 89 |
+
{"current_steps": 890, "total_steps": 939, "loss": 0.2248, "lr": 8.614207975952083e-08, "epoch": 2.8448, "percentage": 94.78, "elapsed_time": "0:16:49", "remaining_time": "0:00:55"}
|
| 90 |
+
{"current_steps": 900, "total_steps": 939, "loss": 0.1906, "lr": 5.518814123121885e-08, "epoch": 2.8768000000000002, "percentage": 95.85, "elapsed_time": "0:17:00", "remaining_time": "0:00:44"}
|
| 91 |
+
{"current_steps": 910, "total_steps": 939, "loss": 0.1928, "lr": 3.10683773623488e-08, "epoch": 2.9088000000000003, "percentage": 96.91, "elapsed_time": "0:17:10", "remaining_time": "0:00:32"}
|
| 92 |
+
{"current_steps": 920, "total_steps": 939, "loss": 0.2329, "lr": 1.3816123835588835e-08, "epoch": 2.9408, "percentage": 97.98, "elapsed_time": "0:17:21", "remaining_time": "0:00:21"}
|
| 93 |
+
{"current_steps": 930, "total_steps": 939, "loss": 0.2185, "lr": 3.4552248167507576e-09, "epoch": 2.9728, "percentage": 99.04, "elapsed_time": "0:17:31", "remaining_time": "0:00:10"}
|
| 94 |
+
{"current_steps": 939, "total_steps": 939, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:18:35", "remaining_time": "0:00:00"}
|