apwic commited on
Commit
14d9016
·
verified ·
1 Parent(s): dade0c5

End of training

Browse files
README.md CHANGED
@@ -1,4 +1,6 @@
1
  ---
 
 
2
  license: mit
3
  base_model: indolem/indobert-base-uncased
4
  tags:
 
1
  ---
2
+ language:
3
+ - id
4
  license: mit
5
  base_model: indolem/indobert-base-uncased
6
  tags:
all_results.json CHANGED
@@ -6,16 +6,16 @@
6
  "eval_loss": 0.7891051769256592,
7
  "eval_precision": 0.8795731707317074,
8
  "eval_recall": 0.8697945080923805,
9
- "eval_runtime": 4.7471,
10
  "eval_samples": 399,
11
- "eval_samples_per_second": 84.052,
12
- "eval_steps_per_second": 10.533,
13
  "f1": 0.8941622310727313,
14
  "precision": 0.8899245317748838,
15
  "recall": 0.8987993825126839,
16
  "train_loss": 0.05962105130807298,
17
- "train_runtime": 2714.936,
18
  "train_samples": 3638,
19
- "train_samples_per_second": 26.8,
20
- "train_steps_per_second": 0.899
21
  }
 
6
  "eval_loss": 0.7891051769256592,
7
  "eval_precision": 0.8795731707317074,
8
  "eval_recall": 0.8697945080923805,
9
+ "eval_runtime": 4.7492,
10
  "eval_samples": 399,
11
+ "eval_samples_per_second": 84.015,
12
+ "eval_steps_per_second": 10.528,
13
  "f1": 0.8941622310727313,
14
  "precision": 0.8899245317748838,
15
  "recall": 0.8987993825126839,
16
  "train_loss": 0.05962105130807298,
17
+ "train_runtime": 2691.1784,
18
  "train_samples": 3638,
19
+ "train_samples_per_second": 27.036,
20
+ "train_steps_per_second": 0.907
21
  }
eval_results.json CHANGED
@@ -5,8 +5,8 @@
5
  "eval_loss": 0.7891051769256592,
6
  "eval_precision": 0.8795731707317074,
7
  "eval_recall": 0.8697945080923805,
8
- "eval_runtime": 4.7471,
9
  "eval_samples": 399,
10
- "eval_samples_per_second": 84.052,
11
- "eval_steps_per_second": 10.533
12
  }
 
5
  "eval_loss": 0.7891051769256592,
6
  "eval_precision": 0.8795731707317074,
7
  "eval_recall": 0.8697945080923805,
8
+ "eval_runtime": 4.7492,
9
  "eval_samples": 399,
10
+ "eval_samples_per_second": 84.015,
11
+ "eval_steps_per_second": 10.528
12
  }
predict_results.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "accuracy": 0.9109792284866469,
3
+ "f1": 0.8941622310727313,
4
+ "precision": 0.8899245317748838,
5
+ "recall": 0.8987993825126839
6
+ }
runs/May25_13-12-14_indolem-petl-vm/events.out.tfevents.1716645450.indolem-petl-vm.2202872.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8d2d626adce37f9e1077866d44dd6d164293a2ec16bc5f9c5a69301eeb42bdb
3
+ size 560
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 20.0,
3
  "train_loss": 0.05962105130807298,
4
- "train_runtime": 2714.936,
5
  "train_samples": 3638,
6
- "train_samples_per_second": 26.8,
7
- "train_steps_per_second": 0.899
8
  }
 
1
  {
2
  "epoch": 20.0,
3
  "train_loss": 0.05962105130807298,
4
+ "train_runtime": 2691.1784,
5
  "train_samples": 3638,
6
+ "train_samples_per_second": 27.036,
7
+ "train_steps_per_second": 0.907
8
  }
trainer_state.json CHANGED
@@ -22,9 +22,9 @@
22
  "eval_loss": 0.275076687335968,
23
  "eval_precision": 0.8473684210526315,
24
  "eval_recall": 0.8420621931260229,
25
- "eval_runtime": 4.712,
26
- "eval_samples_per_second": 84.677,
27
- "eval_steps_per_second": 10.611,
28
  "step": 122
29
  },
30
  {
@@ -41,9 +41,9 @@
41
  "eval_loss": 0.3036659359931946,
42
  "eval_precision": 0.8573529411764707,
43
  "eval_recall": 0.897708674304419,
44
- "eval_runtime": 4.9592,
45
- "eval_samples_per_second": 80.457,
46
- "eval_steps_per_second": 10.082,
47
  "step": 244
48
  },
49
  {
@@ -60,9 +60,9 @@
60
  "eval_loss": 0.3442274332046509,
61
  "eval_precision": 0.8464828897338403,
62
  "eval_recall": 0.8756137479541735,
63
- "eval_runtime": 4.9511,
64
- "eval_samples_per_second": 80.588,
65
- "eval_steps_per_second": 10.099,
66
  "step": 366
67
  },
68
  {
@@ -79,9 +79,9 @@
79
  "eval_loss": 0.3736657500267029,
80
  "eval_precision": 0.8818924438393465,
81
  "eval_recall": 0.8740680123658847,
82
- "eval_runtime": 4.9528,
83
- "eval_samples_per_second": 80.56,
84
- "eval_steps_per_second": 10.095,
85
  "step": 488
86
  },
87
  {
@@ -98,9 +98,9 @@
98
  "eval_loss": 0.43064403533935547,
99
  "eval_precision": 0.8834928678678678,
100
  "eval_recall": 0.8715675577377705,
101
- "eval_runtime": 4.9624,
102
- "eval_samples_per_second": 80.405,
103
- "eval_steps_per_second": 10.076,
104
  "step": 610
105
  },
106
  {
@@ -117,9 +117,9 @@
117
  "eval_loss": 0.6448621153831482,
118
  "eval_precision": 0.8546209186496956,
119
  "eval_recall": 0.8884342607746863,
120
- "eval_runtime": 4.9531,
121
- "eval_samples_per_second": 80.556,
122
- "eval_steps_per_second": 10.095,
123
  "step": 732
124
  },
125
  {
@@ -136,9 +136,9 @@
136
  "eval_loss": 0.5595228672027588,
137
  "eval_precision": 0.8754297605404427,
138
  "eval_recall": 0.877295871976723,
139
- "eval_runtime": 4.9653,
140
- "eval_samples_per_second": 80.357,
141
- "eval_steps_per_second": 10.07,
142
  "step": 854
143
  },
144
  {
@@ -155,9 +155,9 @@
155
  "eval_loss": 0.6727907657623291,
156
  "eval_precision": 0.8686536646744258,
157
  "eval_recall": 0.8552009456264775,
158
- "eval_runtime": 4.9483,
159
- "eval_samples_per_second": 80.635,
160
- "eval_steps_per_second": 10.105,
161
  "step": 976
162
  },
163
  {
@@ -174,9 +174,9 @@
174
  "eval_loss": 0.6217536926269531,
175
  "eval_precision": 0.8977236138837015,
176
  "eval_recall": 0.8743862520458265,
177
- "eval_runtime": 4.9609,
178
- "eval_samples_per_second": 80.43,
179
- "eval_steps_per_second": 10.079,
180
  "step": 1098
181
  },
182
  {
@@ -193,9 +193,9 @@
193
  "eval_loss": 0.6576113104820251,
194
  "eval_precision": 0.8766227567773959,
195
  "eval_recall": 0.8587470449172576,
196
- "eval_runtime": 4.9593,
197
- "eval_samples_per_second": 80.455,
198
- "eval_steps_per_second": 10.082,
199
  "step": 1220
200
  },
201
  {
@@ -212,9 +212,9 @@
212
  "eval_loss": 0.7506579160690308,
213
  "eval_precision": 0.8940436639772188,
214
  "eval_recall": 0.8522913256955811,
215
- "eval_runtime": 4.9497,
216
- "eval_samples_per_second": 80.611,
217
- "eval_steps_per_second": 10.102,
218
  "step": 1342
219
  },
220
  {
@@ -231,9 +231,9 @@
231
  "eval_loss": 0.6859227418899536,
232
  "eval_precision": 0.8848766823362741,
233
  "eval_recall": 0.8622931442080378,
234
- "eval_runtime": 4.9227,
235
- "eval_samples_per_second": 81.053,
236
- "eval_steps_per_second": 10.157,
237
  "step": 1464
238
  },
239
  {
@@ -250,9 +250,9 @@
250
  "eval_loss": 0.6514401435852051,
251
  "eval_precision": 0.8903508771929824,
252
  "eval_recall": 0.8843880705582834,
253
- "eval_runtime": 4.9442,
254
- "eval_samples_per_second": 80.7,
255
- "eval_steps_per_second": 10.113,
256
  "step": 1586
257
  },
258
  {
@@ -269,9 +269,9 @@
269
  "eval_loss": 0.7604307532310486,
270
  "eval_precision": 0.8852261942423283,
271
  "eval_recall": 0.8690671031096563,
272
- "eval_runtime": 4.9491,
273
- "eval_samples_per_second": 80.62,
274
- "eval_steps_per_second": 10.103,
275
  "step": 1708
276
  },
277
  {
@@ -288,9 +288,9 @@
288
  "eval_loss": 0.7281515598297119,
289
  "eval_precision": 0.8874803397294746,
290
  "eval_recall": 0.8733406073831607,
291
- "eval_runtime": 4.9475,
292
- "eval_samples_per_second": 80.646,
293
- "eval_steps_per_second": 10.106,
294
  "step": 1830
295
  },
296
  {
@@ -307,9 +307,9 @@
307
  "eval_loss": 0.6987277269363403,
308
  "eval_precision": 0.8964912280701754,
309
  "eval_recall": 0.8904346244771777,
310
- "eval_runtime": 4.9546,
311
- "eval_samples_per_second": 80.531,
312
- "eval_steps_per_second": 10.092,
313
  "step": 1952
314
  },
315
  {
@@ -326,9 +326,9 @@
326
  "eval_loss": 0.7402216792106628,
327
  "eval_precision": 0.8897334834834836,
328
  "eval_recall": 0.8776141116566649,
329
- "eval_runtime": 4.977,
330
- "eval_samples_per_second": 80.17,
331
- "eval_steps_per_second": 10.046,
332
  "step": 2074
333
  },
334
  {
@@ -345,9 +345,9 @@
345
  "eval_loss": 0.7846499085426331,
346
  "eval_precision": 0.8719298245614036,
347
  "eval_recall": 0.8662484088016003,
348
- "eval_runtime": 4.9435,
349
- "eval_samples_per_second": 80.712,
350
- "eval_steps_per_second": 10.114,
351
  "step": 2196
352
  },
353
  {
@@ -364,9 +364,9 @@
364
  "eval_loss": 0.7948206067085266,
365
  "eval_precision": 0.8719298245614036,
366
  "eval_recall": 0.8662484088016003,
367
- "eval_runtime": 4.9539,
368
- "eval_samples_per_second": 80.542,
369
- "eval_steps_per_second": 10.093,
370
  "step": 2318
371
  },
372
  {
@@ -383,9 +383,9 @@
383
  "eval_loss": 0.7891051769256592,
384
  "eval_precision": 0.8795731707317074,
385
  "eval_recall": 0.8697945080923805,
386
- "eval_runtime": 4.9391,
387
- "eval_samples_per_second": 80.783,
388
- "eval_steps_per_second": 10.123,
389
  "step": 2440
390
  },
391
  {
@@ -393,9 +393,9 @@
393
  "step": 2440,
394
  "total_flos": 7584162436176000.0,
395
  "train_loss": 0.05962105130807298,
396
- "train_runtime": 2714.936,
397
- "train_samples_per_second": 26.8,
398
- "train_steps_per_second": 0.899
399
  }
400
  ],
401
  "logging_steps": 500,
 
22
  "eval_loss": 0.275076687335968,
23
  "eval_precision": 0.8473684210526315,
24
  "eval_recall": 0.8420621931260229,
25
+ "eval_runtime": 4.9569,
26
+ "eval_samples_per_second": 80.493,
27
+ "eval_steps_per_second": 10.087,
28
  "step": 122
29
  },
30
  {
 
41
  "eval_loss": 0.3036659359931946,
42
  "eval_precision": 0.8573529411764707,
43
  "eval_recall": 0.897708674304419,
44
+ "eval_runtime": 4.9408,
45
+ "eval_samples_per_second": 80.756,
46
+ "eval_steps_per_second": 10.12,
47
  "step": 244
48
  },
49
  {
 
60
  "eval_loss": 0.3442274332046509,
61
  "eval_precision": 0.8464828897338403,
62
  "eval_recall": 0.8756137479541735,
63
+ "eval_runtime": 4.9579,
64
+ "eval_samples_per_second": 80.478,
65
+ "eval_steps_per_second": 10.085,
66
  "step": 366
67
  },
68
  {
 
79
  "eval_loss": 0.3736657500267029,
80
  "eval_precision": 0.8818924438393465,
81
  "eval_recall": 0.8740680123658847,
82
+ "eval_runtime": 4.9699,
83
+ "eval_samples_per_second": 80.283,
84
+ "eval_steps_per_second": 10.061,
85
  "step": 488
86
  },
87
  {
 
98
  "eval_loss": 0.43064403533935547,
99
  "eval_precision": 0.8834928678678678,
100
  "eval_recall": 0.8715675577377705,
101
+ "eval_runtime": 4.9329,
102
+ "eval_samples_per_second": 80.886,
103
+ "eval_steps_per_second": 10.136,
104
  "step": 610
105
  },
106
  {
 
117
  "eval_loss": 0.6448621153831482,
118
  "eval_precision": 0.8546209186496956,
119
  "eval_recall": 0.8884342607746863,
120
+ "eval_runtime": 4.9504,
121
+ "eval_samples_per_second": 80.6,
122
+ "eval_steps_per_second": 10.1,
123
  "step": 732
124
  },
125
  {
 
136
  "eval_loss": 0.5595228672027588,
137
  "eval_precision": 0.8754297605404427,
138
  "eval_recall": 0.877295871976723,
139
+ "eval_runtime": 4.952,
140
+ "eval_samples_per_second": 80.574,
141
+ "eval_steps_per_second": 10.097,
142
  "step": 854
143
  },
144
  {
 
155
  "eval_loss": 0.6727907657623291,
156
  "eval_precision": 0.8686536646744258,
157
  "eval_recall": 0.8552009456264775,
158
+ "eval_runtime": 4.9909,
159
+ "eval_samples_per_second": 79.945,
160
+ "eval_steps_per_second": 10.018,
161
  "step": 976
162
  },
163
  {
 
174
  "eval_loss": 0.6217536926269531,
175
  "eval_precision": 0.8977236138837015,
176
  "eval_recall": 0.8743862520458265,
177
+ "eval_runtime": 4.9504,
178
+ "eval_samples_per_second": 80.6,
179
+ "eval_steps_per_second": 10.1,
180
  "step": 1098
181
  },
182
  {
 
193
  "eval_loss": 0.6576113104820251,
194
  "eval_precision": 0.8766227567773959,
195
  "eval_recall": 0.8587470449172576,
196
+ "eval_runtime": 4.9651,
197
+ "eval_samples_per_second": 80.361,
198
+ "eval_steps_per_second": 10.07,
199
  "step": 1220
200
  },
201
  {
 
212
  "eval_loss": 0.7506579160690308,
213
  "eval_precision": 0.8940436639772188,
214
  "eval_recall": 0.8522913256955811,
215
+ "eval_runtime": 4.9691,
216
+ "eval_samples_per_second": 80.296,
217
+ "eval_steps_per_second": 10.062,
218
  "step": 1342
219
  },
220
  {
 
231
  "eval_loss": 0.6859227418899536,
232
  "eval_precision": 0.8848766823362741,
233
  "eval_recall": 0.8622931442080378,
234
+ "eval_runtime": 4.9578,
235
+ "eval_samples_per_second": 80.48,
236
+ "eval_steps_per_second": 10.085,
237
  "step": 1464
238
  },
239
  {
 
250
  "eval_loss": 0.6514401435852051,
251
  "eval_precision": 0.8903508771929824,
252
  "eval_recall": 0.8843880705582834,
253
+ "eval_runtime": 4.9373,
254
+ "eval_samples_per_second": 80.813,
255
+ "eval_steps_per_second": 10.127,
256
  "step": 1586
257
  },
258
  {
 
269
  "eval_loss": 0.7604307532310486,
270
  "eval_precision": 0.8852261942423283,
271
  "eval_recall": 0.8690671031096563,
272
+ "eval_runtime": 4.9312,
273
+ "eval_samples_per_second": 80.913,
274
+ "eval_steps_per_second": 10.14,
275
  "step": 1708
276
  },
277
  {
 
288
  "eval_loss": 0.7281515598297119,
289
  "eval_precision": 0.8874803397294746,
290
  "eval_recall": 0.8733406073831607,
291
+ "eval_runtime": 4.9315,
292
+ "eval_samples_per_second": 80.909,
293
+ "eval_steps_per_second": 10.139,
294
  "step": 1830
295
  },
296
  {
 
307
  "eval_loss": 0.6987277269363403,
308
  "eval_precision": 0.8964912280701754,
309
  "eval_recall": 0.8904346244771777,
310
+ "eval_runtime": 4.9746,
311
+ "eval_samples_per_second": 80.207,
312
+ "eval_steps_per_second": 10.051,
313
  "step": 1952
314
  },
315
  {
 
326
  "eval_loss": 0.7402216792106628,
327
  "eval_precision": 0.8897334834834836,
328
  "eval_recall": 0.8776141116566649,
329
+ "eval_runtime": 4.9544,
330
+ "eval_samples_per_second": 80.535,
331
+ "eval_steps_per_second": 10.092,
332
  "step": 2074
333
  },
334
  {
 
345
  "eval_loss": 0.7846499085426331,
346
  "eval_precision": 0.8719298245614036,
347
  "eval_recall": 0.8662484088016003,
348
+ "eval_runtime": 4.9898,
349
+ "eval_samples_per_second": 79.962,
350
+ "eval_steps_per_second": 10.02,
351
  "step": 2196
352
  },
353
  {
 
364
  "eval_loss": 0.7948206067085266,
365
  "eval_precision": 0.8719298245614036,
366
  "eval_recall": 0.8662484088016003,
367
+ "eval_runtime": 4.9737,
368
+ "eval_samples_per_second": 80.222,
369
+ "eval_steps_per_second": 10.053,
370
  "step": 2318
371
  },
372
  {
 
383
  "eval_loss": 0.7891051769256592,
384
  "eval_precision": 0.8795731707317074,
385
  "eval_recall": 0.8697945080923805,
386
+ "eval_runtime": 4.9669,
387
+ "eval_samples_per_second": 80.331,
388
+ "eval_steps_per_second": 10.067,
389
  "step": 2440
390
  },
391
  {
 
393
  "step": 2440,
394
  "total_flos": 7584162436176000.0,
395
  "train_loss": 0.05962105130807298,
396
+ "train_runtime": 2691.1784,
397
+ "train_samples_per_second": 27.036,
398
+ "train_steps_per_second": 0.907
399
  }
400
  ],
401
  "logging_steps": 500,