apwic commited on
Commit
da71ae6
1 Parent(s): 2ca5986

End of training

Browse files
README.md CHANGED
@@ -1,4 +1,6 @@
1
  ---
 
 
2
  license: mit
3
  base_model: indolem/indobert-base-uncased
4
  tags:
 
1
  ---
2
+ language:
3
+ - id
4
  license: mit
5
  base_model: indolem/indobert-base-uncased
6
  tags:
all_results.json CHANGED
@@ -25,10 +25,10 @@
25
  "eval_overall_f1": 0.8432432432432433,
26
  "eval_overall_precision": 0.8020565552699229,
27
  "eval_overall_recall": 0.8888888888888888,
28
- "eval_runtime": 0.3857,
29
  "eval_samples": 187,
30
- "eval_samples_per_second": 484.856,
31
- "eval_steps_per_second": 7.778,
32
  "predict_LOCATION_f1": 0.9802955665024631,
33
  "predict_LOCATION_number": 202,
34
  "predict_LOCATION_precision": 0.9754901960784313,
@@ -54,12 +54,12 @@
54
  "predict_overall_f1": 0.9689089881288865,
55
  "predict_overall_precision": 0.9586129753914989,
56
  "predict_overall_recall": 0.9794285714285714,
57
- "predict_runtime": 0.9968,
58
- "predict_samples_per_second": 470.518,
59
- "predict_steps_per_second": 8.026,
60
  "train_loss": 0.07131878634668747,
61
- "train_runtime": 622.8213,
62
  "train_samples": 1688,
63
- "train_samples_per_second": 271.025,
64
- "train_steps_per_second": 17.019
65
  }
 
25
  "eval_overall_f1": 0.8432432432432433,
26
  "eval_overall_precision": 0.8020565552699229,
27
  "eval_overall_recall": 0.8888888888888888,
28
+ "eval_runtime": 0.3863,
29
  "eval_samples": 187,
30
+ "eval_samples_per_second": 484.082,
31
+ "eval_steps_per_second": 7.766,
32
  "predict_LOCATION_f1": 0.9802955665024631,
33
  "predict_LOCATION_number": 202,
34
  "predict_LOCATION_precision": 0.9754901960784313,
 
54
  "predict_overall_f1": 0.9689089881288865,
55
  "predict_overall_precision": 0.9586129753914989,
56
  "predict_overall_recall": 0.9794285714285714,
57
+ "predict_runtime": 0.9904,
58
+ "predict_samples_per_second": 473.541,
59
+ "predict_steps_per_second": 8.077,
60
  "train_loss": 0.07131878634668747,
61
+ "train_runtime": 621.5745,
62
  "train_samples": 1688,
63
+ "train_samples_per_second": 271.568,
64
+ "train_steps_per_second": 17.053
65
  }
eval_results.json CHANGED
@@ -25,8 +25,8 @@
25
  "eval_overall_f1": 0.8432432432432433,
26
  "eval_overall_precision": 0.8020565552699229,
27
  "eval_overall_recall": 0.8888888888888888,
28
- "eval_runtime": 0.3857,
29
  "eval_samples": 187,
30
- "eval_samples_per_second": 484.856,
31
- "eval_steps_per_second": 7.778
32
  }
 
25
  "eval_overall_f1": 0.8432432432432433,
26
  "eval_overall_precision": 0.8020565552699229,
27
  "eval_overall_recall": 0.8888888888888888,
28
+ "eval_runtime": 0.3863,
29
  "eval_samples": 187,
30
+ "eval_samples_per_second": 484.082,
31
+ "eval_steps_per_second": 7.766
32
  }
predict_results.json CHANGED
@@ -24,7 +24,7 @@
24
  "predict_overall_f1": 0.9689089881288865,
25
  "predict_overall_precision": 0.9586129753914989,
26
  "predict_overall_recall": 0.9794285714285714,
27
- "predict_runtime": 0.9968,
28
- "predict_samples_per_second": 470.518,
29
- "predict_steps_per_second": 8.026
30
  }
 
24
  "predict_overall_f1": 0.9689089881288865,
25
  "predict_overall_precision": 0.9586129753914989,
26
  "predict_overall_recall": 0.9794285714285714,
27
+ "predict_runtime": 0.9904,
28
+ "predict_samples_per_second": 473.541,
29
+ "predict_steps_per_second": 8.077
30
  }
runs/Jun04_09-15-08_a358b85c7679/events.out.tfevents.1717493143.a358b85c7679.596431.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee39ea2c05b986c465938a71d5f4ec9ac06b914655ad9b2fc113ddfbccba963e
3
+ size 1759
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 100.0,
3
  "train_loss": 0.07131878634668747,
4
- "train_runtime": 622.8213,
5
  "train_samples": 1688,
6
- "train_samples_per_second": 271.025,
7
- "train_steps_per_second": 17.019
8
  }
 
1
  {
2
  "epoch": 100.0,
3
  "train_loss": 0.07131878634668747,
4
+ "train_runtime": 621.5745,
5
  "train_samples": 1688,
6
+ "train_samples_per_second": 271.568,
7
+ "train_steps_per_second": 17.053
8
  }
trainer_state.json CHANGED
@@ -42,9 +42,9 @@
42
  "eval_overall_f1": 0.010416666666666668,
43
  "eval_overall_precision": 0.06060606060606061,
44
  "eval_overall_recall": 0.005698005698005698,
45
- "eval_runtime": 0.398,
46
- "eval_samples_per_second": 469.835,
47
- "eval_steps_per_second": 7.537,
48
  "step": 106
49
  },
50
  {
@@ -81,9 +81,9 @@
81
  "eval_overall_f1": 0.4402332361516035,
82
  "eval_overall_precision": 0.4507462686567164,
83
  "eval_overall_recall": 0.4301994301994302,
84
- "eval_runtime": 0.386,
85
- "eval_samples_per_second": 484.468,
86
- "eval_steps_per_second": 7.772,
87
  "step": 212
88
  },
89
  {
@@ -120,9 +120,9 @@
120
  "eval_overall_f1": 0.6755674232309746,
121
  "eval_overall_precision": 0.635678391959799,
122
  "eval_overall_recall": 0.7207977207977208,
123
- "eval_runtime": 0.3847,
124
- "eval_samples_per_second": 486.037,
125
- "eval_steps_per_second": 7.797,
126
  "step": 318
127
  },
128
  {
@@ -159,9 +159,9 @@
159
  "eval_overall_f1": 0.7506361323155216,
160
  "eval_overall_precision": 0.6781609195402298,
161
  "eval_overall_recall": 0.8404558404558404,
162
- "eval_runtime": 0.3877,
163
- "eval_samples_per_second": 482.308,
164
- "eval_steps_per_second": 7.738,
165
  "step": 424
166
  },
167
  {
@@ -198,9 +198,9 @@
198
  "eval_overall_f1": 0.7506361323155216,
199
  "eval_overall_precision": 0.6781609195402298,
200
  "eval_overall_recall": 0.8404558404558404,
201
- "eval_runtime": 0.3854,
202
- "eval_samples_per_second": 485.195,
203
- "eval_steps_per_second": 7.784,
204
  "step": 530
205
  },
206
  {
@@ -237,9 +237,9 @@
237
  "eval_overall_f1": 0.7652173913043478,
238
  "eval_overall_precision": 0.6784140969162996,
239
  "eval_overall_recall": 0.8774928774928775,
240
- "eval_runtime": 0.3878,
241
- "eval_samples_per_second": 482.177,
242
- "eval_steps_per_second": 7.735,
243
  "step": 636
244
  },
245
  {
@@ -276,9 +276,9 @@
276
  "eval_overall_f1": 0.7974025974025974,
277
  "eval_overall_precision": 0.7326968973747017,
278
  "eval_overall_recall": 0.8746438746438746,
279
- "eval_runtime": 0.3862,
280
- "eval_samples_per_second": 484.261,
281
- "eval_steps_per_second": 7.769,
282
  "step": 742
283
  },
284
  {
@@ -315,9 +315,9 @@
315
  "eval_overall_f1": 0.7943078913324709,
316
  "eval_overall_precision": 0.7274881516587678,
317
  "eval_overall_recall": 0.8746438746438746,
318
- "eval_runtime": 0.3852,
319
- "eval_samples_per_second": 485.507,
320
- "eval_steps_per_second": 7.789,
321
  "step": 848
322
  },
323
  {
@@ -354,9 +354,9 @@
354
  "eval_overall_f1": 0.8269484808454426,
355
  "eval_overall_precision": 0.770935960591133,
356
  "eval_overall_recall": 0.8917378917378918,
357
- "eval_runtime": 0.3849,
358
- "eval_samples_per_second": 485.83,
359
- "eval_steps_per_second": 7.794,
360
  "step": 954
361
  },
362
  {
@@ -393,9 +393,9 @@
393
  "eval_overall_f1": 0.8284182305630027,
394
  "eval_overall_precision": 0.7822784810126582,
395
  "eval_overall_recall": 0.8803418803418803,
396
- "eval_runtime": 0.3839,
397
- "eval_samples_per_second": 487.093,
398
- "eval_steps_per_second": 7.814,
399
  "step": 1060
400
  },
401
  {
@@ -432,9 +432,9 @@
432
  "eval_overall_f1": 0.8138297872340426,
433
  "eval_overall_precision": 0.7630922693266833,
434
  "eval_overall_recall": 0.8717948717948718,
435
- "eval_runtime": 0.3859,
436
- "eval_samples_per_second": 484.593,
437
- "eval_steps_per_second": 7.774,
438
  "step": 1166
439
  },
440
  {
@@ -471,9 +471,9 @@
471
  "eval_overall_f1": 0.8146214099216709,
472
  "eval_overall_precision": 0.7518072289156627,
473
  "eval_overall_recall": 0.8888888888888888,
474
- "eval_runtime": 0.3854,
475
- "eval_samples_per_second": 485.157,
476
- "eval_steps_per_second": 7.783,
477
  "step": 1272
478
  },
479
  {
@@ -510,9 +510,9 @@
510
  "eval_overall_f1": 0.8255659121171771,
511
  "eval_overall_precision": 0.775,
512
  "eval_overall_recall": 0.8831908831908832,
513
- "eval_runtime": 0.3861,
514
- "eval_samples_per_second": 484.32,
515
- "eval_steps_per_second": 7.77,
516
  "step": 1378
517
  },
518
  {
@@ -549,9 +549,9 @@
549
  "eval_overall_f1": 0.807843137254902,
550
  "eval_overall_precision": 0.7463768115942029,
551
  "eval_overall_recall": 0.8803418803418803,
552
- "eval_runtime": 0.3849,
553
- "eval_samples_per_second": 485.803,
554
- "eval_steps_per_second": 7.794,
555
  "step": 1484
556
  },
557
  {
@@ -588,9 +588,9 @@
588
  "eval_overall_f1": 0.8284182305630027,
589
  "eval_overall_precision": 0.7822784810126582,
590
  "eval_overall_recall": 0.8803418803418803,
591
- "eval_runtime": 0.3921,
592
- "eval_samples_per_second": 476.967,
593
- "eval_steps_per_second": 7.652,
594
  "step": 1590
595
  },
596
  {
@@ -627,9 +627,9 @@
627
  "eval_overall_f1": 0.8333333333333334,
628
  "eval_overall_precision": 0.7888040712468194,
629
  "eval_overall_recall": 0.8831908831908832,
630
- "eval_runtime": 0.3926,
631
- "eval_samples_per_second": 476.356,
632
- "eval_steps_per_second": 7.642,
633
  "step": 1696
634
  },
635
  {
@@ -666,9 +666,9 @@
666
  "eval_overall_f1": 0.8398384925975775,
667
  "eval_overall_precision": 0.7959183673469388,
668
  "eval_overall_recall": 0.8888888888888888,
669
- "eval_runtime": 0.3867,
670
- "eval_samples_per_second": 483.521,
671
- "eval_steps_per_second": 7.757,
672
  "step": 1802
673
  },
674
  {
@@ -705,9 +705,9 @@
705
  "eval_overall_f1": 0.8279569892473119,
706
  "eval_overall_precision": 0.7837150127226463,
707
  "eval_overall_recall": 0.8774928774928775,
708
- "eval_runtime": 0.3875,
709
- "eval_samples_per_second": 482.589,
710
- "eval_steps_per_second": 7.742,
711
  "step": 1908
712
  },
713
  {
@@ -744,9 +744,9 @@
744
  "eval_overall_f1": 0.8371467025572006,
745
  "eval_overall_precision": 0.7933673469387755,
746
  "eval_overall_recall": 0.886039886039886,
747
- "eval_runtime": 0.3917,
748
- "eval_samples_per_second": 477.449,
749
- "eval_steps_per_second": 7.66,
750
  "step": 2014
751
  },
752
  {
@@ -783,9 +783,9 @@
783
  "eval_overall_f1": 0.8364611260053618,
784
  "eval_overall_precision": 0.789873417721519,
785
  "eval_overall_recall": 0.8888888888888888,
786
- "eval_runtime": 0.3853,
787
- "eval_samples_per_second": 485.372,
788
- "eval_steps_per_second": 7.787,
789
  "step": 2120
790
  },
791
  {
@@ -822,9 +822,9 @@
822
  "eval_overall_f1": 0.8348993288590604,
823
  "eval_overall_precision": 0.7893401015228426,
824
  "eval_overall_recall": 0.886039886039886,
825
- "eval_runtime": 0.3889,
826
- "eval_samples_per_second": 480.805,
827
- "eval_steps_per_second": 7.713,
828
  "step": 2226
829
  },
830
  {
@@ -861,9 +861,9 @@
861
  "eval_overall_f1": 0.8378378378378378,
862
  "eval_overall_precision": 0.7969151670951157,
863
  "eval_overall_recall": 0.8831908831908832,
864
- "eval_runtime": 0.3894,
865
- "eval_samples_per_second": 480.224,
866
- "eval_steps_per_second": 7.704,
867
  "step": 2332
868
  },
869
  {
@@ -900,9 +900,9 @@
900
  "eval_overall_f1": 0.8502024291497975,
901
  "eval_overall_precision": 0.8076923076923077,
902
  "eval_overall_recall": 0.8974358974358975,
903
- "eval_runtime": 0.3909,
904
- "eval_samples_per_second": 478.381,
905
- "eval_steps_per_second": 7.675,
906
  "step": 2438
907
  },
908
  {
@@ -939,9 +939,9 @@
939
  "eval_overall_f1": 0.8449197860962567,
940
  "eval_overall_precision": 0.7959697732997482,
941
  "eval_overall_recall": 0.9002849002849003,
942
- "eval_runtime": 0.3873,
943
- "eval_samples_per_second": 482.826,
944
- "eval_steps_per_second": 7.746,
945
  "step": 2544
946
  },
947
  {
@@ -978,9 +978,9 @@
978
  "eval_overall_f1": 0.8266666666666667,
979
  "eval_overall_precision": 0.7769423558897243,
980
  "eval_overall_recall": 0.8831908831908832,
981
- "eval_runtime": 0.3857,
982
- "eval_samples_per_second": 484.853,
983
- "eval_steps_per_second": 7.778,
984
  "step": 2650
985
  },
986
  {
@@ -1017,9 +1017,9 @@
1017
  "eval_overall_f1": 0.8225806451612903,
1018
  "eval_overall_precision": 0.7786259541984732,
1019
  "eval_overall_recall": 0.8717948717948718,
1020
- "eval_runtime": 0.386,
1021
- "eval_samples_per_second": 484.512,
1022
- "eval_steps_per_second": 7.773,
1023
  "step": 2756
1024
  },
1025
  {
@@ -1056,9 +1056,9 @@
1056
  "eval_overall_f1": 0.8253968253968255,
1057
  "eval_overall_precision": 0.7703703703703704,
1058
  "eval_overall_recall": 0.8888888888888888,
1059
- "eval_runtime": 0.3902,
1060
- "eval_samples_per_second": 479.247,
1061
- "eval_steps_per_second": 7.688,
1062
  "step": 2862
1063
  },
1064
  {
@@ -1095,9 +1095,9 @@
1095
  "eval_overall_f1": 0.8287292817679558,
1096
  "eval_overall_precision": 0.8042895442359249,
1097
  "eval_overall_recall": 0.8547008547008547,
1098
- "eval_runtime": 0.3858,
1099
- "eval_samples_per_second": 484.693,
1100
- "eval_steps_per_second": 7.776,
1101
  "step": 2968
1102
  },
1103
  {
@@ -1134,9 +1134,9 @@
1134
  "eval_overall_f1": 0.8532608695652173,
1135
  "eval_overall_precision": 0.8155844155844156,
1136
  "eval_overall_recall": 0.8945868945868946,
1137
- "eval_runtime": 0.3861,
1138
- "eval_samples_per_second": 484.295,
1139
- "eval_steps_per_second": 7.769,
1140
  "step": 3074
1141
  },
1142
  {
@@ -1173,9 +1173,9 @@
1173
  "eval_overall_f1": 0.8423913043478262,
1174
  "eval_overall_precision": 0.8051948051948052,
1175
  "eval_overall_recall": 0.8831908831908832,
1176
- "eval_runtime": 0.3879,
1177
- "eval_samples_per_second": 482.094,
1178
- "eval_steps_per_second": 7.734,
1179
  "step": 3180
1180
  },
1181
  {
@@ -1212,9 +1212,9 @@
1212
  "eval_overall_f1": 0.8367071524966261,
1213
  "eval_overall_precision": 0.7948717948717948,
1214
  "eval_overall_recall": 0.8831908831908832,
1215
- "eval_runtime": 0.3914,
1216
- "eval_samples_per_second": 477.78,
1217
- "eval_steps_per_second": 7.665,
1218
  "step": 3286
1219
  },
1220
  {
@@ -1251,9 +1251,9 @@
1251
  "eval_overall_f1": 0.824468085106383,
1252
  "eval_overall_precision": 0.773067331670823,
1253
  "eval_overall_recall": 0.8831908831908832,
1254
- "eval_runtime": 0.3886,
1255
- "eval_samples_per_second": 481.274,
1256
- "eval_steps_per_second": 7.721,
1257
  "step": 3392
1258
  },
1259
  {
@@ -1290,9 +1290,9 @@
1290
  "eval_overall_f1": 0.8389715832205684,
1291
  "eval_overall_precision": 0.7989690721649485,
1292
  "eval_overall_recall": 0.8831908831908832,
1293
- "eval_runtime": 0.3876,
1294
- "eval_samples_per_second": 482.477,
1295
- "eval_steps_per_second": 7.74,
1296
  "step": 3498
1297
  },
1298
  {
@@ -1329,9 +1329,9 @@
1329
  "eval_overall_f1": 0.8466757123473541,
1330
  "eval_overall_precision": 0.8082901554404145,
1331
  "eval_overall_recall": 0.8888888888888888,
1332
- "eval_runtime": 0.3867,
1333
- "eval_samples_per_second": 483.635,
1334
- "eval_steps_per_second": 7.759,
1335
  "step": 3604
1336
  },
1337
  {
@@ -1368,9 +1368,9 @@
1368
  "eval_overall_f1": 0.8346883468834689,
1369
  "eval_overall_precision": 0.7958656330749354,
1370
  "eval_overall_recall": 0.8774928774928775,
1371
- "eval_runtime": 0.3911,
1372
- "eval_samples_per_second": 478.197,
1373
- "eval_steps_per_second": 7.672,
1374
  "step": 3710
1375
  },
1376
  {
@@ -1407,9 +1407,9 @@
1407
  "eval_overall_f1": 0.8273092369477911,
1408
  "eval_overall_precision": 0.7803030303030303,
1409
  "eval_overall_recall": 0.8803418803418803,
1410
- "eval_runtime": 0.3868,
1411
- "eval_samples_per_second": 483.41,
1412
- "eval_steps_per_second": 7.755,
1413
  "step": 3816
1414
  },
1415
  {
@@ -1446,9 +1446,9 @@
1446
  "eval_overall_f1": 0.8279569892473119,
1447
  "eval_overall_precision": 0.7837150127226463,
1448
  "eval_overall_recall": 0.8774928774928775,
1449
- "eval_runtime": 0.3874,
1450
- "eval_samples_per_second": 482.655,
1451
- "eval_steps_per_second": 7.743,
1452
  "step": 3922
1453
  },
1454
  {
@@ -1485,9 +1485,9 @@
1485
  "eval_overall_f1": 0.8342541436464089,
1486
  "eval_overall_precision": 0.8096514745308311,
1487
  "eval_overall_recall": 0.8603988603988604,
1488
- "eval_runtime": 0.3876,
1489
- "eval_samples_per_second": 482.503,
1490
- "eval_steps_per_second": 7.741,
1491
  "step": 4028
1492
  },
1493
  {
@@ -1524,9 +1524,9 @@
1524
  "eval_overall_f1": 0.8355795148247979,
1525
  "eval_overall_precision": 0.7928388746803069,
1526
  "eval_overall_recall": 0.8831908831908832,
1527
- "eval_runtime": 0.3886,
1528
- "eval_samples_per_second": 481.159,
1529
- "eval_steps_per_second": 7.719,
1530
  "step": 4134
1531
  },
1532
  {
@@ -1563,9 +1563,9 @@
1563
  "eval_overall_f1": 0.8304405874499333,
1564
  "eval_overall_precision": 0.7814070351758794,
1565
  "eval_overall_recall": 0.886039886039886,
1566
- "eval_runtime": 0.3881,
1567
- "eval_samples_per_second": 481.816,
1568
- "eval_steps_per_second": 7.73,
1569
  "step": 4240
1570
  },
1571
  {
@@ -1602,9 +1602,9 @@
1602
  "eval_overall_f1": 0.8266666666666667,
1603
  "eval_overall_precision": 0.7769423558897243,
1604
  "eval_overall_recall": 0.8831908831908832,
1605
- "eval_runtime": 0.3878,
1606
- "eval_samples_per_second": 482.196,
1607
- "eval_steps_per_second": 7.736,
1608
  "step": 4346
1609
  },
1610
  {
@@ -1641,9 +1641,9 @@
1641
  "eval_overall_f1": 0.8385345997286296,
1642
  "eval_overall_precision": 0.8005181347150259,
1643
  "eval_overall_recall": 0.8803418803418803,
1644
- "eval_runtime": 0.3855,
1645
- "eval_samples_per_second": 485.113,
1646
- "eval_steps_per_second": 7.783,
1647
  "step": 4452
1648
  },
1649
  {
@@ -1680,9 +1680,9 @@
1680
  "eval_overall_f1": 0.8259109311740892,
1681
  "eval_overall_precision": 0.7846153846153846,
1682
  "eval_overall_recall": 0.8717948717948718,
1683
- "eval_runtime": 0.3848,
1684
- "eval_samples_per_second": 486.006,
1685
- "eval_steps_per_second": 7.797,
1686
  "step": 4558
1687
  },
1688
  {
@@ -1719,9 +1719,9 @@
1719
  "eval_overall_f1": 0.8512960436562074,
1720
  "eval_overall_precision": 0.8167539267015707,
1721
  "eval_overall_recall": 0.8888888888888888,
1722
- "eval_runtime": 0.3855,
1723
- "eval_samples_per_second": 485.134,
1724
- "eval_steps_per_second": 7.783,
1725
  "step": 4664
1726
  },
1727
  {
@@ -1758,9 +1758,9 @@
1758
  "eval_overall_f1": 0.850415512465374,
1759
  "eval_overall_precision": 0.8274932614555256,
1760
  "eval_overall_recall": 0.8746438746438746,
1761
- "eval_runtime": 0.3877,
1762
- "eval_samples_per_second": 482.27,
1763
- "eval_steps_per_second": 7.737,
1764
  "step": 4770
1765
  },
1766
  {
@@ -1797,9 +1797,9 @@
1797
  "eval_overall_f1": 0.8602739726027397,
1798
  "eval_overall_precision": 0.8284960422163589,
1799
  "eval_overall_recall": 0.8945868945868946,
1800
- "eval_runtime": 0.3876,
1801
- "eval_samples_per_second": 482.517,
1802
- "eval_steps_per_second": 7.741,
1803
  "step": 4876
1804
  },
1805
  {
@@ -1836,9 +1836,9 @@
1836
  "eval_overall_f1": 0.8540540540540541,
1837
  "eval_overall_precision": 0.8123393316195373,
1838
  "eval_overall_recall": 0.9002849002849003,
1839
- "eval_runtime": 0.3866,
1840
- "eval_samples_per_second": 483.755,
1841
- "eval_steps_per_second": 7.761,
1842
  "step": 4982
1843
  },
1844
  {
@@ -1875,9 +1875,9 @@
1875
  "eval_overall_f1": 0.8415300546448087,
1876
  "eval_overall_precision": 0.8083989501312336,
1877
  "eval_overall_recall": 0.8774928774928775,
1878
- "eval_runtime": 0.3865,
1879
- "eval_samples_per_second": 483.867,
1880
- "eval_steps_per_second": 7.763,
1881
  "step": 5088
1882
  },
1883
  {
@@ -1914,9 +1914,9 @@
1914
  "eval_overall_f1": 0.8602442333785618,
1915
  "eval_overall_precision": 0.8212435233160622,
1916
  "eval_overall_recall": 0.9031339031339032,
1917
- "eval_runtime": 0.3869,
1918
- "eval_samples_per_second": 483.349,
1919
- "eval_steps_per_second": 7.754,
1920
  "step": 5194
1921
  },
1922
  {
@@ -1953,9 +1953,9 @@
1953
  "eval_overall_f1": 0.8571428571428573,
1954
  "eval_overall_precision": 0.8203125,
1955
  "eval_overall_recall": 0.8974358974358975,
1956
- "eval_runtime": 0.3879,
1957
- "eval_samples_per_second": 482.064,
1958
- "eval_steps_per_second": 7.734,
1959
  "step": 5300
1960
  },
1961
  {
@@ -1992,9 +1992,9 @@
1992
  "eval_overall_f1": 0.8405405405405405,
1993
  "eval_overall_precision": 0.7994858611825193,
1994
  "eval_overall_recall": 0.886039886039886,
1995
- "eval_runtime": 0.3863,
1996
- "eval_samples_per_second": 484.101,
1997
- "eval_steps_per_second": 7.766,
1998
  "step": 5406
1999
  },
2000
  {
@@ -2031,9 +2031,9 @@
2031
  "eval_overall_f1": 0.8498659517426275,
2032
  "eval_overall_precision": 0.8025316455696202,
2033
  "eval_overall_recall": 0.9031339031339032,
2034
- "eval_runtime": 0.3866,
2035
- "eval_samples_per_second": 483.708,
2036
- "eval_steps_per_second": 7.76,
2037
  "step": 5512
2038
  },
2039
  {
@@ -2070,9 +2070,9 @@
2070
  "eval_overall_f1": 0.8517520215633424,
2071
  "eval_overall_precision": 0.8081841432225064,
2072
  "eval_overall_recall": 0.9002849002849003,
2073
- "eval_runtime": 0.3859,
2074
- "eval_samples_per_second": 484.521,
2075
- "eval_steps_per_second": 7.773,
2076
  "step": 5618
2077
  },
2078
  {
@@ -2109,9 +2109,9 @@
2109
  "eval_overall_f1": 0.8497970230040596,
2110
  "eval_overall_precision": 0.8092783505154639,
2111
  "eval_overall_recall": 0.8945868945868946,
2112
- "eval_runtime": 0.3852,
2113
- "eval_samples_per_second": 485.517,
2114
- "eval_steps_per_second": 7.789,
2115
  "step": 5724
2116
  },
2117
  {
@@ -2148,9 +2148,9 @@
2148
  "eval_overall_f1": 0.8313090418353576,
2149
  "eval_overall_precision": 0.7897435897435897,
2150
  "eval_overall_recall": 0.8774928774928775,
2151
- "eval_runtime": 0.3848,
2152
- "eval_samples_per_second": 485.964,
2153
- "eval_steps_per_second": 7.796,
2154
  "step": 5830
2155
  },
2156
  {
@@ -2187,9 +2187,9 @@
2187
  "eval_overall_f1": 0.840381991814461,
2188
  "eval_overall_precision": 0.806282722513089,
2189
  "eval_overall_recall": 0.8774928774928775,
2190
- "eval_runtime": 0.3864,
2191
- "eval_samples_per_second": 483.981,
2192
- "eval_steps_per_second": 7.764,
2193
  "step": 5936
2194
  },
2195
  {
@@ -2226,9 +2226,9 @@
2226
  "eval_overall_f1": 0.8516483516483517,
2227
  "eval_overall_precision": 0.8222811671087533,
2228
  "eval_overall_recall": 0.8831908831908832,
2229
- "eval_runtime": 0.3879,
2230
- "eval_samples_per_second": 482.058,
2231
- "eval_steps_per_second": 7.734,
2232
  "step": 6042
2233
  },
2234
  {
@@ -2265,9 +2265,9 @@
2265
  "eval_overall_f1": 0.8358208955223881,
2266
  "eval_overall_precision": 0.7979274611398963,
2267
  "eval_overall_recall": 0.8774928774928775,
2268
- "eval_runtime": 0.3884,
2269
- "eval_samples_per_second": 481.478,
2270
- "eval_steps_per_second": 7.724,
2271
  "step": 6148
2272
  },
2273
  {
@@ -2304,9 +2304,9 @@
2304
  "eval_overall_f1": 0.8474114441416893,
2305
  "eval_overall_precision": 0.8120104438642297,
2306
  "eval_overall_recall": 0.886039886039886,
2307
- "eval_runtime": 0.3866,
2308
- "eval_samples_per_second": 483.696,
2309
- "eval_steps_per_second": 7.76,
2310
  "step": 6254
2311
  },
2312
  {
@@ -2343,9 +2343,9 @@
2343
  "eval_overall_f1": 0.8528610354223433,
2344
  "eval_overall_precision": 0.8172323759791122,
2345
  "eval_overall_recall": 0.8917378917378918,
2346
- "eval_runtime": 0.3856,
2347
- "eval_samples_per_second": 484.992,
2348
- "eval_steps_per_second": 7.781,
2349
  "step": 6360
2350
  },
2351
  {
@@ -2382,9 +2382,9 @@
2382
  "eval_overall_f1": 0.8322147651006713,
2383
  "eval_overall_precision": 0.7868020304568528,
2384
  "eval_overall_recall": 0.8831908831908832,
2385
- "eval_runtime": 0.3885,
2386
- "eval_samples_per_second": 481.387,
2387
- "eval_steps_per_second": 7.723,
2388
  "step": 6466
2389
  },
2390
  {
@@ -2421,9 +2421,9 @@
2421
  "eval_overall_f1": 0.8524590163934426,
2422
  "eval_overall_precision": 0.8188976377952756,
2423
  "eval_overall_recall": 0.8888888888888888,
2424
- "eval_runtime": 0.3895,
2425
- "eval_samples_per_second": 480.151,
2426
- "eval_steps_per_second": 7.703,
2427
  "step": 6572
2428
  },
2429
  {
@@ -2460,9 +2460,9 @@
2460
  "eval_overall_f1": 0.8555858310626703,
2461
  "eval_overall_precision": 0.8198433420365535,
2462
  "eval_overall_recall": 0.8945868945868946,
2463
- "eval_runtime": 0.3869,
2464
- "eval_samples_per_second": 483.389,
2465
- "eval_steps_per_second": 7.755,
2466
  "step": 6678
2467
  },
2468
  {
@@ -2499,9 +2499,9 @@
2499
  "eval_overall_f1": 0.8324175824175825,
2500
  "eval_overall_precision": 0.8037135278514589,
2501
  "eval_overall_recall": 0.8632478632478633,
2502
- "eval_runtime": 0.3879,
2503
- "eval_samples_per_second": 482.096,
2504
- "eval_steps_per_second": 7.734,
2505
  "step": 6784
2506
  },
2507
  {
@@ -2538,9 +2538,9 @@
2538
  "eval_overall_f1": 0.8435374149659863,
2539
  "eval_overall_precision": 0.8072916666666666,
2540
  "eval_overall_recall": 0.8831908831908832,
2541
- "eval_runtime": 0.3875,
2542
- "eval_samples_per_second": 482.599,
2543
- "eval_steps_per_second": 7.742,
2544
  "step": 6890
2545
  },
2546
  {
@@ -2577,9 +2577,9 @@
2577
  "eval_overall_f1": 0.845945945945946,
2578
  "eval_overall_precision": 0.8046272493573264,
2579
  "eval_overall_recall": 0.8917378917378918,
2580
- "eval_runtime": 0.3869,
2581
- "eval_samples_per_second": 483.358,
2582
- "eval_steps_per_second": 7.754,
2583
  "step": 6996
2584
  },
2585
  {
@@ -2616,9 +2616,9 @@
2616
  "eval_overall_f1": 0.8367626886145405,
2617
  "eval_overall_precision": 0.8068783068783069,
2618
  "eval_overall_recall": 0.8689458689458689,
2619
- "eval_runtime": 0.3869,
2620
- "eval_samples_per_second": 483.332,
2621
- "eval_steps_per_second": 7.754,
2622
  "step": 7102
2623
  },
2624
  {
@@ -2655,9 +2655,9 @@
2655
  "eval_overall_f1": 0.8392370572207084,
2656
  "eval_overall_precision": 0.804177545691906,
2657
  "eval_overall_recall": 0.8774928774928775,
2658
- "eval_runtime": 0.3881,
2659
- "eval_samples_per_second": 481.831,
2660
- "eval_steps_per_second": 7.73,
2661
  "step": 7208
2662
  },
2663
  {
@@ -2694,9 +2694,9 @@
2694
  "eval_overall_f1": 0.8455284552845528,
2695
  "eval_overall_precision": 0.8062015503875969,
2696
  "eval_overall_recall": 0.8888888888888888,
2697
- "eval_runtime": 0.3858,
2698
- "eval_samples_per_second": 484.678,
2699
- "eval_steps_per_second": 7.776,
2700
  "step": 7314
2701
  },
2702
  {
@@ -2733,9 +2733,9 @@
2733
  "eval_overall_f1": 0.8462585034013606,
2734
  "eval_overall_precision": 0.8098958333333334,
2735
  "eval_overall_recall": 0.886039886039886,
2736
- "eval_runtime": 0.3854,
2737
- "eval_samples_per_second": 485.205,
2738
- "eval_steps_per_second": 7.784,
2739
  "step": 7420
2740
  },
2741
  {
@@ -2772,9 +2772,9 @@
2772
  "eval_overall_f1": 0.8571428571428573,
2773
  "eval_overall_precision": 0.8203125,
2774
  "eval_overall_recall": 0.8974358974358975,
2775
- "eval_runtime": 0.3874,
2776
- "eval_samples_per_second": 482.652,
2777
- "eval_steps_per_second": 7.743,
2778
  "step": 7526
2779
  },
2780
  {
@@ -2811,9 +2811,9 @@
2811
  "eval_overall_f1": 0.8365122615803815,
2812
  "eval_overall_precision": 0.8015665796344648,
2813
  "eval_overall_recall": 0.8746438746438746,
2814
- "eval_runtime": 0.3877,
2815
- "eval_samples_per_second": 482.314,
2816
- "eval_steps_per_second": 7.738,
2817
  "step": 7632
2818
  },
2819
  {
@@ -2850,9 +2850,9 @@
2850
  "eval_overall_f1": 0.8501362397820162,
2851
  "eval_overall_precision": 0.814621409921671,
2852
  "eval_overall_recall": 0.8888888888888888,
2853
- "eval_runtime": 0.3856,
2854
- "eval_samples_per_second": 484.921,
2855
- "eval_steps_per_second": 7.779,
2856
  "step": 7738
2857
  },
2858
  {
@@ -2889,9 +2889,9 @@
2889
  "eval_overall_f1": 0.8532235939643347,
2890
  "eval_overall_precision": 0.8227513227513228,
2891
  "eval_overall_recall": 0.886039886039886,
2892
- "eval_runtime": 0.3872,
2893
- "eval_samples_per_second": 482.9,
2894
- "eval_steps_per_second": 7.747,
2895
  "step": 7844
2896
  },
2897
  {
@@ -2928,9 +2928,9 @@
2928
  "eval_overall_f1": 0.8532608695652173,
2929
  "eval_overall_precision": 0.8155844155844156,
2930
  "eval_overall_recall": 0.8945868945868946,
2931
- "eval_runtime": 0.3855,
2932
- "eval_samples_per_second": 485.067,
2933
- "eval_steps_per_second": 7.782,
2934
  "step": 7950
2935
  },
2936
  {
@@ -2967,8 +2967,8 @@
2967
  "eval_overall_f1": 0.8544474393530996,
2968
  "eval_overall_precision": 0.8107416879795396,
2969
  "eval_overall_recall": 0.9031339031339032,
2970
- "eval_runtime": 0.3869,
2971
- "eval_samples_per_second": 483.365,
2972
  "eval_steps_per_second": 7.755,
2973
  "step": 8056
2974
  },
@@ -3006,9 +3006,9 @@
3006
  "eval_overall_f1": 0.8517006802721088,
3007
  "eval_overall_precision": 0.8151041666666666,
3008
  "eval_overall_recall": 0.8917378917378918,
3009
- "eval_runtime": 0.3948,
3010
- "eval_samples_per_second": 473.674,
3011
- "eval_steps_per_second": 7.599,
3012
  "step": 8162
3013
  },
3014
  {
@@ -3045,9 +3045,9 @@
3045
  "eval_overall_f1": 0.854368932038835,
3046
  "eval_overall_precision": 0.8324324324324325,
3047
  "eval_overall_recall": 0.8774928774928775,
3048
- "eval_runtime": 0.3858,
3049
- "eval_samples_per_second": 484.686,
3050
- "eval_steps_per_second": 7.776,
3051
  "step": 8268
3052
  },
3053
  {
@@ -3084,9 +3084,9 @@
3084
  "eval_overall_f1": 0.8401084010840107,
3085
  "eval_overall_precision": 0.8010335917312662,
3086
  "eval_overall_recall": 0.8831908831908832,
3087
- "eval_runtime": 0.3867,
3088
- "eval_samples_per_second": 483.59,
3089
- "eval_steps_per_second": 7.758,
3090
  "step": 8374
3091
  },
3092
  {
@@ -3123,9 +3123,9 @@
3123
  "eval_overall_f1": 0.854794520547945,
3124
  "eval_overall_precision": 0.8232189973614775,
3125
  "eval_overall_recall": 0.8888888888888888,
3126
- "eval_runtime": 0.3871,
3127
- "eval_samples_per_second": 483.069,
3128
- "eval_steps_per_second": 7.75,
3129
  "step": 8480
3130
  },
3131
  {
@@ -3162,9 +3162,9 @@
3162
  "eval_overall_f1": 0.8451086956521738,
3163
  "eval_overall_precision": 0.8077922077922078,
3164
  "eval_overall_recall": 0.886039886039886,
3165
- "eval_runtime": 0.3874,
3166
- "eval_samples_per_second": 482.691,
3167
- "eval_steps_per_second": 7.744,
3168
  "step": 8586
3169
  },
3170
  {
@@ -3201,9 +3201,9 @@
3201
  "eval_overall_f1": 0.8485675306957708,
3202
  "eval_overall_precision": 0.8141361256544503,
3203
  "eval_overall_recall": 0.886039886039886,
3204
- "eval_runtime": 0.3861,
3205
- "eval_samples_per_second": 484.302,
3206
- "eval_steps_per_second": 7.77,
3207
  "step": 8692
3208
  },
3209
  {
@@ -3240,9 +3240,9 @@
3240
  "eval_overall_f1": 0.8373983739837397,
3241
  "eval_overall_precision": 0.7984496124031008,
3242
  "eval_overall_recall": 0.8803418803418803,
3243
- "eval_runtime": 0.3873,
3244
- "eval_samples_per_second": 482.882,
3245
- "eval_steps_per_second": 7.747,
3246
  "step": 8798
3247
  },
3248
  {
@@ -3279,9 +3279,9 @@
3279
  "eval_overall_f1": 0.8398384925975775,
3280
  "eval_overall_precision": 0.7959183673469388,
3281
  "eval_overall_recall": 0.8888888888888888,
3282
- "eval_runtime": 0.3876,
3283
- "eval_samples_per_second": 482.481,
3284
- "eval_steps_per_second": 7.74,
3285
  "step": 8904
3286
  },
3287
  {
@@ -3318,9 +3318,9 @@
3318
  "eval_overall_f1": 0.8412483039348712,
3319
  "eval_overall_precision": 0.8031088082901554,
3320
  "eval_overall_recall": 0.8831908831908832,
3321
- "eval_runtime": 0.392,
3322
- "eval_samples_per_second": 477.052,
3323
- "eval_steps_per_second": 7.653,
3324
  "step": 9010
3325
  },
3326
  {
@@ -3357,9 +3357,9 @@
3357
  "eval_overall_f1": 0.8493150684931507,
3358
  "eval_overall_precision": 0.8179419525065963,
3359
  "eval_overall_recall": 0.8831908831908832,
3360
- "eval_runtime": 0.3875,
3361
- "eval_samples_per_second": 482.525,
3362
- "eval_steps_per_second": 7.741,
3363
  "step": 9116
3364
  },
3365
  {
@@ -3396,9 +3396,9 @@
3396
  "eval_overall_f1": 0.844804318488529,
3397
  "eval_overall_precision": 0.8025641025641026,
3398
  "eval_overall_recall": 0.8917378917378918,
3399
- "eval_runtime": 0.3876,
3400
- "eval_samples_per_second": 482.435,
3401
- "eval_steps_per_second": 7.74,
3402
  "step": 9222
3403
  },
3404
  {
@@ -3435,9 +3435,9 @@
3435
  "eval_overall_f1": 0.8443843031123139,
3436
  "eval_overall_precision": 0.8041237113402062,
3437
  "eval_overall_recall": 0.8888888888888888,
3438
- "eval_runtime": 0.3861,
3439
- "eval_samples_per_second": 484.269,
3440
- "eval_steps_per_second": 7.769,
3441
  "step": 9328
3442
  },
3443
  {
@@ -3474,9 +3474,9 @@
3474
  "eval_overall_f1": 0.8394062078272606,
3475
  "eval_overall_precision": 0.7974358974358975,
3476
  "eval_overall_recall": 0.886039886039886,
3477
- "eval_runtime": 0.3874,
3478
- "eval_samples_per_second": 482.728,
3479
- "eval_steps_per_second": 7.744,
3480
  "step": 9434
3481
  },
3482
  {
@@ -3513,9 +3513,9 @@
3513
  "eval_overall_f1": 0.8478260869565218,
3514
  "eval_overall_precision": 0.8103896103896104,
3515
  "eval_overall_recall": 0.8888888888888888,
3516
- "eval_runtime": 0.3896,
3517
- "eval_samples_per_second": 480.006,
3518
- "eval_steps_per_second": 7.701,
3519
  "step": 9540
3520
  },
3521
  {
@@ -3552,9 +3552,9 @@
3552
  "eval_overall_f1": 0.8466757123473541,
3553
  "eval_overall_precision": 0.8082901554404145,
3554
  "eval_overall_recall": 0.8888888888888888,
3555
- "eval_runtime": 0.39,
3556
- "eval_samples_per_second": 479.51,
3557
- "eval_steps_per_second": 7.693,
3558
  "step": 9646
3559
  },
3560
  {
@@ -3591,9 +3591,9 @@
3591
  "eval_overall_f1": 0.8505434782608695,
3592
  "eval_overall_precision": 0.812987012987013,
3593
  "eval_overall_recall": 0.8917378917378918,
3594
- "eval_runtime": 0.3921,
3595
- "eval_samples_per_second": 476.865,
3596
- "eval_steps_per_second": 7.65,
3597
  "step": 9752
3598
  },
3599
  {
@@ -3630,9 +3630,9 @@
3630
  "eval_overall_f1": 0.8497970230040596,
3631
  "eval_overall_precision": 0.8092783505154639,
3632
  "eval_overall_recall": 0.8945868945868946,
3633
- "eval_runtime": 0.3933,
3634
- "eval_samples_per_second": 475.405,
3635
- "eval_steps_per_second": 7.627,
3636
  "step": 9858
3637
  },
3638
  {
@@ -3669,9 +3669,9 @@
3669
  "eval_overall_f1": 0.8470906630581868,
3670
  "eval_overall_precision": 0.8067010309278351,
3671
  "eval_overall_recall": 0.8917378917378918,
3672
- "eval_runtime": 0.394,
3673
- "eval_samples_per_second": 474.646,
3674
- "eval_steps_per_second": 7.615,
3675
  "step": 9964
3676
  },
3677
  {
@@ -3708,9 +3708,9 @@
3708
  "eval_overall_f1": 0.8493894165535957,
3709
  "eval_overall_precision": 0.810880829015544,
3710
  "eval_overall_recall": 0.8917378917378918,
3711
- "eval_runtime": 0.3923,
3712
- "eval_samples_per_second": 476.645,
3713
- "eval_steps_per_second": 7.647,
3714
  "step": 10070
3715
  },
3716
  {
@@ -3747,9 +3747,9 @@
3747
  "eval_overall_f1": 0.8416779431664412,
3748
  "eval_overall_precision": 0.8015463917525774,
3749
  "eval_overall_recall": 0.886039886039886,
3750
- "eval_runtime": 0.3899,
3751
- "eval_samples_per_second": 479.554,
3752
- "eval_steps_per_second": 7.693,
3753
  "step": 10176
3754
  },
3755
  {
@@ -3786,9 +3786,9 @@
3786
  "eval_overall_f1": 0.8466757123473541,
3787
  "eval_overall_precision": 0.8082901554404145,
3788
  "eval_overall_recall": 0.8888888888888888,
3789
- "eval_runtime": 0.3979,
3790
- "eval_samples_per_second": 469.952,
3791
- "eval_steps_per_second": 7.539,
3792
  "step": 10282
3793
  },
3794
  {
@@ -3825,9 +3825,9 @@
3825
  "eval_overall_f1": 0.8443843031123139,
3826
  "eval_overall_precision": 0.8041237113402062,
3827
  "eval_overall_recall": 0.8888888888888888,
3828
- "eval_runtime": 0.3908,
3829
- "eval_samples_per_second": 478.561,
3830
- "eval_steps_per_second": 7.677,
3831
  "step": 10388
3832
  },
3833
  {
@@ -3864,9 +3864,9 @@
3864
  "eval_overall_f1": 0.8443843031123139,
3865
  "eval_overall_precision": 0.8041237113402062,
3866
  "eval_overall_recall": 0.8888888888888888,
3867
- "eval_runtime": 0.3928,
3868
- "eval_samples_per_second": 476.04,
3869
- "eval_steps_per_second": 7.637,
3870
  "step": 10494
3871
  },
3872
  {
@@ -3903,9 +3903,9 @@
3903
  "eval_overall_f1": 0.8432432432432433,
3904
  "eval_overall_precision": 0.8020565552699229,
3905
  "eval_overall_recall": 0.8888888888888888,
3906
- "eval_runtime": 0.3916,
3907
- "eval_samples_per_second": 477.569,
3908
- "eval_steps_per_second": 7.662,
3909
  "step": 10600
3910
  },
3911
  {
@@ -3913,9 +3913,9 @@
3913
  "step": 10600,
3914
  "total_flos": 5043631411410816.0,
3915
  "train_loss": 0.07131878634668747,
3916
- "train_runtime": 622.8213,
3917
- "train_samples_per_second": 271.025,
3918
- "train_steps_per_second": 17.019
3919
  }
3920
  ],
3921
  "logging_steps": 500,
 
42
  "eval_overall_f1": 0.010416666666666668,
43
  "eval_overall_precision": 0.06060606060606061,
44
  "eval_overall_recall": 0.005698005698005698,
45
+ "eval_runtime": 0.3862,
46
+ "eval_samples_per_second": 484.243,
47
+ "eval_steps_per_second": 7.769,
48
  "step": 106
49
  },
50
  {
 
81
  "eval_overall_f1": 0.4402332361516035,
82
  "eval_overall_precision": 0.4507462686567164,
83
  "eval_overall_recall": 0.4301994301994302,
84
+ "eval_runtime": 0.3854,
85
+ "eval_samples_per_second": 485.184,
86
+ "eval_steps_per_second": 7.784,
87
  "step": 212
88
  },
89
  {
 
120
  "eval_overall_f1": 0.6755674232309746,
121
  "eval_overall_precision": 0.635678391959799,
122
  "eval_overall_recall": 0.7207977207977208,
123
+ "eval_runtime": 0.3874,
124
+ "eval_samples_per_second": 482.736,
125
+ "eval_steps_per_second": 7.744,
126
  "step": 318
127
  },
128
  {
 
159
  "eval_overall_f1": 0.7506361323155216,
160
  "eval_overall_precision": 0.6781609195402298,
161
  "eval_overall_recall": 0.8404558404558404,
162
+ "eval_runtime": 0.386,
163
+ "eval_samples_per_second": 484.418,
164
+ "eval_steps_per_second": 7.771,
165
  "step": 424
166
  },
167
  {
 
198
  "eval_overall_f1": 0.7506361323155216,
199
  "eval_overall_precision": 0.6781609195402298,
200
  "eval_overall_recall": 0.8404558404558404,
201
+ "eval_runtime": 0.3888,
202
+ "eval_samples_per_second": 480.92,
203
+ "eval_steps_per_second": 7.715,
204
  "step": 530
205
  },
206
  {
 
237
  "eval_overall_f1": 0.7652173913043478,
238
  "eval_overall_precision": 0.6784140969162996,
239
  "eval_overall_recall": 0.8774928774928775,
240
+ "eval_runtime": 0.3887,
241
+ "eval_samples_per_second": 481.105,
242
+ "eval_steps_per_second": 7.718,
243
  "step": 636
244
  },
245
  {
 
276
  "eval_overall_f1": 0.7974025974025974,
277
  "eval_overall_precision": 0.7326968973747017,
278
  "eval_overall_recall": 0.8746438746438746,
279
+ "eval_runtime": 0.3888,
280
+ "eval_samples_per_second": 481.015,
281
+ "eval_steps_per_second": 7.717,
282
  "step": 742
283
  },
284
  {
 
315
  "eval_overall_f1": 0.7943078913324709,
316
  "eval_overall_precision": 0.7274881516587678,
317
  "eval_overall_recall": 0.8746438746438746,
318
+ "eval_runtime": 0.3896,
319
+ "eval_samples_per_second": 479.969,
320
+ "eval_steps_per_second": 7.7,
321
  "step": 848
322
  },
323
  {
 
354
  "eval_overall_f1": 0.8269484808454426,
355
  "eval_overall_precision": 0.770935960591133,
356
  "eval_overall_recall": 0.8917378917378918,
357
+ "eval_runtime": 0.3907,
358
+ "eval_samples_per_second": 478.642,
359
+ "eval_steps_per_second": 7.679,
360
  "step": 954
361
  },
362
  {
 
393
  "eval_overall_f1": 0.8284182305630027,
394
  "eval_overall_precision": 0.7822784810126582,
395
  "eval_overall_recall": 0.8803418803418803,
396
+ "eval_runtime": 0.3875,
397
+ "eval_samples_per_second": 482.56,
398
+ "eval_steps_per_second": 7.742,
399
  "step": 1060
400
  },
401
  {
 
432
  "eval_overall_f1": 0.8138297872340426,
433
  "eval_overall_precision": 0.7630922693266833,
434
  "eval_overall_recall": 0.8717948717948718,
435
+ "eval_runtime": 0.3856,
436
+ "eval_samples_per_second": 484.897,
437
+ "eval_steps_per_second": 7.779,
438
  "step": 1166
439
  },
440
  {
 
471
  "eval_overall_f1": 0.8146214099216709,
472
  "eval_overall_precision": 0.7518072289156627,
473
  "eval_overall_recall": 0.8888888888888888,
474
+ "eval_runtime": 0.3856,
475
+ "eval_samples_per_second": 484.965,
476
+ "eval_steps_per_second": 7.78,
477
  "step": 1272
478
  },
479
  {
 
510
  "eval_overall_f1": 0.8255659121171771,
511
  "eval_overall_precision": 0.775,
512
  "eval_overall_recall": 0.8831908831908832,
513
+ "eval_runtime": 0.3838,
514
+ "eval_samples_per_second": 487.205,
515
+ "eval_steps_per_second": 7.816,
516
  "step": 1378
517
  },
518
  {
 
549
  "eval_overall_f1": 0.807843137254902,
550
  "eval_overall_precision": 0.7463768115942029,
551
  "eval_overall_recall": 0.8803418803418803,
552
+ "eval_runtime": 0.3863,
553
+ "eval_samples_per_second": 484.097,
554
+ "eval_steps_per_second": 7.766,
555
  "step": 1484
556
  },
557
  {
 
588
  "eval_overall_f1": 0.8284182305630027,
589
  "eval_overall_precision": 0.7822784810126582,
590
  "eval_overall_recall": 0.8803418803418803,
591
+ "eval_runtime": 0.3835,
592
+ "eval_samples_per_second": 487.585,
593
+ "eval_steps_per_second": 7.822,
594
  "step": 1590
595
  },
596
  {
 
627
  "eval_overall_f1": 0.8333333333333334,
628
  "eval_overall_precision": 0.7888040712468194,
629
  "eval_overall_recall": 0.8831908831908832,
630
+ "eval_runtime": 0.3837,
631
+ "eval_samples_per_second": 487.337,
632
+ "eval_steps_per_second": 7.818,
633
  "step": 1696
634
  },
635
  {
 
666
  "eval_overall_f1": 0.8398384925975775,
667
  "eval_overall_precision": 0.7959183673469388,
668
  "eval_overall_recall": 0.8888888888888888,
669
+ "eval_runtime": 0.3851,
670
+ "eval_samples_per_second": 485.53,
671
+ "eval_steps_per_second": 7.789,
672
  "step": 1802
673
  },
674
  {
 
705
  "eval_overall_f1": 0.8279569892473119,
706
  "eval_overall_precision": 0.7837150127226463,
707
  "eval_overall_recall": 0.8774928774928775,
708
+ "eval_runtime": 0.3852,
709
+ "eval_samples_per_second": 485.425,
710
+ "eval_steps_per_second": 7.788,
711
  "step": 1908
712
  },
713
  {
 
744
  "eval_overall_f1": 0.8371467025572006,
745
  "eval_overall_precision": 0.7933673469387755,
746
  "eval_overall_recall": 0.886039886039886,
747
+ "eval_runtime": 0.3833,
748
+ "eval_samples_per_second": 487.824,
749
+ "eval_steps_per_second": 7.826,
750
  "step": 2014
751
  },
752
  {
 
783
  "eval_overall_f1": 0.8364611260053618,
784
  "eval_overall_precision": 0.789873417721519,
785
  "eval_overall_recall": 0.8888888888888888,
786
+ "eval_runtime": 0.3837,
787
+ "eval_samples_per_second": 487.366,
788
+ "eval_steps_per_second": 7.819,
789
  "step": 2120
790
  },
791
  {
 
822
  "eval_overall_f1": 0.8348993288590604,
823
  "eval_overall_precision": 0.7893401015228426,
824
  "eval_overall_recall": 0.886039886039886,
825
+ "eval_runtime": 0.3836,
826
+ "eval_samples_per_second": 487.45,
827
+ "eval_steps_per_second": 7.82,
828
  "step": 2226
829
  },
830
  {
 
861
  "eval_overall_f1": 0.8378378378378378,
862
  "eval_overall_precision": 0.7969151670951157,
863
  "eval_overall_recall": 0.8831908831908832,
864
+ "eval_runtime": 0.3851,
865
+ "eval_samples_per_second": 485.564,
866
+ "eval_steps_per_second": 7.79,
867
  "step": 2332
868
  },
869
  {
 
900
  "eval_overall_f1": 0.8502024291497975,
901
  "eval_overall_precision": 0.8076923076923077,
902
  "eval_overall_recall": 0.8974358974358975,
903
+ "eval_runtime": 0.3866,
904
+ "eval_samples_per_second": 483.721,
905
+ "eval_steps_per_second": 7.76,
906
  "step": 2438
907
  },
908
  {
 
939
  "eval_overall_f1": 0.8449197860962567,
940
  "eval_overall_precision": 0.7959697732997482,
941
  "eval_overall_recall": 0.9002849002849003,
942
+ "eval_runtime": 0.3896,
943
+ "eval_samples_per_second": 479.933,
944
+ "eval_steps_per_second": 7.699,
945
  "step": 2544
946
  },
947
  {
 
978
  "eval_overall_f1": 0.8266666666666667,
979
  "eval_overall_precision": 0.7769423558897243,
980
  "eval_overall_recall": 0.8831908831908832,
981
+ "eval_runtime": 0.3874,
982
+ "eval_samples_per_second": 482.751,
983
+ "eval_steps_per_second": 7.745,
984
  "step": 2650
985
  },
986
  {
 
1017
  "eval_overall_f1": 0.8225806451612903,
1018
  "eval_overall_precision": 0.7786259541984732,
1019
  "eval_overall_recall": 0.8717948717948718,
1020
+ "eval_runtime": 0.3851,
1021
+ "eval_samples_per_second": 485.534,
1022
+ "eval_steps_per_second": 7.789,
1023
  "step": 2756
1024
  },
1025
  {
 
1056
  "eval_overall_f1": 0.8253968253968255,
1057
  "eval_overall_precision": 0.7703703703703704,
1058
  "eval_overall_recall": 0.8888888888888888,
1059
+ "eval_runtime": 0.3833,
1060
+ "eval_samples_per_second": 487.887,
1061
+ "eval_steps_per_second": 7.827,
1062
  "step": 2862
1063
  },
1064
  {
 
1095
  "eval_overall_f1": 0.8287292817679558,
1096
  "eval_overall_precision": 0.8042895442359249,
1097
  "eval_overall_recall": 0.8547008547008547,
1098
+ "eval_runtime": 0.3862,
1099
+ "eval_samples_per_second": 484.155,
1100
+ "eval_steps_per_second": 7.767,
1101
  "step": 2968
1102
  },
1103
  {
 
1134
  "eval_overall_f1": 0.8532608695652173,
1135
  "eval_overall_precision": 0.8155844155844156,
1136
  "eval_overall_recall": 0.8945868945868946,
1137
+ "eval_runtime": 0.3854,
1138
+ "eval_samples_per_second": 485.171,
1139
+ "eval_steps_per_second": 7.783,
1140
  "step": 3074
1141
  },
1142
  {
 
1173
  "eval_overall_f1": 0.8423913043478262,
1174
  "eval_overall_precision": 0.8051948051948052,
1175
  "eval_overall_recall": 0.8831908831908832,
1176
+ "eval_runtime": 0.3861,
1177
+ "eval_samples_per_second": 484.356,
1178
+ "eval_steps_per_second": 7.77,
1179
  "step": 3180
1180
  },
1181
  {
 
1212
  "eval_overall_f1": 0.8367071524966261,
1213
  "eval_overall_precision": 0.7948717948717948,
1214
  "eval_overall_recall": 0.8831908831908832,
1215
+ "eval_runtime": 0.3844,
1216
+ "eval_samples_per_second": 486.52,
1217
+ "eval_steps_per_second": 7.805,
1218
  "step": 3286
1219
  },
1220
  {
 
1251
  "eval_overall_f1": 0.824468085106383,
1252
  "eval_overall_precision": 0.773067331670823,
1253
  "eval_overall_recall": 0.8831908831908832,
1254
+ "eval_runtime": 0.3854,
1255
+ "eval_samples_per_second": 485.203,
1256
+ "eval_steps_per_second": 7.784,
1257
  "step": 3392
1258
  },
1259
  {
 
1290
  "eval_overall_f1": 0.8389715832205684,
1291
  "eval_overall_precision": 0.7989690721649485,
1292
  "eval_overall_recall": 0.8831908831908832,
1293
+ "eval_runtime": 0.3862,
1294
+ "eval_samples_per_second": 484.264,
1295
+ "eval_steps_per_second": 7.769,
1296
  "step": 3498
1297
  },
1298
  {
 
1329
  "eval_overall_f1": 0.8466757123473541,
1330
  "eval_overall_precision": 0.8082901554404145,
1331
  "eval_overall_recall": 0.8888888888888888,
1332
+ "eval_runtime": 0.3852,
1333
+ "eval_samples_per_second": 485.414,
1334
+ "eval_steps_per_second": 7.787,
1335
  "step": 3604
1336
  },
1337
  {
 
1368
  "eval_overall_f1": 0.8346883468834689,
1369
  "eval_overall_precision": 0.7958656330749354,
1370
  "eval_overall_recall": 0.8774928774928775,
1371
+ "eval_runtime": 0.3862,
1372
+ "eval_samples_per_second": 484.19,
1373
+ "eval_steps_per_second": 7.768,
1374
  "step": 3710
1375
  },
1376
  {
 
1407
  "eval_overall_f1": 0.8273092369477911,
1408
  "eval_overall_precision": 0.7803030303030303,
1409
  "eval_overall_recall": 0.8803418803418803,
1410
+ "eval_runtime": 0.3864,
1411
+ "eval_samples_per_second": 483.938,
1412
+ "eval_steps_per_second": 7.764,
1413
  "step": 3816
1414
  },
1415
  {
 
1446
  "eval_overall_f1": 0.8279569892473119,
1447
  "eval_overall_precision": 0.7837150127226463,
1448
  "eval_overall_recall": 0.8774928774928775,
1449
+ "eval_runtime": 0.3877,
1450
+ "eval_samples_per_second": 482.325,
1451
+ "eval_steps_per_second": 7.738,
1452
  "step": 3922
1453
  },
1454
  {
 
1485
  "eval_overall_f1": 0.8342541436464089,
1486
  "eval_overall_precision": 0.8096514745308311,
1487
  "eval_overall_recall": 0.8603988603988604,
1488
+ "eval_runtime": 0.3858,
1489
+ "eval_samples_per_second": 484.723,
1490
+ "eval_steps_per_second": 7.776,
1491
  "step": 4028
1492
  },
1493
  {
 
1524
  "eval_overall_f1": 0.8355795148247979,
1525
  "eval_overall_precision": 0.7928388746803069,
1526
  "eval_overall_recall": 0.8831908831908832,
1527
+ "eval_runtime": 0.394,
1528
+ "eval_samples_per_second": 474.609,
1529
+ "eval_steps_per_second": 7.614,
1530
  "step": 4134
1531
  },
1532
  {
 
1563
  "eval_overall_f1": 0.8304405874499333,
1564
  "eval_overall_precision": 0.7814070351758794,
1565
  "eval_overall_recall": 0.886039886039886,
1566
+ "eval_runtime": 0.3873,
1567
+ "eval_samples_per_second": 482.792,
1568
+ "eval_steps_per_second": 7.745,
1569
  "step": 4240
1570
  },
1571
  {
 
1602
  "eval_overall_f1": 0.8266666666666667,
1603
  "eval_overall_precision": 0.7769423558897243,
1604
  "eval_overall_recall": 0.8831908831908832,
1605
+ "eval_runtime": 0.3855,
1606
+ "eval_samples_per_second": 485.071,
1607
+ "eval_steps_per_second": 7.782,
1608
  "step": 4346
1609
  },
1610
  {
 
1641
  "eval_overall_f1": 0.8385345997286296,
1642
  "eval_overall_precision": 0.8005181347150259,
1643
  "eval_overall_recall": 0.8803418803418803,
1644
+ "eval_runtime": 0.3852,
1645
+ "eval_samples_per_second": 485.429,
1646
+ "eval_steps_per_second": 7.788,
1647
  "step": 4452
1648
  },
1649
  {
 
1680
  "eval_overall_f1": 0.8259109311740892,
1681
  "eval_overall_precision": 0.7846153846153846,
1682
  "eval_overall_recall": 0.8717948717948718,
1683
+ "eval_runtime": 0.3873,
1684
+ "eval_samples_per_second": 482.887,
1685
+ "eval_steps_per_second": 7.747,
1686
  "step": 4558
1687
  },
1688
  {
 
1719
  "eval_overall_f1": 0.8512960436562074,
1720
  "eval_overall_precision": 0.8167539267015707,
1721
  "eval_overall_recall": 0.8888888888888888,
1722
+ "eval_runtime": 0.3853,
1723
+ "eval_samples_per_second": 485.335,
1724
+ "eval_steps_per_second": 7.786,
1725
  "step": 4664
1726
  },
1727
  {
 
1758
  "eval_overall_f1": 0.850415512465374,
1759
  "eval_overall_precision": 0.8274932614555256,
1760
  "eval_overall_recall": 0.8746438746438746,
1761
+ "eval_runtime": 0.3871,
1762
+ "eval_samples_per_second": 483.034,
1763
+ "eval_steps_per_second": 7.749,
1764
  "step": 4770
1765
  },
1766
  {
 
1797
  "eval_overall_f1": 0.8602739726027397,
1798
  "eval_overall_precision": 0.8284960422163589,
1799
  "eval_overall_recall": 0.8945868945868946,
1800
+ "eval_runtime": 0.3856,
1801
+ "eval_samples_per_second": 484.938,
1802
+ "eval_steps_per_second": 7.78,
1803
  "step": 4876
1804
  },
1805
  {
 
1836
  "eval_overall_f1": 0.8540540540540541,
1837
  "eval_overall_precision": 0.8123393316195373,
1838
  "eval_overall_recall": 0.9002849002849003,
1839
+ "eval_runtime": 0.3872,
1840
+ "eval_samples_per_second": 482.907,
1841
+ "eval_steps_per_second": 7.747,
1842
  "step": 4982
1843
  },
1844
  {
 
1875
  "eval_overall_f1": 0.8415300546448087,
1876
  "eval_overall_precision": 0.8083989501312336,
1877
  "eval_overall_recall": 0.8774928774928775,
1878
+ "eval_runtime": 0.3834,
1879
+ "eval_samples_per_second": 487.749,
1880
+ "eval_steps_per_second": 7.825,
1881
  "step": 5088
1882
  },
1883
  {
 
1914
  "eval_overall_f1": 0.8602442333785618,
1915
  "eval_overall_precision": 0.8212435233160622,
1916
  "eval_overall_recall": 0.9031339031339032,
1917
+ "eval_runtime": 0.3863,
1918
+ "eval_samples_per_second": 484.136,
1919
+ "eval_steps_per_second": 7.767,
1920
  "step": 5194
1921
  },
1922
  {
 
1953
  "eval_overall_f1": 0.8571428571428573,
1954
  "eval_overall_precision": 0.8203125,
1955
  "eval_overall_recall": 0.8974358974358975,
1956
+ "eval_runtime": 0.3897,
1957
+ "eval_samples_per_second": 479.861,
1958
+ "eval_steps_per_second": 7.698,
1959
  "step": 5300
1960
  },
1961
  {
 
1992
  "eval_overall_f1": 0.8405405405405405,
1993
  "eval_overall_precision": 0.7994858611825193,
1994
  "eval_overall_recall": 0.886039886039886,
1995
+ "eval_runtime": 0.3875,
1996
+ "eval_samples_per_second": 482.58,
1997
+ "eval_steps_per_second": 7.742,
1998
  "step": 5406
1999
  },
2000
  {
 
2031
  "eval_overall_f1": 0.8498659517426275,
2032
  "eval_overall_precision": 0.8025316455696202,
2033
  "eval_overall_recall": 0.9031339031339032,
2034
+ "eval_runtime": 0.3872,
2035
+ "eval_samples_per_second": 483.005,
2036
+ "eval_steps_per_second": 7.749,
2037
  "step": 5512
2038
  },
2039
  {
 
2070
  "eval_overall_f1": 0.8517520215633424,
2071
  "eval_overall_precision": 0.8081841432225064,
2072
  "eval_overall_recall": 0.9002849002849003,
2073
+ "eval_runtime": 0.387,
2074
+ "eval_samples_per_second": 483.151,
2075
+ "eval_steps_per_second": 7.751,
2076
  "step": 5618
2077
  },
2078
  {
 
2109
  "eval_overall_f1": 0.8497970230040596,
2110
  "eval_overall_precision": 0.8092783505154639,
2111
  "eval_overall_recall": 0.8945868945868946,
2112
+ "eval_runtime": 0.385,
2113
+ "eval_samples_per_second": 485.707,
2114
+ "eval_steps_per_second": 7.792,
2115
  "step": 5724
2116
  },
2117
  {
 
2148
  "eval_overall_f1": 0.8313090418353576,
2149
  "eval_overall_precision": 0.7897435897435897,
2150
  "eval_overall_recall": 0.8774928774928775,
2151
+ "eval_runtime": 0.3857,
2152
+ "eval_samples_per_second": 484.839,
2153
+ "eval_steps_per_second": 7.778,
2154
  "step": 5830
2155
  },
2156
  {
 
2187
  "eval_overall_f1": 0.840381991814461,
2188
  "eval_overall_precision": 0.806282722513089,
2189
  "eval_overall_recall": 0.8774928774928775,
2190
+ "eval_runtime": 0.3861,
2191
+ "eval_samples_per_second": 484.373,
2192
+ "eval_steps_per_second": 7.771,
2193
  "step": 5936
2194
  },
2195
  {
 
2226
  "eval_overall_f1": 0.8516483516483517,
2227
  "eval_overall_precision": 0.8222811671087533,
2228
  "eval_overall_recall": 0.8831908831908832,
2229
+ "eval_runtime": 0.3872,
2230
+ "eval_samples_per_second": 482.965,
2231
+ "eval_steps_per_second": 7.748,
2232
  "step": 6042
2233
  },
2234
  {
 
2265
  "eval_overall_f1": 0.8358208955223881,
2266
  "eval_overall_precision": 0.7979274611398963,
2267
  "eval_overall_recall": 0.8774928774928775,
2268
+ "eval_runtime": 0.3844,
2269
+ "eval_samples_per_second": 486.46,
2270
+ "eval_steps_per_second": 7.804,
2271
  "step": 6148
2272
  },
2273
  {
 
2304
  "eval_overall_f1": 0.8474114441416893,
2305
  "eval_overall_precision": 0.8120104438642297,
2306
  "eval_overall_recall": 0.886039886039886,
2307
+ "eval_runtime": 0.3865,
2308
+ "eval_samples_per_second": 483.887,
2309
+ "eval_steps_per_second": 7.763,
2310
  "step": 6254
2311
  },
2312
  {
 
2343
  "eval_overall_f1": 0.8528610354223433,
2344
  "eval_overall_precision": 0.8172323759791122,
2345
  "eval_overall_recall": 0.8917378917378918,
2346
+ "eval_runtime": 0.3845,
2347
+ "eval_samples_per_second": 486.366,
2348
+ "eval_steps_per_second": 7.803,
2349
  "step": 6360
2350
  },
2351
  {
 
2382
  "eval_overall_f1": 0.8322147651006713,
2383
  "eval_overall_precision": 0.7868020304568528,
2384
  "eval_overall_recall": 0.8831908831908832,
2385
+ "eval_runtime": 0.3866,
2386
+ "eval_samples_per_second": 483.688,
2387
+ "eval_steps_per_second": 7.76,
2388
  "step": 6466
2389
  },
2390
  {
 
2421
  "eval_overall_f1": 0.8524590163934426,
2422
  "eval_overall_precision": 0.8188976377952756,
2423
  "eval_overall_recall": 0.8888888888888888,
2424
+ "eval_runtime": 0.3851,
2425
+ "eval_samples_per_second": 485.634,
2426
+ "eval_steps_per_second": 7.791,
2427
  "step": 6572
2428
  },
2429
  {
 
2460
  "eval_overall_f1": 0.8555858310626703,
2461
  "eval_overall_precision": 0.8198433420365535,
2462
  "eval_overall_recall": 0.8945868945868946,
2463
+ "eval_runtime": 0.3875,
2464
+ "eval_samples_per_second": 482.637,
2465
+ "eval_steps_per_second": 7.743,
2466
  "step": 6678
2467
  },
2468
  {
 
2499
  "eval_overall_f1": 0.8324175824175825,
2500
  "eval_overall_precision": 0.8037135278514589,
2501
  "eval_overall_recall": 0.8632478632478633,
2502
+ "eval_runtime": 0.3842,
2503
+ "eval_samples_per_second": 486.754,
2504
+ "eval_steps_per_second": 7.809,
2505
  "step": 6784
2506
  },
2507
  {
 
2538
  "eval_overall_f1": 0.8435374149659863,
2539
  "eval_overall_precision": 0.8072916666666666,
2540
  "eval_overall_recall": 0.8831908831908832,
2541
+ "eval_runtime": 0.3854,
2542
+ "eval_samples_per_second": 485.217,
2543
+ "eval_steps_per_second": 7.784,
2544
  "step": 6890
2545
  },
2546
  {
 
2577
  "eval_overall_f1": 0.845945945945946,
2578
  "eval_overall_precision": 0.8046272493573264,
2579
  "eval_overall_recall": 0.8917378917378918,
2580
+ "eval_runtime": 0.3859,
2581
+ "eval_samples_per_second": 484.618,
2582
+ "eval_steps_per_second": 7.775,
2583
  "step": 6996
2584
  },
2585
  {
 
2616
  "eval_overall_f1": 0.8367626886145405,
2617
  "eval_overall_precision": 0.8068783068783069,
2618
  "eval_overall_recall": 0.8689458689458689,
2619
+ "eval_runtime": 0.3883,
2620
+ "eval_samples_per_second": 481.631,
2621
+ "eval_steps_per_second": 7.727,
2622
  "step": 7102
2623
  },
2624
  {
 
2655
  "eval_overall_f1": 0.8392370572207084,
2656
  "eval_overall_precision": 0.804177545691906,
2657
  "eval_overall_recall": 0.8774928774928775,
2658
+ "eval_runtime": 0.3857,
2659
+ "eval_samples_per_second": 484.796,
2660
+ "eval_steps_per_second": 7.777,
2661
  "step": 7208
2662
  },
2663
  {
 
2694
  "eval_overall_f1": 0.8455284552845528,
2695
  "eval_overall_precision": 0.8062015503875969,
2696
  "eval_overall_recall": 0.8888888888888888,
2697
+ "eval_runtime": 0.3855,
2698
+ "eval_samples_per_second": 485.143,
2699
+ "eval_steps_per_second": 7.783,
2700
  "step": 7314
2701
  },
2702
  {
 
2733
  "eval_overall_f1": 0.8462585034013606,
2734
  "eval_overall_precision": 0.8098958333333334,
2735
  "eval_overall_recall": 0.886039886039886,
2736
+ "eval_runtime": 0.3882,
2737
+ "eval_samples_per_second": 481.683,
2738
+ "eval_steps_per_second": 7.728,
2739
  "step": 7420
2740
  },
2741
  {
 
2772
  "eval_overall_f1": 0.8571428571428573,
2773
  "eval_overall_precision": 0.8203125,
2774
  "eval_overall_recall": 0.8974358974358975,
2775
+ "eval_runtime": 0.389,
2776
+ "eval_samples_per_second": 480.776,
2777
+ "eval_steps_per_second": 7.713,
2778
  "step": 7526
2779
  },
2780
  {
 
2811
  "eval_overall_f1": 0.8365122615803815,
2812
  "eval_overall_precision": 0.8015665796344648,
2813
  "eval_overall_recall": 0.8746438746438746,
2814
+ "eval_runtime": 0.3865,
2815
+ "eval_samples_per_second": 483.842,
2816
+ "eval_steps_per_second": 7.762,
2817
  "step": 7632
2818
  },
2819
  {
 
2850
  "eval_overall_f1": 0.8501362397820162,
2851
  "eval_overall_precision": 0.814621409921671,
2852
  "eval_overall_recall": 0.8888888888888888,
2853
+ "eval_runtime": 0.3874,
2854
+ "eval_samples_per_second": 482.759,
2855
+ "eval_steps_per_second": 7.745,
2856
  "step": 7738
2857
  },
2858
  {
 
2889
  "eval_overall_f1": 0.8532235939643347,
2890
  "eval_overall_precision": 0.8227513227513228,
2891
  "eval_overall_recall": 0.886039886039886,
2892
+ "eval_runtime": 0.3863,
2893
+ "eval_samples_per_second": 484.063,
2894
+ "eval_steps_per_second": 7.766,
2895
  "step": 7844
2896
  },
2897
  {
 
2928
  "eval_overall_f1": 0.8532608695652173,
2929
  "eval_overall_precision": 0.8155844155844156,
2930
  "eval_overall_recall": 0.8945868945868946,
2931
+ "eval_runtime": 0.3884,
2932
+ "eval_samples_per_second": 481.456,
2933
+ "eval_steps_per_second": 7.724,
2934
  "step": 7950
2935
  },
2936
  {
 
2967
  "eval_overall_f1": 0.8544474393530996,
2968
  "eval_overall_precision": 0.8107416879795396,
2969
  "eval_overall_recall": 0.9031339031339032,
2970
+ "eval_runtime": 0.3868,
2971
+ "eval_samples_per_second": 483.423,
2972
  "eval_steps_per_second": 7.755,
2973
  "step": 8056
2974
  },
 
3006
  "eval_overall_f1": 0.8517006802721088,
3007
  "eval_overall_precision": 0.8151041666666666,
3008
  "eval_overall_recall": 0.8917378917378918,
3009
+ "eval_runtime": 0.385,
3010
+ "eval_samples_per_second": 485.697,
3011
+ "eval_steps_per_second": 7.792,
3012
  "step": 8162
3013
  },
3014
  {
 
3045
  "eval_overall_f1": 0.854368932038835,
3046
  "eval_overall_precision": 0.8324324324324325,
3047
  "eval_overall_recall": 0.8774928774928775,
3048
+ "eval_runtime": 0.3856,
3049
+ "eval_samples_per_second": 484.945,
3050
+ "eval_steps_per_second": 7.78,
3051
  "step": 8268
3052
  },
3053
  {
 
3084
  "eval_overall_f1": 0.8401084010840107,
3085
  "eval_overall_precision": 0.8010335917312662,
3086
  "eval_overall_recall": 0.8831908831908832,
3087
+ "eval_runtime": 0.3861,
3088
+ "eval_samples_per_second": 484.292,
3089
+ "eval_steps_per_second": 7.769,
3090
  "step": 8374
3091
  },
3092
  {
 
3123
  "eval_overall_f1": 0.854794520547945,
3124
  "eval_overall_precision": 0.8232189973614775,
3125
  "eval_overall_recall": 0.8888888888888888,
3126
+ "eval_runtime": 0.3848,
3127
+ "eval_samples_per_second": 485.904,
3128
+ "eval_steps_per_second": 7.795,
3129
  "step": 8480
3130
  },
3131
  {
 
3162
  "eval_overall_f1": 0.8451086956521738,
3163
  "eval_overall_precision": 0.8077922077922078,
3164
  "eval_overall_recall": 0.886039886039886,
3165
+ "eval_runtime": 0.3852,
3166
+ "eval_samples_per_second": 485.468,
3167
+ "eval_steps_per_second": 7.788,
3168
  "step": 8586
3169
  },
3170
  {
 
3201
  "eval_overall_f1": 0.8485675306957708,
3202
  "eval_overall_precision": 0.8141361256544503,
3203
  "eval_overall_recall": 0.886039886039886,
3204
+ "eval_runtime": 0.3868,
3205
+ "eval_samples_per_second": 483.477,
3206
+ "eval_steps_per_second": 7.756,
3207
  "step": 8692
3208
  },
3209
  {
 
3240
  "eval_overall_f1": 0.8373983739837397,
3241
  "eval_overall_precision": 0.7984496124031008,
3242
  "eval_overall_recall": 0.8803418803418803,
3243
+ "eval_runtime": 0.384,
3244
+ "eval_samples_per_second": 487.005,
3245
+ "eval_steps_per_second": 7.813,
3246
  "step": 8798
3247
  },
3248
  {
 
3279
  "eval_overall_f1": 0.8398384925975775,
3280
  "eval_overall_precision": 0.7959183673469388,
3281
  "eval_overall_recall": 0.8888888888888888,
3282
+ "eval_runtime": 0.3862,
3283
+ "eval_samples_per_second": 484.175,
3284
+ "eval_steps_per_second": 7.768,
3285
  "step": 8904
3286
  },
3287
  {
 
3318
  "eval_overall_f1": 0.8412483039348712,
3319
  "eval_overall_precision": 0.8031088082901554,
3320
  "eval_overall_recall": 0.8831908831908832,
3321
+ "eval_runtime": 0.3835,
3322
+ "eval_samples_per_second": 487.614,
3323
+ "eval_steps_per_second": 7.823,
3324
  "step": 9010
3325
  },
3326
  {
 
3357
  "eval_overall_f1": 0.8493150684931507,
3358
  "eval_overall_precision": 0.8179419525065963,
3359
  "eval_overall_recall": 0.8831908831908832,
3360
+ "eval_runtime": 0.3896,
3361
+ "eval_samples_per_second": 479.954,
3362
+ "eval_steps_per_second": 7.7,
3363
  "step": 9116
3364
  },
3365
  {
 
3396
  "eval_overall_f1": 0.844804318488529,
3397
  "eval_overall_precision": 0.8025641025641026,
3398
  "eval_overall_recall": 0.8917378917378918,
3399
+ "eval_runtime": 0.3857,
3400
+ "eval_samples_per_second": 484.808,
3401
+ "eval_steps_per_second": 7.778,
3402
  "step": 9222
3403
  },
3404
  {
 
3435
  "eval_overall_f1": 0.8443843031123139,
3436
  "eval_overall_precision": 0.8041237113402062,
3437
  "eval_overall_recall": 0.8888888888888888,
3438
+ "eval_runtime": 0.3854,
3439
+ "eval_samples_per_second": 485.254,
3440
+ "eval_steps_per_second": 7.785,
3441
  "step": 9328
3442
  },
3443
  {
 
3474
  "eval_overall_f1": 0.8394062078272606,
3475
  "eval_overall_precision": 0.7974358974358975,
3476
  "eval_overall_recall": 0.886039886039886,
3477
+ "eval_runtime": 0.3838,
3478
+ "eval_samples_per_second": 487.27,
3479
+ "eval_steps_per_second": 7.817,
3480
  "step": 9434
3481
  },
3482
  {
 
3513
  "eval_overall_f1": 0.8478260869565218,
3514
  "eval_overall_precision": 0.8103896103896104,
3515
  "eval_overall_recall": 0.8888888888888888,
3516
+ "eval_runtime": 0.3861,
3517
+ "eval_samples_per_second": 484.354,
3518
+ "eval_steps_per_second": 7.77,
3519
  "step": 9540
3520
  },
3521
  {
 
3552
  "eval_overall_f1": 0.8466757123473541,
3553
  "eval_overall_precision": 0.8082901554404145,
3554
  "eval_overall_recall": 0.8888888888888888,
3555
+ "eval_runtime": 0.3855,
3556
+ "eval_samples_per_second": 485.096,
3557
+ "eval_steps_per_second": 7.782,
3558
  "step": 9646
3559
  },
3560
  {
 
3591
  "eval_overall_f1": 0.8505434782608695,
3592
  "eval_overall_precision": 0.812987012987013,
3593
  "eval_overall_recall": 0.8917378917378918,
3594
+ "eval_runtime": 0.3848,
3595
+ "eval_samples_per_second": 485.911,
3596
+ "eval_steps_per_second": 7.795,
3597
  "step": 9752
3598
  },
3599
  {
 
3630
  "eval_overall_f1": 0.8497970230040596,
3631
  "eval_overall_precision": 0.8092783505154639,
3632
  "eval_overall_recall": 0.8945868945868946,
3633
+ "eval_runtime": 0.3855,
3634
+ "eval_samples_per_second": 485.12,
3635
+ "eval_steps_per_second": 7.783,
3636
  "step": 9858
3637
  },
3638
  {
 
3669
  "eval_overall_f1": 0.8470906630581868,
3670
  "eval_overall_precision": 0.8067010309278351,
3671
  "eval_overall_recall": 0.8917378917378918,
3672
+ "eval_runtime": 0.3874,
3673
+ "eval_samples_per_second": 482.705,
3674
+ "eval_steps_per_second": 7.744,
3675
  "step": 9964
3676
  },
3677
  {
 
3708
  "eval_overall_f1": 0.8493894165535957,
3709
  "eval_overall_precision": 0.810880829015544,
3710
  "eval_overall_recall": 0.8917378917378918,
3711
+ "eval_runtime": 0.3942,
3712
+ "eval_samples_per_second": 474.406,
3713
+ "eval_steps_per_second": 7.611,
3714
  "step": 10070
3715
  },
3716
  {
 
3747
  "eval_overall_f1": 0.8416779431664412,
3748
  "eval_overall_precision": 0.8015463917525774,
3749
  "eval_overall_recall": 0.886039886039886,
3750
+ "eval_runtime": 0.3909,
3751
+ "eval_samples_per_second": 478.441,
3752
+ "eval_steps_per_second": 7.676,
3753
  "step": 10176
3754
  },
3755
  {
 
3786
  "eval_overall_f1": 0.8466757123473541,
3787
  "eval_overall_precision": 0.8082901554404145,
3788
  "eval_overall_recall": 0.8888888888888888,
3789
+ "eval_runtime": 0.3914,
3790
+ "eval_samples_per_second": 477.725,
3791
+ "eval_steps_per_second": 7.664,
3792
  "step": 10282
3793
  },
3794
  {
 
3825
  "eval_overall_f1": 0.8443843031123139,
3826
  "eval_overall_precision": 0.8041237113402062,
3827
  "eval_overall_recall": 0.8888888888888888,
3828
+ "eval_runtime": 0.385,
3829
+ "eval_samples_per_second": 485.655,
3830
+ "eval_steps_per_second": 7.791,
3831
  "step": 10388
3832
  },
3833
  {
 
3864
  "eval_overall_f1": 0.8443843031123139,
3865
  "eval_overall_precision": 0.8041237113402062,
3866
  "eval_overall_recall": 0.8888888888888888,
3867
+ "eval_runtime": 0.3874,
3868
+ "eval_samples_per_second": 482.766,
3869
+ "eval_steps_per_second": 7.745,
3870
  "step": 10494
3871
  },
3872
  {
 
3903
  "eval_overall_f1": 0.8432432432432433,
3904
  "eval_overall_precision": 0.8020565552699229,
3905
  "eval_overall_recall": 0.8888888888888888,
3906
+ "eval_runtime": 0.3863,
3907
+ "eval_samples_per_second": 484.103,
3908
+ "eval_steps_per_second": 7.766,
3909
  "step": 10600
3910
  },
3911
  {
 
3913
  "step": 10600,
3914
  "total_flos": 5043631411410816.0,
3915
  "train_loss": 0.07131878634668747,
3916
+ "train_runtime": 621.5745,
3917
+ "train_samples_per_second": 271.568,
3918
+ "train_steps_per_second": 17.053
3919
  }
3920
  ],
3921
  "logging_steps": 500,