apwic commited on
Commit
b6eaa22
1 Parent(s): 4a0a3f2

End of training

Browse files
README.md CHANGED
@@ -1,4 +1,6 @@
1
  ---
 
 
2
  license: mit
3
  base_model: indolem/indobert-base-uncased
4
  tags:
 
1
  ---
2
+ language:
3
+ - id
4
  license: mit
5
  base_model: indolem/indobert-base-uncased
6
  tags:
all_results.json CHANGED
@@ -17,10 +17,10 @@
17
  "eval_overall_f1": 0.9419035846724352,
18
  "eval_overall_precision": 0.9338235294117647,
19
  "eval_overall_recall": 0.9501246882793017,
20
- "eval_runtime": 0.3063,
21
  "eval_samples": 170,
22
- "eval_samples_per_second": 555.028,
23
- "eval_steps_per_second": 9.795,
24
  "predict_LOCATION_f1": 0.9938650306748468,
25
  "predict_LOCATION_number": 245,
26
  "predict_LOCATION_precision": 0.9959016393442623,
@@ -38,12 +38,12 @@
38
  "predict_overall_f1": 0.9942418426103646,
39
  "predict_overall_precision": 0.9942418426103646,
40
  "predict_overall_recall": 0.9942418426103646,
41
- "predict_runtime": 0.7773,
42
- "predict_samples_per_second": 546.752,
43
- "predict_steps_per_second": 9.005,
44
  "train_loss": 0.03501902000978589,
45
- "train_runtime": 552.429,
46
  "train_samples": 1531,
47
- "train_samples_per_second": 277.14,
48
- "train_steps_per_second": 17.378
49
  }
 
17
  "eval_overall_f1": 0.9419035846724352,
18
  "eval_overall_precision": 0.9338235294117647,
19
  "eval_overall_recall": 0.9501246882793017,
20
+ "eval_runtime": 0.3141,
21
  "eval_samples": 170,
22
+ "eval_samples_per_second": 541.173,
23
+ "eval_steps_per_second": 9.55,
24
  "predict_LOCATION_f1": 0.9938650306748468,
25
  "predict_LOCATION_number": 245,
26
  "predict_LOCATION_precision": 0.9959016393442623,
 
38
  "predict_overall_f1": 0.9942418426103646,
39
  "predict_overall_precision": 0.9942418426103646,
40
  "predict_overall_recall": 0.9942418426103646,
41
+ "predict_runtime": 0.7649,
42
+ "predict_samples_per_second": 555.611,
43
+ "predict_steps_per_second": 9.151,
44
  "train_loss": 0.03501902000978589,
45
+ "train_runtime": 539.9434,
46
  "train_samples": 1531,
47
+ "train_samples_per_second": 283.548,
48
+ "train_steps_per_second": 17.78
49
  }
eval_results.json CHANGED
@@ -17,8 +17,8 @@
17
  "eval_overall_f1": 0.9419035846724352,
18
  "eval_overall_precision": 0.9338235294117647,
19
  "eval_overall_recall": 0.9501246882793017,
20
- "eval_runtime": 0.3063,
21
  "eval_samples": 170,
22
- "eval_samples_per_second": 555.028,
23
- "eval_steps_per_second": 9.795
24
  }
 
17
  "eval_overall_f1": 0.9419035846724352,
18
  "eval_overall_precision": 0.9338235294117647,
19
  "eval_overall_recall": 0.9501246882793017,
20
+ "eval_runtime": 0.3141,
21
  "eval_samples": 170,
22
+ "eval_samples_per_second": 541.173,
23
+ "eval_steps_per_second": 9.55
24
  }
predict_results.json CHANGED
@@ -16,7 +16,7 @@
16
  "predict_overall_f1": 0.9942418426103646,
17
  "predict_overall_precision": 0.9942418426103646,
18
  "predict_overall_recall": 0.9942418426103646,
19
- "predict_runtime": 0.7773,
20
- "predict_samples_per_second": 546.752,
21
- "predict_steps_per_second": 9.005
22
  }
 
16
  "predict_overall_f1": 0.9942418426103646,
17
  "predict_overall_precision": 0.9942418426103646,
18
  "predict_overall_recall": 0.9942418426103646,
19
+ "predict_runtime": 0.7649,
20
+ "predict_samples_per_second": 555.611,
21
+ "predict_steps_per_second": 9.151
22
  }
runs/Jun04_10-41-39_a358b85c7679/events.out.tfevents.1717498253.a358b85c7679.630167.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2e7197ec35991bcab617da31f7749e75a8d8952f70f515655d84035012f16b8
3
+ size 1305
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 100.0,
3
  "train_loss": 0.03501902000978589,
4
- "train_runtime": 552.429,
5
  "train_samples": 1531,
6
- "train_samples_per_second": 277.14,
7
- "train_steps_per_second": 17.378
8
  }
 
1
  {
2
  "epoch": 100.0,
3
  "train_loss": 0.03501902000978589,
4
+ "train_runtime": 539.9434,
5
  "train_samples": 1531,
6
+ "train_samples_per_second": 283.548,
7
+ "train_steps_per_second": 17.78
8
  }
trainer_state.json CHANGED
@@ -34,9 +34,9 @@
34
  "eval_overall_f1": 0.2203626220362622,
35
  "eval_overall_precision": 0.25,
36
  "eval_overall_recall": 0.1970074812967581,
37
- "eval_runtime": 0.2972,
38
- "eval_samples_per_second": 572.026,
39
- "eval_steps_per_second": 10.095,
40
  "step": 96
41
  },
42
  {
@@ -65,9 +65,9 @@
65
  "eval_overall_f1": 0.5780219780219781,
66
  "eval_overall_precision": 0.5166994106090373,
67
  "eval_overall_recall": 0.655860349127182,
68
- "eval_runtime": 0.298,
69
- "eval_samples_per_second": 570.459,
70
- "eval_steps_per_second": 10.067,
71
  "step": 192
72
  },
73
  {
@@ -96,9 +96,9 @@
96
  "eval_overall_f1": 0.803357314148681,
97
  "eval_overall_precision": 0.7736720554272517,
98
  "eval_overall_recall": 0.8354114713216958,
99
- "eval_runtime": 0.2957,
100
- "eval_samples_per_second": 574.874,
101
- "eval_steps_per_second": 10.145,
102
  "step": 288
103
  },
104
  {
@@ -127,9 +127,9 @@
127
  "eval_overall_f1": 0.857482185273159,
128
  "eval_overall_precision": 0.81859410430839,
129
  "eval_overall_recall": 0.9002493765586035,
130
- "eval_runtime": 0.3005,
131
- "eval_samples_per_second": 565.653,
132
- "eval_steps_per_second": 9.982,
133
  "step": 384
134
  },
135
  {
@@ -158,9 +158,9 @@
158
  "eval_overall_f1": 0.9093167701863354,
159
  "eval_overall_precision": 0.905940594059406,
160
  "eval_overall_recall": 0.912718204488778,
161
- "eval_runtime": 0.2992,
162
- "eval_samples_per_second": 568.271,
163
- "eval_steps_per_second": 10.028,
164
  "step": 480
165
  },
166
  {
@@ -189,9 +189,9 @@
189
  "eval_overall_f1": 0.8940886699507389,
190
  "eval_overall_precision": 0.8832116788321168,
191
  "eval_overall_recall": 0.9052369077306733,
192
- "eval_runtime": 0.3015,
193
- "eval_samples_per_second": 563.882,
194
- "eval_steps_per_second": 9.951,
195
  "step": 576
196
  },
197
  {
@@ -220,9 +220,9 @@
220
  "eval_overall_f1": 0.9200968523002423,
221
  "eval_overall_precision": 0.8941176470588236,
222
  "eval_overall_recall": 0.9476309226932669,
223
- "eval_runtime": 0.3005,
224
- "eval_samples_per_second": 565.809,
225
- "eval_steps_per_second": 9.985,
226
  "step": 672
227
  },
228
  {
@@ -251,9 +251,9 @@
251
  "eval_overall_f1": 0.9238329238329237,
252
  "eval_overall_precision": 0.910411622276029,
253
  "eval_overall_recall": 0.9376558603491272,
254
- "eval_runtime": 0.3038,
255
- "eval_samples_per_second": 559.65,
256
- "eval_steps_per_second": 9.876,
257
  "step": 768
258
  },
259
  {
@@ -282,9 +282,9 @@
282
  "eval_overall_f1": 0.9262899262899262,
283
  "eval_overall_precision": 0.9128329297820823,
284
  "eval_overall_recall": 0.940149625935162,
285
- "eval_runtime": 0.2976,
286
- "eval_samples_per_second": 571.181,
287
- "eval_steps_per_second": 10.08,
288
  "step": 864
289
  },
290
  {
@@ -313,9 +313,9 @@
313
  "eval_overall_f1": 0.9153374233128836,
314
  "eval_overall_precision": 0.9009661835748792,
315
  "eval_overall_recall": 0.9301745635910225,
316
- "eval_runtime": 0.2975,
317
- "eval_samples_per_second": 571.464,
318
- "eval_steps_per_second": 10.085,
319
  "step": 960
320
  },
321
  {
@@ -344,9 +344,9 @@
344
  "eval_overall_f1": 0.9253365973072215,
345
  "eval_overall_precision": 0.9086538461538461,
346
  "eval_overall_recall": 0.942643391521197,
347
- "eval_runtime": 0.2984,
348
- "eval_samples_per_second": 569.7,
349
- "eval_steps_per_second": 10.054,
350
  "step": 1056
351
  },
352
  {
@@ -375,9 +375,9 @@
375
  "eval_overall_f1": 0.932349323493235,
376
  "eval_overall_precision": 0.9199029126213593,
377
  "eval_overall_recall": 0.9451371571072319,
378
- "eval_runtime": 0.2985,
379
- "eval_samples_per_second": 569.59,
380
- "eval_steps_per_second": 10.052,
381
  "step": 1152
382
  },
383
  {
@@ -406,9 +406,9 @@
406
  "eval_overall_f1": 0.9282178217821783,
407
  "eval_overall_precision": 0.9213759213759214,
408
  "eval_overall_recall": 0.9351620947630923,
409
- "eval_runtime": 0.2942,
410
- "eval_samples_per_second": 577.91,
411
- "eval_steps_per_second": 10.198,
412
  "step": 1248
413
  },
414
  {
@@ -437,9 +437,9 @@
437
  "eval_overall_f1": 0.9369592088998765,
438
  "eval_overall_precision": 0.928921568627451,
439
  "eval_overall_recall": 0.9451371571072319,
440
- "eval_runtime": 0.2973,
441
- "eval_samples_per_second": 571.9,
442
- "eval_steps_per_second": 10.092,
443
  "step": 1344
444
  },
445
  {
@@ -468,9 +468,9 @@
468
  "eval_overall_f1": 0.9270704573547589,
469
  "eval_overall_precision": 0.9191176470588235,
470
  "eval_overall_recall": 0.9351620947630923,
471
- "eval_runtime": 0.3028,
472
- "eval_samples_per_second": 561.411,
473
- "eval_steps_per_second": 9.907,
474
  "step": 1440
475
  },
476
  {
@@ -499,9 +499,9 @@
499
  "eval_overall_f1": 0.9318463444857497,
500
  "eval_overall_precision": 0.9261083743842364,
501
  "eval_overall_recall": 0.9376558603491272,
502
- "eval_runtime": 0.2965,
503
- "eval_samples_per_second": 573.339,
504
- "eval_steps_per_second": 10.118,
505
  "step": 1536
506
  },
507
  {
@@ -530,9 +530,9 @@
530
  "eval_overall_f1": 0.9346485819975339,
531
  "eval_overall_precision": 0.9243902439024391,
532
  "eval_overall_recall": 0.9451371571072319,
533
- "eval_runtime": 0.2989,
534
- "eval_samples_per_second": 568.742,
535
- "eval_steps_per_second": 10.037,
536
  "step": 1632
537
  },
538
  {
@@ -561,9 +561,9 @@
561
  "eval_overall_f1": 0.9376558603491272,
562
  "eval_overall_precision": 0.9376558603491272,
563
  "eval_overall_recall": 0.9376558603491272,
564
- "eval_runtime": 0.2982,
565
- "eval_samples_per_second": 570.158,
566
- "eval_steps_per_second": 10.062,
567
  "step": 1728
568
  },
569
  {
@@ -592,9 +592,9 @@
592
  "eval_overall_f1": 0.9524999999999999,
593
  "eval_overall_precision": 0.9548872180451128,
594
  "eval_overall_recall": 0.9501246882793017,
595
- "eval_runtime": 0.2955,
596
- "eval_samples_per_second": 575.369,
597
- "eval_steps_per_second": 10.154,
598
  "step": 1824
599
  },
600
  {
@@ -623,9 +623,9 @@
623
  "eval_overall_f1": 0.9407407407407408,
624
  "eval_overall_precision": 0.9315403422982885,
625
  "eval_overall_recall": 0.9501246882793017,
626
- "eval_runtime": 0.2985,
627
- "eval_samples_per_second": 569.44,
628
- "eval_steps_per_second": 10.049,
629
  "step": 1920
630
  },
631
  {
@@ -654,9 +654,9 @@
654
  "eval_overall_f1": 0.9394313967861558,
655
  "eval_overall_precision": 0.9313725490196079,
656
  "eval_overall_recall": 0.9476309226932669,
657
- "eval_runtime": 0.2988,
658
- "eval_samples_per_second": 568.942,
659
- "eval_steps_per_second": 10.04,
660
  "step": 2016
661
  },
662
  {
@@ -685,9 +685,9 @@
685
  "eval_overall_f1": 0.9395807644882862,
686
  "eval_overall_precision": 0.9292682926829269,
687
  "eval_overall_recall": 0.9501246882793017,
688
- "eval_runtime": 0.2981,
689
- "eval_samples_per_second": 570.213,
690
- "eval_steps_per_second": 10.063,
691
  "step": 2112
692
  },
693
  {
@@ -716,9 +716,9 @@
716
  "eval_overall_f1": 0.949569495694957,
717
  "eval_overall_precision": 0.9368932038834952,
718
  "eval_overall_recall": 0.9625935162094763,
719
- "eval_runtime": 0.3003,
720
- "eval_samples_per_second": 566.144,
721
- "eval_steps_per_second": 9.991,
722
  "step": 2208
723
  },
724
  {
@@ -747,9 +747,9 @@
747
  "eval_overall_f1": 0.9478908188585606,
748
  "eval_overall_precision": 0.9432098765432099,
749
  "eval_overall_recall": 0.9526184538653366,
750
- "eval_runtime": 0.2967,
751
- "eval_samples_per_second": 572.889,
752
- "eval_steps_per_second": 10.11,
753
  "step": 2304
754
  },
755
  {
@@ -778,9 +778,9 @@
778
  "eval_overall_f1": 0.9515527950310558,
779
  "eval_overall_precision": 0.948019801980198,
780
  "eval_overall_recall": 0.9551122194513716,
781
- "eval_runtime": 0.2992,
782
- "eval_samples_per_second": 568.163,
783
- "eval_steps_per_second": 10.026,
784
  "step": 2400
785
  },
786
  {
@@ -809,9 +809,9 @@
809
  "eval_overall_f1": 0.9477611940298507,
810
  "eval_overall_precision": 0.9454094292803971,
811
  "eval_overall_recall": 0.9501246882793017,
812
- "eval_runtime": 0.2971,
813
- "eval_samples_per_second": 572.207,
814
- "eval_steps_per_second": 10.098,
815
  "step": 2496
816
  },
817
  {
@@ -840,9 +840,9 @@
840
  "eval_overall_f1": 0.9478908188585606,
841
  "eval_overall_precision": 0.9432098765432099,
842
  "eval_overall_recall": 0.9526184538653366,
843
- "eval_runtime": 0.2979,
844
- "eval_samples_per_second": 570.584,
845
- "eval_steps_per_second": 10.069,
846
  "step": 2592
847
  },
848
  {
@@ -871,9 +871,9 @@
871
  "eval_overall_f1": 0.9408866995073891,
872
  "eval_overall_precision": 0.9294403892944039,
873
  "eval_overall_recall": 0.9526184538653366,
874
- "eval_runtime": 0.2973,
875
- "eval_samples_per_second": 571.866,
876
- "eval_steps_per_second": 10.092,
877
  "step": 2688
878
  },
879
  {
@@ -902,9 +902,9 @@
902
  "eval_overall_f1": 0.9392812887236679,
903
  "eval_overall_precision": 0.9334975369458128,
904
  "eval_overall_recall": 0.9451371571072319,
905
- "eval_runtime": 0.2972,
906
- "eval_samples_per_second": 571.984,
907
- "eval_steps_per_second": 10.094,
908
  "step": 2784
909
  },
910
  {
@@ -933,9 +933,9 @@
933
  "eval_overall_f1": 0.942189421894219,
934
  "eval_overall_precision": 0.9296116504854369,
935
  "eval_overall_recall": 0.9551122194513716,
936
- "eval_runtime": 0.2984,
937
- "eval_samples_per_second": 569.653,
938
- "eval_steps_per_second": 10.053,
939
  "step": 2880
940
  },
941
  {
@@ -964,9 +964,9 @@
964
  "eval_overall_f1": 0.9443757725587144,
965
  "eval_overall_precision": 0.9362745098039216,
966
  "eval_overall_recall": 0.9526184538653366,
967
- "eval_runtime": 0.2983,
968
- "eval_samples_per_second": 569.81,
969
- "eval_steps_per_second": 10.055,
970
  "step": 2976
971
  },
972
  {
@@ -995,9 +995,9 @@
995
  "eval_overall_f1": 0.9442379182156134,
996
  "eval_overall_precision": 0.9384236453201971,
997
  "eval_overall_recall": 0.9501246882793017,
998
- "eval_runtime": 0.2982,
999
- "eval_samples_per_second": 570.182,
1000
- "eval_steps_per_second": 10.062,
1001
  "step": 3072
1002
  },
1003
  {
@@ -1026,9 +1026,9 @@
1026
  "eval_overall_f1": 0.949194547707559,
1027
  "eval_overall_precision": 0.9433497536945813,
1028
  "eval_overall_recall": 0.9551122194513716,
1029
- "eval_runtime": 0.2967,
1030
- "eval_samples_per_second": 573.022,
1031
- "eval_steps_per_second": 10.112,
1032
  "step": 3168
1033
  },
1034
  {
@@ -1057,9 +1057,9 @@
1057
  "eval_overall_f1": 0.9514321295143213,
1058
  "eval_overall_precision": 0.9502487562189055,
1059
  "eval_overall_recall": 0.9526184538653366,
1060
- "eval_runtime": 0.2949,
1061
- "eval_samples_per_second": 576.383,
1062
- "eval_steps_per_second": 10.171,
1063
  "step": 3264
1064
  },
1065
  {
@@ -1088,9 +1088,9 @@
1088
  "eval_overall_f1": 0.9432098765432098,
1089
  "eval_overall_precision": 0.9339853300733496,
1090
  "eval_overall_recall": 0.9526184538653366,
1091
- "eval_runtime": 0.293,
1092
- "eval_samples_per_second": 580.289,
1093
- "eval_steps_per_second": 10.24,
1094
  "step": 3360
1095
  },
1096
  {
@@ -1119,9 +1119,9 @@
1119
  "eval_overall_f1": 0.9417596034696407,
1120
  "eval_overall_precision": 0.9359605911330049,
1121
  "eval_overall_recall": 0.9476309226932669,
1122
- "eval_runtime": 0.2955,
1123
- "eval_samples_per_second": 575.264,
1124
- "eval_steps_per_second": 10.152,
1125
  "step": 3456
1126
  },
1127
  {
@@ -1150,9 +1150,9 @@
1150
  "eval_overall_f1": 0.9527363184079602,
1151
  "eval_overall_precision": 0.9503722084367245,
1152
  "eval_overall_recall": 0.9551122194513716,
1153
- "eval_runtime": 0.2938,
1154
- "eval_samples_per_second": 578.651,
1155
- "eval_steps_per_second": 10.211,
1156
  "step": 3552
1157
  },
1158
  {
@@ -1181,9 +1181,9 @@
1181
  "eval_overall_f1": 0.9359605911330049,
1182
  "eval_overall_precision": 0.9245742092457421,
1183
  "eval_overall_recall": 0.9476309226932669,
1184
- "eval_runtime": 0.297,
1185
- "eval_samples_per_second": 572.456,
1186
- "eval_steps_per_second": 10.102,
1187
  "step": 3648
1188
  },
1189
  {
@@ -1212,9 +1212,9 @@
1212
  "eval_overall_f1": 0.9369592088998765,
1213
  "eval_overall_precision": 0.928921568627451,
1214
  "eval_overall_recall": 0.9451371571072319,
1215
- "eval_runtime": 0.2934,
1216
- "eval_samples_per_second": 579.501,
1217
- "eval_steps_per_second": 10.226,
1218
  "step": 3744
1219
  },
1220
  {
@@ -1243,9 +1243,9 @@
1243
  "eval_overall_f1": 0.949194547707559,
1244
  "eval_overall_precision": 0.9433497536945813,
1245
  "eval_overall_recall": 0.9551122194513716,
1246
- "eval_runtime": 0.2939,
1247
- "eval_samples_per_second": 578.335,
1248
- "eval_steps_per_second": 10.206,
1249
  "step": 3840
1250
  },
1251
  {
@@ -1274,9 +1274,9 @@
1274
  "eval_overall_f1": 0.946716232961586,
1275
  "eval_overall_precision": 0.9408866995073891,
1276
  "eval_overall_recall": 0.9526184538653366,
1277
- "eval_runtime": 0.2955,
1278
- "eval_samples_per_second": 575.283,
1279
- "eval_steps_per_second": 10.152,
1280
  "step": 3936
1281
  },
1282
  {
@@ -1305,9 +1305,9 @@
1305
  "eval_overall_f1": 0.9516728624535316,
1306
  "eval_overall_precision": 0.9458128078817734,
1307
  "eval_overall_recall": 0.9576059850374065,
1308
- "eval_runtime": 0.302,
1309
- "eval_samples_per_second": 562.939,
1310
- "eval_steps_per_second": 9.934,
1311
  "step": 4032
1312
  },
1313
  {
@@ -1336,9 +1336,9 @@
1336
  "eval_overall_f1": 0.9516728624535316,
1337
  "eval_overall_precision": 0.9458128078817734,
1338
  "eval_overall_recall": 0.9576059850374065,
1339
- "eval_runtime": 0.2968,
1340
- "eval_samples_per_second": 572.827,
1341
- "eval_steps_per_second": 10.109,
1342
  "step": 4128
1343
  },
1344
  {
@@ -1367,9 +1367,9 @@
1367
  "eval_overall_f1": 0.9443757725587144,
1368
  "eval_overall_precision": 0.9362745098039216,
1369
  "eval_overall_recall": 0.9526184538653366,
1370
- "eval_runtime": 0.2969,
1371
- "eval_samples_per_second": 572.626,
1372
- "eval_steps_per_second": 10.105,
1373
  "step": 4224
1374
  },
1375
  {
@@ -1398,9 +1398,9 @@
1398
  "eval_overall_f1": 0.9416149068322982,
1399
  "eval_overall_precision": 0.9381188118811881,
1400
  "eval_overall_recall": 0.9451371571072319,
1401
- "eval_runtime": 0.2933,
1402
- "eval_samples_per_second": 579.583,
1403
- "eval_steps_per_second": 10.228,
1404
  "step": 4320
1405
  },
1406
  {
@@ -1429,9 +1429,9 @@
1429
  "eval_overall_f1": 0.949194547707559,
1430
  "eval_overall_precision": 0.9433497536945813,
1431
  "eval_overall_recall": 0.9551122194513716,
1432
- "eval_runtime": 0.2978,
1433
- "eval_samples_per_second": 570.926,
1434
- "eval_steps_per_second": 10.075,
1435
  "step": 4416
1436
  },
1437
  {
@@ -1460,9 +1460,9 @@
1460
  "eval_overall_f1": 0.9430693069306931,
1461
  "eval_overall_precision": 0.9361179361179361,
1462
  "eval_overall_recall": 0.9501246882793017,
1463
- "eval_runtime": 0.2957,
1464
- "eval_samples_per_second": 574.873,
1465
- "eval_steps_per_second": 10.145,
1466
  "step": 4512
1467
  },
1468
  {
@@ -1491,9 +1491,9 @@
1491
  "eval_overall_f1": 0.9376558603491272,
1492
  "eval_overall_precision": 0.9376558603491272,
1493
  "eval_overall_recall": 0.9376558603491272,
1494
- "eval_runtime": 0.2944,
1495
- "eval_samples_per_second": 577.482,
1496
- "eval_steps_per_second": 10.191,
1497
  "step": 4608
1498
  },
1499
  {
@@ -1522,9 +1522,9 @@
1522
  "eval_overall_f1": 0.9318463444857497,
1523
  "eval_overall_precision": 0.9261083743842364,
1524
  "eval_overall_recall": 0.9376558603491272,
1525
- "eval_runtime": 0.2935,
1526
- "eval_samples_per_second": 579.234,
1527
- "eval_steps_per_second": 10.222,
1528
  "step": 4704
1529
  },
1530
  {
@@ -1553,9 +1553,9 @@
1553
  "eval_overall_f1": 0.9455445544554455,
1554
  "eval_overall_precision": 0.9385749385749386,
1555
  "eval_overall_recall": 0.9526184538653366,
1556
- "eval_runtime": 0.2977,
1557
- "eval_samples_per_second": 571.045,
1558
- "eval_steps_per_second": 10.077,
1559
  "step": 4800
1560
  },
1561
  {
@@ -1584,9 +1584,9 @@
1584
  "eval_overall_f1": 0.9381188118811881,
1585
  "eval_overall_precision": 0.9312039312039312,
1586
  "eval_overall_recall": 0.9451371571072319,
1587
- "eval_runtime": 0.2926,
1588
- "eval_samples_per_second": 581.069,
1589
- "eval_steps_per_second": 10.254,
1590
  "step": 4896
1591
  },
1592
  {
@@ -1615,9 +1615,9 @@
1615
  "eval_overall_f1": 0.9416149068322982,
1616
  "eval_overall_precision": 0.9381188118811881,
1617
  "eval_overall_recall": 0.9451371571072319,
1618
- "eval_runtime": 0.2946,
1619
- "eval_samples_per_second": 577.069,
1620
- "eval_steps_per_second": 10.184,
1621
  "step": 4992
1622
  },
1623
  {
@@ -1646,9 +1646,9 @@
1646
  "eval_overall_f1": 0.9417596034696407,
1647
  "eval_overall_precision": 0.9359605911330049,
1648
  "eval_overall_recall": 0.9476309226932669,
1649
- "eval_runtime": 0.299,
1650
- "eval_samples_per_second": 568.493,
1651
- "eval_steps_per_second": 10.032,
1652
  "step": 5088
1653
  },
1654
  {
@@ -1677,9 +1677,9 @@
1677
  "eval_overall_f1": 0.946583850931677,
1678
  "eval_overall_precision": 0.943069306930693,
1679
  "eval_overall_recall": 0.9501246882793017,
1680
- "eval_runtime": 0.297,
1681
- "eval_samples_per_second": 572.336,
1682
- "eval_steps_per_second": 10.1,
1683
  "step": 5184
1684
  },
1685
  {
@@ -1708,9 +1708,9 @@
1708
  "eval_overall_f1": 0.9440993788819876,
1709
  "eval_overall_precision": 0.9405940594059405,
1710
  "eval_overall_recall": 0.9476309226932669,
1711
- "eval_runtime": 0.2956,
1712
- "eval_samples_per_second": 575.088,
1713
- "eval_steps_per_second": 10.149,
1714
  "step": 5280
1715
  },
1716
  {
@@ -1739,9 +1739,9 @@
1739
  "eval_overall_f1": 0.9432098765432098,
1740
  "eval_overall_precision": 0.9339853300733496,
1741
  "eval_overall_recall": 0.9526184538653366,
1742
- "eval_runtime": 0.2959,
1743
- "eval_samples_per_second": 574.433,
1744
- "eval_steps_per_second": 10.137,
1745
  "step": 5376
1746
  },
1747
  {
@@ -1770,9 +1770,9 @@
1770
  "eval_overall_f1": 0.9382716049382714,
1771
  "eval_overall_precision": 0.9290953545232273,
1772
  "eval_overall_recall": 0.9476309226932669,
1773
- "eval_runtime": 0.2961,
1774
- "eval_samples_per_second": 574.153,
1775
- "eval_steps_per_second": 10.132,
1776
  "step": 5472
1777
  },
1778
  {
@@ -1801,9 +1801,9 @@
1801
  "eval_overall_f1": 0.9455445544554455,
1802
  "eval_overall_precision": 0.9385749385749386,
1803
  "eval_overall_recall": 0.9526184538653366,
1804
- "eval_runtime": 0.2949,
1805
- "eval_samples_per_second": 576.43,
1806
- "eval_steps_per_second": 10.172,
1807
  "step": 5568
1808
  },
1809
  {
@@ -1832,9 +1832,9 @@
1832
  "eval_overall_f1": 0.9430693069306931,
1833
  "eval_overall_precision": 0.9361179361179361,
1834
  "eval_overall_recall": 0.9501246882793017,
1835
- "eval_runtime": 0.2955,
1836
- "eval_samples_per_second": 575.281,
1837
- "eval_steps_per_second": 10.152,
1838
  "step": 5664
1839
  },
1840
  {
@@ -1863,9 +1863,9 @@
1863
  "eval_overall_f1": 0.9456790123456791,
1864
  "eval_overall_precision": 0.9364303178484108,
1865
  "eval_overall_recall": 0.9551122194513716,
1866
- "eval_runtime": 0.2949,
1867
- "eval_samples_per_second": 576.544,
1868
- "eval_steps_per_second": 10.174,
1869
  "step": 5760
1870
  },
1871
  {
@@ -1894,9 +1894,9 @@
1894
  "eval_overall_f1": 0.9455445544554455,
1895
  "eval_overall_precision": 0.9385749385749386,
1896
  "eval_overall_recall": 0.9526184538653366,
1897
- "eval_runtime": 0.2951,
1898
- "eval_samples_per_second": 576.102,
1899
- "eval_steps_per_second": 10.167,
1900
  "step": 5856
1901
  },
1902
  {
@@ -1925,9 +1925,9 @@
1925
  "eval_overall_f1": 0.9354838709677419,
1926
  "eval_overall_precision": 0.9308641975308642,
1927
  "eval_overall_recall": 0.940149625935162,
1928
- "eval_runtime": 0.2946,
1929
- "eval_samples_per_second": 577.118,
1930
- "eval_steps_per_second": 10.184,
1931
  "step": 5952
1932
  },
1933
  {
@@ -1956,9 +1956,9 @@
1956
  "eval_overall_f1": 0.9456790123456791,
1957
  "eval_overall_precision": 0.9364303178484108,
1958
  "eval_overall_recall": 0.9551122194513716,
1959
- "eval_runtime": 0.2936,
1960
- "eval_samples_per_second": 579.022,
1961
- "eval_steps_per_second": 10.218,
1962
  "step": 6048
1963
  },
1964
  {
@@ -1987,9 +1987,9 @@
1987
  "eval_overall_f1": 0.9442379182156134,
1988
  "eval_overall_precision": 0.9384236453201971,
1989
  "eval_overall_recall": 0.9501246882793017,
1990
- "eval_runtime": 0.2944,
1991
- "eval_samples_per_second": 577.409,
1992
- "eval_steps_per_second": 10.19,
1993
  "step": 6144
1994
  },
1995
  {
@@ -2018,9 +2018,9 @@
2018
  "eval_overall_f1": 0.9321824907521579,
2019
  "eval_overall_precision": 0.9219512195121952,
2020
  "eval_overall_recall": 0.942643391521197,
2021
- "eval_runtime": 0.3051,
2022
- "eval_samples_per_second": 557.231,
2023
- "eval_steps_per_second": 9.833,
2024
  "step": 6240
2025
  },
2026
  {
@@ -2049,9 +2049,9 @@
2049
  "eval_overall_f1": 0.9382716049382714,
2050
  "eval_overall_precision": 0.9290953545232273,
2051
  "eval_overall_recall": 0.9476309226932669,
2052
- "eval_runtime": 0.2946,
2053
- "eval_samples_per_second": 577.143,
2054
- "eval_steps_per_second": 10.185,
2055
  "step": 6336
2056
  },
2057
  {
@@ -2080,9 +2080,9 @@
2080
  "eval_overall_f1": 0.9381188118811881,
2081
  "eval_overall_precision": 0.9312039312039312,
2082
  "eval_overall_recall": 0.9451371571072319,
2083
- "eval_runtime": 0.294,
2084
- "eval_samples_per_second": 578.275,
2085
- "eval_steps_per_second": 10.205,
2086
  "step": 6432
2087
  },
2088
  {
@@ -2111,9 +2111,9 @@
2111
  "eval_overall_f1": 0.9429280397022332,
2112
  "eval_overall_precision": 0.9382716049382716,
2113
  "eval_overall_recall": 0.9476309226932669,
2114
- "eval_runtime": 0.2938,
2115
- "eval_samples_per_second": 578.598,
2116
- "eval_steps_per_second": 10.211,
2117
  "step": 6528
2118
  },
2119
  {
@@ -2142,9 +2142,9 @@
2142
  "eval_overall_f1": 0.946583850931677,
2143
  "eval_overall_precision": 0.943069306930693,
2144
  "eval_overall_recall": 0.9501246882793017,
2145
- "eval_runtime": 0.2955,
2146
- "eval_samples_per_second": 575.299,
2147
- "eval_steps_per_second": 10.152,
2148
  "step": 6624
2149
  },
2150
  {
@@ -2173,9 +2173,9 @@
2173
  "eval_overall_f1": 0.9429280397022332,
2174
  "eval_overall_precision": 0.9382716049382716,
2175
  "eval_overall_recall": 0.9476309226932669,
2176
- "eval_runtime": 0.3,
2177
- "eval_samples_per_second": 566.609,
2178
- "eval_steps_per_second": 9.999,
2179
  "step": 6720
2180
  },
2181
  {
@@ -2204,9 +2204,9 @@
2204
  "eval_overall_f1": 0.9455445544554455,
2205
  "eval_overall_precision": 0.9385749385749386,
2206
  "eval_overall_recall": 0.9526184538653366,
2207
- "eval_runtime": 0.2936,
2208
- "eval_samples_per_second": 578.941,
2209
- "eval_steps_per_second": 10.217,
2210
  "step": 6816
2211
  },
2212
  {
@@ -2235,9 +2235,9 @@
2235
  "eval_overall_f1": 0.9419035846724352,
2236
  "eval_overall_precision": 0.9338235294117647,
2237
  "eval_overall_recall": 0.9501246882793017,
2238
- "eval_runtime": 0.296,
2239
- "eval_samples_per_second": 574.374,
2240
- "eval_steps_per_second": 10.136,
2241
  "step": 6912
2242
  },
2243
  {
@@ -2266,9 +2266,9 @@
2266
  "eval_overall_f1": 0.9417596034696407,
2267
  "eval_overall_precision": 0.9359605911330049,
2268
  "eval_overall_recall": 0.9476309226932669,
2269
- "eval_runtime": 0.294,
2270
- "eval_samples_per_second": 578.236,
2271
- "eval_steps_per_second": 10.204,
2272
  "step": 7008
2273
  },
2274
  {
@@ -2297,9 +2297,9 @@
2297
  "eval_overall_f1": 0.9392812887236679,
2298
  "eval_overall_precision": 0.9334975369458128,
2299
  "eval_overall_recall": 0.9451371571072319,
2300
- "eval_runtime": 0.2978,
2301
- "eval_samples_per_second": 570.877,
2302
- "eval_steps_per_second": 10.074,
2303
  "step": 7104
2304
  },
2305
  {
@@ -2328,9 +2328,9 @@
2328
  "eval_overall_f1": 0.9419035846724352,
2329
  "eval_overall_precision": 0.9338235294117647,
2330
  "eval_overall_recall": 0.9501246882793017,
2331
- "eval_runtime": 0.2924,
2332
- "eval_samples_per_second": 581.388,
2333
- "eval_steps_per_second": 10.26,
2334
  "step": 7200
2335
  },
2336
  {
@@ -2359,9 +2359,9 @@
2359
  "eval_overall_f1": 0.9490683229813663,
2360
  "eval_overall_precision": 0.9455445544554455,
2361
  "eval_overall_recall": 0.9526184538653366,
2362
- "eval_runtime": 0.2966,
2363
- "eval_samples_per_second": 573.117,
2364
- "eval_steps_per_second": 10.114,
2365
  "step": 7296
2366
  },
2367
  {
@@ -2390,9 +2390,9 @@
2390
  "eval_overall_f1": 0.9363295880149813,
2391
  "eval_overall_precision": 0.9375,
2392
  "eval_overall_recall": 0.9351620947630923,
2393
- "eval_runtime": 0.2971,
2394
- "eval_samples_per_second": 572.223,
2395
- "eval_steps_per_second": 10.098,
2396
  "step": 7392
2397
  },
2398
  {
@@ -2421,9 +2421,9 @@
2421
  "eval_overall_f1": 0.9540372670807453,
2422
  "eval_overall_precision": 0.9504950495049505,
2423
  "eval_overall_recall": 0.9576059850374065,
2424
- "eval_runtime": 0.2968,
2425
- "eval_samples_per_second": 572.842,
2426
- "eval_steps_per_second": 10.109,
2427
  "step": 7488
2428
  },
2429
  {
@@ -2452,9 +2452,9 @@
2452
  "eval_overall_f1": 0.9490683229813663,
2453
  "eval_overall_precision": 0.9455445544554455,
2454
  "eval_overall_recall": 0.9526184538653366,
2455
- "eval_runtime": 0.2949,
2456
- "eval_samples_per_second": 576.488,
2457
- "eval_steps_per_second": 10.173,
2458
  "step": 7584
2459
  },
2460
  {
@@ -2483,9 +2483,9 @@
2483
  "eval_overall_f1": 0.941469489414695,
2484
  "eval_overall_precision": 0.9402985074626866,
2485
  "eval_overall_recall": 0.942643391521197,
2486
- "eval_runtime": 0.2974,
2487
- "eval_samples_per_second": 571.576,
2488
- "eval_steps_per_second": 10.087,
2489
  "step": 7680
2490
  },
2491
  {
@@ -2514,9 +2514,9 @@
2514
  "eval_overall_f1": 0.9381188118811881,
2515
  "eval_overall_precision": 0.9312039312039312,
2516
  "eval_overall_recall": 0.9451371571072319,
2517
- "eval_runtime": 0.2958,
2518
- "eval_samples_per_second": 574.652,
2519
- "eval_steps_per_second": 10.141,
2520
  "step": 7776
2521
  },
2522
  {
@@ -2545,9 +2545,9 @@
2545
  "eval_overall_f1": 0.9429280397022332,
2546
  "eval_overall_precision": 0.9382716049382716,
2547
  "eval_overall_recall": 0.9476309226932669,
2548
- "eval_runtime": 0.3023,
2549
- "eval_samples_per_second": 562.37,
2550
- "eval_steps_per_second": 9.924,
2551
  "step": 7872
2552
  },
2553
  {
@@ -2576,9 +2576,9 @@
2576
  "eval_overall_f1": 0.9417596034696407,
2577
  "eval_overall_precision": 0.9359605911330049,
2578
  "eval_overall_recall": 0.9476309226932669,
2579
- "eval_runtime": 0.2949,
2580
- "eval_samples_per_second": 576.538,
2581
- "eval_steps_per_second": 10.174,
2582
  "step": 7968
2583
  },
2584
  {
@@ -2607,9 +2607,9 @@
2607
  "eval_overall_f1": 0.949194547707559,
2608
  "eval_overall_precision": 0.9433497536945813,
2609
  "eval_overall_recall": 0.9551122194513716,
2610
- "eval_runtime": 0.2951,
2611
- "eval_samples_per_second": 575.994,
2612
- "eval_steps_per_second": 10.165,
2613
  "step": 8064
2614
  },
2615
  {
@@ -2638,9 +2638,9 @@
2638
  "eval_overall_f1": 0.9468479604449938,
2639
  "eval_overall_precision": 0.9387254901960784,
2640
  "eval_overall_recall": 0.9551122194513716,
2641
- "eval_runtime": 0.2965,
2642
- "eval_samples_per_second": 573.314,
2643
- "eval_steps_per_second": 10.117,
2644
  "step": 8160
2645
  },
2646
  {
@@ -2669,9 +2669,9 @@
2669
  "eval_overall_f1": 0.9430693069306931,
2670
  "eval_overall_precision": 0.9361179361179361,
2671
  "eval_overall_recall": 0.9501246882793017,
2672
- "eval_runtime": 0.2961,
2673
- "eval_samples_per_second": 574.052,
2674
- "eval_steps_per_second": 10.13,
2675
  "step": 8256
2676
  },
2677
  {
@@ -2700,9 +2700,9 @@
2700
  "eval_overall_f1": 0.946583850931677,
2701
  "eval_overall_precision": 0.943069306930693,
2702
  "eval_overall_recall": 0.9501246882793017,
2703
- "eval_runtime": 0.296,
2704
- "eval_samples_per_second": 574.399,
2705
- "eval_steps_per_second": 10.136,
2706
  "step": 8352
2707
  },
2708
  {
@@ -2731,9 +2731,9 @@
2731
  "eval_overall_f1": 0.946716232961586,
2732
  "eval_overall_precision": 0.9408866995073891,
2733
  "eval_overall_recall": 0.9526184538653366,
2734
- "eval_runtime": 0.2939,
2735
- "eval_samples_per_second": 578.428,
2736
- "eval_steps_per_second": 10.208,
2737
  "step": 8448
2738
  },
2739
  {
@@ -2762,9 +2762,9 @@
2762
  "eval_overall_f1": 0.9419035846724352,
2763
  "eval_overall_precision": 0.9338235294117647,
2764
  "eval_overall_recall": 0.9501246882793017,
2765
- "eval_runtime": 0.2955,
2766
- "eval_samples_per_second": 575.311,
2767
- "eval_steps_per_second": 10.153,
2768
  "step": 8544
2769
  },
2770
  {
@@ -2793,9 +2793,9 @@
2793
  "eval_overall_f1": 0.946583850931677,
2794
  "eval_overall_precision": 0.943069306930693,
2795
  "eval_overall_recall": 0.9501246882793017,
2796
- "eval_runtime": 0.2943,
2797
- "eval_samples_per_second": 577.551,
2798
- "eval_steps_per_second": 10.192,
2799
  "step": 8640
2800
  },
2801
  {
@@ -2824,9 +2824,9 @@
2824
  "eval_overall_f1": 0.9419035846724352,
2825
  "eval_overall_precision": 0.9338235294117647,
2826
  "eval_overall_recall": 0.9501246882793017,
2827
- "eval_runtime": 0.2941,
2828
- "eval_samples_per_second": 578.128,
2829
- "eval_steps_per_second": 10.202,
2830
  "step": 8736
2831
  },
2832
  {
@@ -2855,9 +2855,9 @@
2855
  "eval_overall_f1": 0.9480198019801981,
2856
  "eval_overall_precision": 0.941031941031941,
2857
  "eval_overall_recall": 0.9551122194513716,
2858
- "eval_runtime": 0.2941,
2859
- "eval_samples_per_second": 577.954,
2860
- "eval_steps_per_second": 10.199,
2861
  "step": 8832
2862
  },
2863
  {
@@ -2886,9 +2886,9 @@
2886
  "eval_overall_f1": 0.9371146732429101,
2887
  "eval_overall_precision": 0.926829268292683,
2888
  "eval_overall_recall": 0.9476309226932669,
2889
- "eval_runtime": 0.2945,
2890
- "eval_samples_per_second": 577.343,
2891
- "eval_steps_per_second": 10.188,
2892
  "step": 8928
2893
  },
2894
  {
@@ -2917,9 +2917,9 @@
2917
  "eval_overall_f1": 0.9430693069306931,
2918
  "eval_overall_precision": 0.9361179361179361,
2919
  "eval_overall_recall": 0.9501246882793017,
2920
- "eval_runtime": 0.2978,
2921
- "eval_samples_per_second": 570.928,
2922
- "eval_steps_per_second": 10.075,
2923
  "step": 9024
2924
  },
2925
  {
@@ -2948,9 +2948,9 @@
2948
  "eval_overall_f1": 0.9419035846724352,
2949
  "eval_overall_precision": 0.9338235294117647,
2950
  "eval_overall_recall": 0.9501246882793017,
2951
- "eval_runtime": 0.2951,
2952
- "eval_samples_per_second": 576.068,
2953
- "eval_steps_per_second": 10.166,
2954
  "step": 9120
2955
  },
2956
  {
@@ -2979,9 +2979,9 @@
2979
  "eval_overall_f1": 0.946583850931677,
2980
  "eval_overall_precision": 0.943069306930693,
2981
  "eval_overall_recall": 0.9501246882793017,
2982
- "eval_runtime": 0.2958,
2983
- "eval_samples_per_second": 574.761,
2984
- "eval_steps_per_second": 10.143,
2985
  "step": 9216
2986
  },
2987
  {
@@ -3010,9 +3010,9 @@
3010
  "eval_overall_f1": 0.9419035846724352,
3011
  "eval_overall_precision": 0.9338235294117647,
3012
  "eval_overall_recall": 0.9501246882793017,
3013
- "eval_runtime": 0.2933,
3014
- "eval_samples_per_second": 579.547,
3015
- "eval_steps_per_second": 10.227,
3016
  "step": 9312
3017
  },
3018
  {
@@ -3041,9 +3041,9 @@
3041
  "eval_overall_f1": 0.9419035846724352,
3042
  "eval_overall_precision": 0.9338235294117647,
3043
  "eval_overall_recall": 0.9501246882793017,
3044
- "eval_runtime": 0.2944,
3045
- "eval_samples_per_second": 577.476,
3046
- "eval_steps_per_second": 10.191,
3047
  "step": 9408
3048
  },
3049
  {
@@ -3072,9 +3072,9 @@
3072
  "eval_overall_f1": 0.9419035846724352,
3073
  "eval_overall_precision": 0.9338235294117647,
3074
  "eval_overall_recall": 0.9501246882793017,
3075
- "eval_runtime": 0.2955,
3076
- "eval_samples_per_second": 575.393,
3077
- "eval_steps_per_second": 10.154,
3078
  "step": 9504
3079
  },
3080
  {
@@ -3103,9 +3103,9 @@
3103
  "eval_overall_f1": 0.9419035846724352,
3104
  "eval_overall_precision": 0.9338235294117647,
3105
  "eval_overall_recall": 0.9501246882793017,
3106
- "eval_runtime": 0.2958,
3107
- "eval_samples_per_second": 574.646,
3108
- "eval_steps_per_second": 10.141,
3109
  "step": 9600
3110
  },
3111
  {
@@ -3113,9 +3113,9 @@
3113
  "step": 9600,
3114
  "total_flos": 4208466347875278.0,
3115
  "train_loss": 0.03501902000978589,
3116
- "train_runtime": 552.429,
3117
- "train_samples_per_second": 277.14,
3118
- "train_steps_per_second": 17.378
3119
  }
3120
  ],
3121
  "logging_steps": 500,
 
34
  "eval_overall_f1": 0.2203626220362622,
35
  "eval_overall_precision": 0.25,
36
  "eval_overall_recall": 0.1970074812967581,
37
+ "eval_runtime": 0.2958,
38
+ "eval_samples_per_second": 574.685,
39
+ "eval_steps_per_second": 10.142,
40
  "step": 96
41
  },
42
  {
 
65
  "eval_overall_f1": 0.5780219780219781,
66
  "eval_overall_precision": 0.5166994106090373,
67
  "eval_overall_recall": 0.655860349127182,
68
+ "eval_runtime": 0.2946,
69
+ "eval_samples_per_second": 577.114,
70
+ "eval_steps_per_second": 10.184,
71
  "step": 192
72
  },
73
  {
 
96
  "eval_overall_f1": 0.803357314148681,
97
  "eval_overall_precision": 0.7736720554272517,
98
  "eval_overall_recall": 0.8354114713216958,
99
+ "eval_runtime": 0.2924,
100
+ "eval_samples_per_second": 581.304,
101
+ "eval_steps_per_second": 10.258,
102
  "step": 288
103
  },
104
  {
 
127
  "eval_overall_f1": 0.857482185273159,
128
  "eval_overall_precision": 0.81859410430839,
129
  "eval_overall_recall": 0.9002493765586035,
130
+ "eval_runtime": 0.2931,
131
+ "eval_samples_per_second": 580.016,
132
+ "eval_steps_per_second": 10.236,
133
  "step": 384
134
  },
135
  {
 
158
  "eval_overall_f1": 0.9093167701863354,
159
  "eval_overall_precision": 0.905940594059406,
160
  "eval_overall_recall": 0.912718204488778,
161
+ "eval_runtime": 0.2956,
162
+ "eval_samples_per_second": 575.164,
163
+ "eval_steps_per_second": 10.15,
164
  "step": 480
165
  },
166
  {
 
189
  "eval_overall_f1": 0.8940886699507389,
190
  "eval_overall_precision": 0.8832116788321168,
191
  "eval_overall_recall": 0.9052369077306733,
192
+ "eval_runtime": 0.2951,
193
+ "eval_samples_per_second": 576.101,
194
+ "eval_steps_per_second": 10.166,
195
  "step": 576
196
  },
197
  {
 
220
  "eval_overall_f1": 0.9200968523002423,
221
  "eval_overall_precision": 0.8941176470588236,
222
  "eval_overall_recall": 0.9476309226932669,
223
+ "eval_runtime": 0.2947,
224
+ "eval_samples_per_second": 576.819,
225
+ "eval_steps_per_second": 10.179,
226
  "step": 672
227
  },
228
  {
 
251
  "eval_overall_f1": 0.9238329238329237,
252
  "eval_overall_precision": 0.910411622276029,
253
  "eval_overall_recall": 0.9376558603491272,
254
+ "eval_runtime": 0.2936,
255
+ "eval_samples_per_second": 579.097,
256
+ "eval_steps_per_second": 10.219,
257
  "step": 768
258
  },
259
  {
 
282
  "eval_overall_f1": 0.9262899262899262,
283
  "eval_overall_precision": 0.9128329297820823,
284
  "eval_overall_recall": 0.940149625935162,
285
+ "eval_runtime": 0.2921,
286
+ "eval_samples_per_second": 582.059,
287
+ "eval_steps_per_second": 10.272,
288
  "step": 864
289
  },
290
  {
 
313
  "eval_overall_f1": 0.9153374233128836,
314
  "eval_overall_precision": 0.9009661835748792,
315
  "eval_overall_recall": 0.9301745635910225,
316
+ "eval_runtime": 0.2946,
317
+ "eval_samples_per_second": 576.963,
318
+ "eval_steps_per_second": 10.182,
319
  "step": 960
320
  },
321
  {
 
344
  "eval_overall_f1": 0.9253365973072215,
345
  "eval_overall_precision": 0.9086538461538461,
346
  "eval_overall_recall": 0.942643391521197,
347
+ "eval_runtime": 0.2959,
348
+ "eval_samples_per_second": 574.541,
349
+ "eval_steps_per_second": 10.139,
350
  "step": 1056
351
  },
352
  {
 
375
  "eval_overall_f1": 0.932349323493235,
376
  "eval_overall_precision": 0.9199029126213593,
377
  "eval_overall_recall": 0.9451371571072319,
378
+ "eval_runtime": 0.2928,
379
+ "eval_samples_per_second": 580.593,
380
+ "eval_steps_per_second": 10.246,
381
  "step": 1152
382
  },
383
  {
 
406
  "eval_overall_f1": 0.9282178217821783,
407
  "eval_overall_precision": 0.9213759213759214,
408
  "eval_overall_recall": 0.9351620947630923,
409
+ "eval_runtime": 0.2932,
410
+ "eval_samples_per_second": 579.856,
411
+ "eval_steps_per_second": 10.233,
412
  "step": 1248
413
  },
414
  {
 
437
  "eval_overall_f1": 0.9369592088998765,
438
  "eval_overall_precision": 0.928921568627451,
439
  "eval_overall_recall": 0.9451371571072319,
440
+ "eval_runtime": 0.2926,
441
+ "eval_samples_per_second": 580.905,
442
+ "eval_steps_per_second": 10.251,
443
  "step": 1344
444
  },
445
  {
 
468
  "eval_overall_f1": 0.9270704573547589,
469
  "eval_overall_precision": 0.9191176470588235,
470
  "eval_overall_recall": 0.9351620947630923,
471
+ "eval_runtime": 0.2927,
472
+ "eval_samples_per_second": 580.788,
473
+ "eval_steps_per_second": 10.249,
474
  "step": 1440
475
  },
476
  {
 
499
  "eval_overall_f1": 0.9318463444857497,
500
  "eval_overall_precision": 0.9261083743842364,
501
  "eval_overall_recall": 0.9376558603491272,
502
+ "eval_runtime": 0.294,
503
+ "eval_samples_per_second": 578.226,
504
+ "eval_steps_per_second": 10.204,
505
  "step": 1536
506
  },
507
  {
 
530
  "eval_overall_f1": 0.9346485819975339,
531
  "eval_overall_precision": 0.9243902439024391,
532
  "eval_overall_recall": 0.9451371571072319,
533
+ "eval_runtime": 0.2926,
534
+ "eval_samples_per_second": 580.917,
535
+ "eval_steps_per_second": 10.251,
536
  "step": 1632
537
  },
538
  {
 
561
  "eval_overall_f1": 0.9376558603491272,
562
  "eval_overall_precision": 0.9376558603491272,
563
  "eval_overall_recall": 0.9376558603491272,
564
+ "eval_runtime": 0.2945,
565
+ "eval_samples_per_second": 577.326,
566
+ "eval_steps_per_second": 10.188,
567
  "step": 1728
568
  },
569
  {
 
592
  "eval_overall_f1": 0.9524999999999999,
593
  "eval_overall_precision": 0.9548872180451128,
594
  "eval_overall_recall": 0.9501246882793017,
595
+ "eval_runtime": 0.2934,
596
+ "eval_samples_per_second": 579.421,
597
+ "eval_steps_per_second": 10.225,
598
  "step": 1824
599
  },
600
  {
 
623
  "eval_overall_f1": 0.9407407407407408,
624
  "eval_overall_precision": 0.9315403422982885,
625
  "eval_overall_recall": 0.9501246882793017,
626
+ "eval_runtime": 0.2935,
627
+ "eval_samples_per_second": 579.202,
628
+ "eval_steps_per_second": 10.221,
629
  "step": 1920
630
  },
631
  {
 
654
  "eval_overall_f1": 0.9394313967861558,
655
  "eval_overall_precision": 0.9313725490196079,
656
  "eval_overall_recall": 0.9476309226932669,
657
+ "eval_runtime": 0.2936,
658
+ "eval_samples_per_second": 579.049,
659
+ "eval_steps_per_second": 10.219,
660
  "step": 2016
661
  },
662
  {
 
685
  "eval_overall_f1": 0.9395807644882862,
686
  "eval_overall_precision": 0.9292682926829269,
687
  "eval_overall_recall": 0.9501246882793017,
688
+ "eval_runtime": 0.2938,
689
+ "eval_samples_per_second": 578.717,
690
+ "eval_steps_per_second": 10.213,
691
  "step": 2112
692
  },
693
  {
 
716
  "eval_overall_f1": 0.949569495694957,
717
  "eval_overall_precision": 0.9368932038834952,
718
  "eval_overall_recall": 0.9625935162094763,
719
+ "eval_runtime": 0.2952,
720
+ "eval_samples_per_second": 575.839,
721
+ "eval_steps_per_second": 10.162,
722
  "step": 2208
723
  },
724
  {
 
747
  "eval_overall_f1": 0.9478908188585606,
748
  "eval_overall_precision": 0.9432098765432099,
749
  "eval_overall_recall": 0.9526184538653366,
750
+ "eval_runtime": 0.2922,
751
+ "eval_samples_per_second": 581.848,
752
+ "eval_steps_per_second": 10.268,
753
  "step": 2304
754
  },
755
  {
 
778
  "eval_overall_f1": 0.9515527950310558,
779
  "eval_overall_precision": 0.948019801980198,
780
  "eval_overall_recall": 0.9551122194513716,
781
+ "eval_runtime": 0.2922,
782
+ "eval_samples_per_second": 581.89,
783
+ "eval_steps_per_second": 10.269,
784
  "step": 2400
785
  },
786
  {
 
809
  "eval_overall_f1": 0.9477611940298507,
810
  "eval_overall_precision": 0.9454094292803971,
811
  "eval_overall_recall": 0.9501246882793017,
812
+ "eval_runtime": 0.2938,
813
+ "eval_samples_per_second": 578.634,
814
+ "eval_steps_per_second": 10.211,
815
  "step": 2496
816
  },
817
  {
 
840
  "eval_overall_f1": 0.9478908188585606,
841
  "eval_overall_precision": 0.9432098765432099,
842
  "eval_overall_recall": 0.9526184538653366,
843
+ "eval_runtime": 0.2917,
844
+ "eval_samples_per_second": 582.867,
845
+ "eval_steps_per_second": 10.286,
846
  "step": 2592
847
  },
848
  {
 
871
  "eval_overall_f1": 0.9408866995073891,
872
  "eval_overall_precision": 0.9294403892944039,
873
  "eval_overall_recall": 0.9526184538653366,
874
+ "eval_runtime": 0.2935,
875
+ "eval_samples_per_second": 579.298,
876
+ "eval_steps_per_second": 10.223,
877
  "step": 2688
878
  },
879
  {
 
902
  "eval_overall_f1": 0.9392812887236679,
903
  "eval_overall_precision": 0.9334975369458128,
904
  "eval_overall_recall": 0.9451371571072319,
905
+ "eval_runtime": 0.2966,
906
+ "eval_samples_per_second": 573.248,
907
+ "eval_steps_per_second": 10.116,
908
  "step": 2784
909
  },
910
  {
 
933
  "eval_overall_f1": 0.942189421894219,
934
  "eval_overall_precision": 0.9296116504854369,
935
  "eval_overall_recall": 0.9551122194513716,
936
+ "eval_runtime": 0.2929,
937
+ "eval_samples_per_second": 580.308,
938
+ "eval_steps_per_second": 10.241,
939
  "step": 2880
940
  },
941
  {
 
964
  "eval_overall_f1": 0.9443757725587144,
965
  "eval_overall_precision": 0.9362745098039216,
966
  "eval_overall_recall": 0.9526184538653366,
967
+ "eval_runtime": 0.2935,
968
+ "eval_samples_per_second": 579.15,
969
+ "eval_steps_per_second": 10.22,
970
  "step": 2976
971
  },
972
  {
 
995
  "eval_overall_f1": 0.9442379182156134,
996
  "eval_overall_precision": 0.9384236453201971,
997
  "eval_overall_recall": 0.9501246882793017,
998
+ "eval_runtime": 0.2945,
999
+ "eval_samples_per_second": 577.309,
1000
+ "eval_steps_per_second": 10.188,
1001
  "step": 3072
1002
  },
1003
  {
 
1026
  "eval_overall_f1": 0.949194547707559,
1027
  "eval_overall_precision": 0.9433497536945813,
1028
  "eval_overall_recall": 0.9551122194513716,
1029
+ "eval_runtime": 0.2947,
1030
+ "eval_samples_per_second": 576.801,
1031
+ "eval_steps_per_second": 10.179,
1032
  "step": 3168
1033
  },
1034
  {
 
1057
  "eval_overall_f1": 0.9514321295143213,
1058
  "eval_overall_precision": 0.9502487562189055,
1059
  "eval_overall_recall": 0.9526184538653366,
1060
+ "eval_runtime": 0.297,
1061
+ "eval_samples_per_second": 572.432,
1062
+ "eval_steps_per_second": 10.102,
1063
  "step": 3264
1064
  },
1065
  {
 
1088
  "eval_overall_f1": 0.9432098765432098,
1089
  "eval_overall_precision": 0.9339853300733496,
1090
  "eval_overall_recall": 0.9526184538653366,
1091
+ "eval_runtime": 0.2949,
1092
+ "eval_samples_per_second": 576.442,
1093
+ "eval_steps_per_second": 10.173,
1094
  "step": 3360
1095
  },
1096
  {
 
1119
  "eval_overall_f1": 0.9417596034696407,
1120
  "eval_overall_precision": 0.9359605911330049,
1121
  "eval_overall_recall": 0.9476309226932669,
1122
+ "eval_runtime": 0.2936,
1123
+ "eval_samples_per_second": 579.066,
1124
+ "eval_steps_per_second": 10.219,
1125
  "step": 3456
1126
  },
1127
  {
 
1150
  "eval_overall_f1": 0.9527363184079602,
1151
  "eval_overall_precision": 0.9503722084367245,
1152
  "eval_overall_recall": 0.9551122194513716,
1153
+ "eval_runtime": 0.2935,
1154
+ "eval_samples_per_second": 579.147,
1155
+ "eval_steps_per_second": 10.22,
1156
  "step": 3552
1157
  },
1158
  {
 
1181
  "eval_overall_f1": 0.9359605911330049,
1182
  "eval_overall_precision": 0.9245742092457421,
1183
  "eval_overall_recall": 0.9476309226932669,
1184
+ "eval_runtime": 0.2953,
1185
+ "eval_samples_per_second": 575.636,
1186
+ "eval_steps_per_second": 10.158,
1187
  "step": 3648
1188
  },
1189
  {
 
1212
  "eval_overall_f1": 0.9369592088998765,
1213
  "eval_overall_precision": 0.928921568627451,
1214
  "eval_overall_recall": 0.9451371571072319,
1215
+ "eval_runtime": 0.2936,
1216
+ "eval_samples_per_second": 579.045,
1217
+ "eval_steps_per_second": 10.218,
1218
  "step": 3744
1219
  },
1220
  {
 
1243
  "eval_overall_f1": 0.949194547707559,
1244
  "eval_overall_precision": 0.9433497536945813,
1245
  "eval_overall_recall": 0.9551122194513716,
1246
+ "eval_runtime": 0.293,
1247
+ "eval_samples_per_second": 580.131,
1248
+ "eval_steps_per_second": 10.238,
1249
  "step": 3840
1250
  },
1251
  {
 
1274
  "eval_overall_f1": 0.946716232961586,
1275
  "eval_overall_precision": 0.9408866995073891,
1276
  "eval_overall_recall": 0.9526184538653366,
1277
+ "eval_runtime": 0.2914,
1278
+ "eval_samples_per_second": 583.341,
1279
+ "eval_steps_per_second": 10.294,
1280
  "step": 3936
1281
  },
1282
  {
 
1305
  "eval_overall_f1": 0.9516728624535316,
1306
  "eval_overall_precision": 0.9458128078817734,
1307
  "eval_overall_recall": 0.9576059850374065,
1308
+ "eval_runtime": 0.2922,
1309
+ "eval_samples_per_second": 581.788,
1310
+ "eval_steps_per_second": 10.267,
1311
  "step": 4032
1312
  },
1313
  {
 
1336
  "eval_overall_f1": 0.9516728624535316,
1337
  "eval_overall_precision": 0.9458128078817734,
1338
  "eval_overall_recall": 0.9576059850374065,
1339
+ "eval_runtime": 0.2934,
1340
+ "eval_samples_per_second": 579.382,
1341
+ "eval_steps_per_second": 10.224,
1342
  "step": 4128
1343
  },
1344
  {
 
1367
  "eval_overall_f1": 0.9443757725587144,
1368
  "eval_overall_precision": 0.9362745098039216,
1369
  "eval_overall_recall": 0.9526184538653366,
1370
+ "eval_runtime": 0.2951,
1371
+ "eval_samples_per_second": 576.031,
1372
+ "eval_steps_per_second": 10.165,
1373
  "step": 4224
1374
  },
1375
  {
 
1398
  "eval_overall_f1": 0.9416149068322982,
1399
  "eval_overall_precision": 0.9381188118811881,
1400
  "eval_overall_recall": 0.9451371571072319,
1401
+ "eval_runtime": 0.3012,
1402
+ "eval_samples_per_second": 564.356,
1403
+ "eval_steps_per_second": 9.959,
1404
  "step": 4320
1405
  },
1406
  {
 
1429
  "eval_overall_f1": 0.949194547707559,
1430
  "eval_overall_precision": 0.9433497536945813,
1431
  "eval_overall_recall": 0.9551122194513716,
1432
+ "eval_runtime": 0.2913,
1433
+ "eval_samples_per_second": 583.503,
1434
+ "eval_steps_per_second": 10.297,
1435
  "step": 4416
1436
  },
1437
  {
 
1460
  "eval_overall_f1": 0.9430693069306931,
1461
  "eval_overall_precision": 0.9361179361179361,
1462
  "eval_overall_recall": 0.9501246882793017,
1463
+ "eval_runtime": 0.2927,
1464
+ "eval_samples_per_second": 580.849,
1465
+ "eval_steps_per_second": 10.25,
1466
  "step": 4512
1467
  },
1468
  {
 
1491
  "eval_overall_f1": 0.9376558603491272,
1492
  "eval_overall_precision": 0.9376558603491272,
1493
  "eval_overall_recall": 0.9376558603491272,
1494
+ "eval_runtime": 0.2963,
1495
+ "eval_samples_per_second": 573.804,
1496
+ "eval_steps_per_second": 10.126,
1497
  "step": 4608
1498
  },
1499
  {
 
1522
  "eval_overall_f1": 0.9318463444857497,
1523
  "eval_overall_precision": 0.9261083743842364,
1524
  "eval_overall_recall": 0.9376558603491272,
1525
+ "eval_runtime": 0.2942,
1526
+ "eval_samples_per_second": 577.811,
1527
+ "eval_steps_per_second": 10.197,
1528
  "step": 4704
1529
  },
1530
  {
 
1553
  "eval_overall_f1": 0.9455445544554455,
1554
  "eval_overall_precision": 0.9385749385749386,
1555
  "eval_overall_recall": 0.9526184538653366,
1556
+ "eval_runtime": 0.2924,
1557
+ "eval_samples_per_second": 581.359,
1558
+ "eval_steps_per_second": 10.259,
1559
  "step": 4800
1560
  },
1561
  {
 
1584
  "eval_overall_f1": 0.9381188118811881,
1585
  "eval_overall_precision": 0.9312039312039312,
1586
  "eval_overall_recall": 0.9451371571072319,
1587
+ "eval_runtime": 0.2925,
1588
+ "eval_samples_per_second": 581.258,
1589
+ "eval_steps_per_second": 10.257,
1590
  "step": 4896
1591
  },
1592
  {
 
1615
  "eval_overall_f1": 0.9416149068322982,
1616
  "eval_overall_precision": 0.9381188118811881,
1617
  "eval_overall_recall": 0.9451371571072319,
1618
+ "eval_runtime": 0.2935,
1619
+ "eval_samples_per_second": 579.129,
1620
+ "eval_steps_per_second": 10.22,
1621
  "step": 4992
1622
  },
1623
  {
 
1646
  "eval_overall_f1": 0.9417596034696407,
1647
  "eval_overall_precision": 0.9359605911330049,
1648
  "eval_overall_recall": 0.9476309226932669,
1649
+ "eval_runtime": 0.2958,
1650
+ "eval_samples_per_second": 574.635,
1651
+ "eval_steps_per_second": 10.141,
1652
  "step": 5088
1653
  },
1654
  {
 
1677
  "eval_overall_f1": 0.946583850931677,
1678
  "eval_overall_precision": 0.943069306930693,
1679
  "eval_overall_recall": 0.9501246882793017,
1680
+ "eval_runtime": 0.2935,
1681
+ "eval_samples_per_second": 579.235,
1682
+ "eval_steps_per_second": 10.222,
1683
  "step": 5184
1684
  },
1685
  {
 
1708
  "eval_overall_f1": 0.9440993788819876,
1709
  "eval_overall_precision": 0.9405940594059405,
1710
  "eval_overall_recall": 0.9476309226932669,
1711
+ "eval_runtime": 0.294,
1712
+ "eval_samples_per_second": 578.325,
1713
+ "eval_steps_per_second": 10.206,
1714
  "step": 5280
1715
  },
1716
  {
 
1739
  "eval_overall_f1": 0.9432098765432098,
1740
  "eval_overall_precision": 0.9339853300733496,
1741
  "eval_overall_recall": 0.9526184538653366,
1742
+ "eval_runtime": 0.2937,
1743
+ "eval_samples_per_second": 578.886,
1744
+ "eval_steps_per_second": 10.216,
1745
  "step": 5376
1746
  },
1747
  {
 
1770
  "eval_overall_f1": 0.9382716049382714,
1771
  "eval_overall_precision": 0.9290953545232273,
1772
  "eval_overall_recall": 0.9476309226932669,
1773
+ "eval_runtime": 0.2947,
1774
+ "eval_samples_per_second": 576.934,
1775
+ "eval_steps_per_second": 10.181,
1776
  "step": 5472
1777
  },
1778
  {
 
1801
  "eval_overall_f1": 0.9455445544554455,
1802
  "eval_overall_precision": 0.9385749385749386,
1803
  "eval_overall_recall": 0.9526184538653366,
1804
+ "eval_runtime": 0.2928,
1805
+ "eval_samples_per_second": 580.542,
1806
+ "eval_steps_per_second": 10.245,
1807
  "step": 5568
1808
  },
1809
  {
 
1832
  "eval_overall_f1": 0.9430693069306931,
1833
  "eval_overall_precision": 0.9361179361179361,
1834
  "eval_overall_recall": 0.9501246882793017,
1835
+ "eval_runtime": 0.2954,
1836
+ "eval_samples_per_second": 575.444,
1837
+ "eval_steps_per_second": 10.155,
1838
  "step": 5664
1839
  },
1840
  {
 
1863
  "eval_overall_f1": 0.9456790123456791,
1864
  "eval_overall_precision": 0.9364303178484108,
1865
  "eval_overall_recall": 0.9551122194513716,
1866
+ "eval_runtime": 0.2939,
1867
+ "eval_samples_per_second": 578.464,
1868
+ "eval_steps_per_second": 10.208,
1869
  "step": 5760
1870
  },
1871
  {
 
1894
  "eval_overall_f1": 0.9455445544554455,
1895
  "eval_overall_precision": 0.9385749385749386,
1896
  "eval_overall_recall": 0.9526184538653366,
1897
+ "eval_runtime": 0.2936,
1898
+ "eval_samples_per_second": 579.115,
1899
+ "eval_steps_per_second": 10.22,
1900
  "step": 5856
1901
  },
1902
  {
 
1925
  "eval_overall_f1": 0.9354838709677419,
1926
  "eval_overall_precision": 0.9308641975308642,
1927
  "eval_overall_recall": 0.940149625935162,
1928
+ "eval_runtime": 0.2935,
1929
+ "eval_samples_per_second": 579.189,
1930
+ "eval_steps_per_second": 10.221,
1931
  "step": 5952
1932
  },
1933
  {
 
1956
  "eval_overall_f1": 0.9456790123456791,
1957
  "eval_overall_precision": 0.9364303178484108,
1958
  "eval_overall_recall": 0.9551122194513716,
1959
+ "eval_runtime": 0.2927,
1960
+ "eval_samples_per_second": 580.719,
1961
+ "eval_steps_per_second": 10.248,
1962
  "step": 6048
1963
  },
1964
  {
 
1987
  "eval_overall_f1": 0.9442379182156134,
1988
  "eval_overall_precision": 0.9384236453201971,
1989
  "eval_overall_recall": 0.9501246882793017,
1990
+ "eval_runtime": 0.2951,
1991
+ "eval_samples_per_second": 576.162,
1992
+ "eval_steps_per_second": 10.168,
1993
  "step": 6144
1994
  },
1995
  {
 
2018
  "eval_overall_f1": 0.9321824907521579,
2019
  "eval_overall_precision": 0.9219512195121952,
2020
  "eval_overall_recall": 0.942643391521197,
2021
+ "eval_runtime": 0.2926,
2022
+ "eval_samples_per_second": 581.067,
2023
+ "eval_steps_per_second": 10.254,
2024
  "step": 6240
2025
  },
2026
  {
 
2049
  "eval_overall_f1": 0.9382716049382714,
2050
  "eval_overall_precision": 0.9290953545232273,
2051
  "eval_overall_recall": 0.9476309226932669,
2052
+ "eval_runtime": 0.2944,
2053
+ "eval_samples_per_second": 577.425,
2054
+ "eval_steps_per_second": 10.19,
2055
  "step": 6336
2056
  },
2057
  {
 
2080
  "eval_overall_f1": 0.9381188118811881,
2081
  "eval_overall_precision": 0.9312039312039312,
2082
  "eval_overall_recall": 0.9451371571072319,
2083
+ "eval_runtime": 0.2939,
2084
+ "eval_samples_per_second": 578.489,
2085
+ "eval_steps_per_second": 10.209,
2086
  "step": 6432
2087
  },
2088
  {
 
2111
  "eval_overall_f1": 0.9429280397022332,
2112
  "eval_overall_precision": 0.9382716049382716,
2113
  "eval_overall_recall": 0.9476309226932669,
2114
+ "eval_runtime": 0.2939,
2115
+ "eval_samples_per_second": 578.427,
2116
+ "eval_steps_per_second": 10.208,
2117
  "step": 6528
2118
  },
2119
  {
 
2142
  "eval_overall_f1": 0.946583850931677,
2143
  "eval_overall_precision": 0.943069306930693,
2144
  "eval_overall_recall": 0.9501246882793017,
2145
+ "eval_runtime": 0.2981,
2146
+ "eval_samples_per_second": 570.262,
2147
+ "eval_steps_per_second": 10.063,
2148
  "step": 6624
2149
  },
2150
  {
 
2173
  "eval_overall_f1": 0.9429280397022332,
2174
  "eval_overall_precision": 0.9382716049382716,
2175
  "eval_overall_recall": 0.9476309226932669,
2176
+ "eval_runtime": 0.2938,
2177
+ "eval_samples_per_second": 578.591,
2178
+ "eval_steps_per_second": 10.21,
2179
  "step": 6720
2180
  },
2181
  {
 
2204
  "eval_overall_f1": 0.9455445544554455,
2205
  "eval_overall_precision": 0.9385749385749386,
2206
  "eval_overall_recall": 0.9526184538653366,
2207
+ "eval_runtime": 0.2931,
2208
+ "eval_samples_per_second": 580.025,
2209
+ "eval_steps_per_second": 10.236,
2210
  "step": 6816
2211
  },
2212
  {
 
2235
  "eval_overall_f1": 0.9419035846724352,
2236
  "eval_overall_precision": 0.9338235294117647,
2237
  "eval_overall_recall": 0.9501246882793017,
2238
+ "eval_runtime": 0.2924,
2239
+ "eval_samples_per_second": 581.48,
2240
+ "eval_steps_per_second": 10.261,
2241
  "step": 6912
2242
  },
2243
  {
 
2266
  "eval_overall_f1": 0.9417596034696407,
2267
  "eval_overall_precision": 0.9359605911330049,
2268
  "eval_overall_recall": 0.9476309226932669,
2269
+ "eval_runtime": 0.2956,
2270
+ "eval_samples_per_second": 575.026,
2271
+ "eval_steps_per_second": 10.148,
2272
  "step": 7008
2273
  },
2274
  {
 
2297
  "eval_overall_f1": 0.9392812887236679,
2298
  "eval_overall_precision": 0.9334975369458128,
2299
  "eval_overall_recall": 0.9451371571072319,
2300
+ "eval_runtime": 0.2973,
2301
+ "eval_samples_per_second": 571.866,
2302
+ "eval_steps_per_second": 10.092,
2303
  "step": 7104
2304
  },
2305
  {
 
2328
  "eval_overall_f1": 0.9419035846724352,
2329
  "eval_overall_precision": 0.9338235294117647,
2330
  "eval_overall_recall": 0.9501246882793017,
2331
+ "eval_runtime": 0.2954,
2332
+ "eval_samples_per_second": 575.432,
2333
+ "eval_steps_per_second": 10.155,
2334
  "step": 7200
2335
  },
2336
  {
 
2359
  "eval_overall_f1": 0.9490683229813663,
2360
  "eval_overall_precision": 0.9455445544554455,
2361
  "eval_overall_recall": 0.9526184538653366,
2362
+ "eval_runtime": 0.2934,
2363
+ "eval_samples_per_second": 579.425,
2364
+ "eval_steps_per_second": 10.225,
2365
  "step": 7296
2366
  },
2367
  {
 
2390
  "eval_overall_f1": 0.9363295880149813,
2391
  "eval_overall_precision": 0.9375,
2392
  "eval_overall_recall": 0.9351620947630923,
2393
+ "eval_runtime": 0.2933,
2394
+ "eval_samples_per_second": 579.667,
2395
+ "eval_steps_per_second": 10.229,
2396
  "step": 7392
2397
  },
2398
  {
 
2421
  "eval_overall_f1": 0.9540372670807453,
2422
  "eval_overall_precision": 0.9504950495049505,
2423
  "eval_overall_recall": 0.9576059850374065,
2424
+ "eval_runtime": 0.2938,
2425
+ "eval_samples_per_second": 578.658,
2426
+ "eval_steps_per_second": 10.212,
2427
  "step": 7488
2428
  },
2429
  {
 
2452
  "eval_overall_f1": 0.9490683229813663,
2453
  "eval_overall_precision": 0.9455445544554455,
2454
  "eval_overall_recall": 0.9526184538653366,
2455
+ "eval_runtime": 0.2947,
2456
+ "eval_samples_per_second": 576.85,
2457
+ "eval_steps_per_second": 10.18,
2458
  "step": 7584
2459
  },
2460
  {
 
2483
  "eval_overall_f1": 0.941469489414695,
2484
  "eval_overall_precision": 0.9402985074626866,
2485
  "eval_overall_recall": 0.942643391521197,
2486
+ "eval_runtime": 0.2967,
2487
+ "eval_samples_per_second": 572.922,
2488
+ "eval_steps_per_second": 10.11,
2489
  "step": 7680
2490
  },
2491
  {
 
2514
  "eval_overall_f1": 0.9381188118811881,
2515
  "eval_overall_precision": 0.9312039312039312,
2516
  "eval_overall_recall": 0.9451371571072319,
2517
+ "eval_runtime": 0.2946,
2518
+ "eval_samples_per_second": 577.151,
2519
+ "eval_steps_per_second": 10.185,
2520
  "step": 7776
2521
  },
2522
  {
 
2545
  "eval_overall_f1": 0.9429280397022332,
2546
  "eval_overall_precision": 0.9382716049382716,
2547
  "eval_overall_recall": 0.9476309226932669,
2548
+ "eval_runtime": 0.2947,
2549
+ "eval_samples_per_second": 576.946,
2550
+ "eval_steps_per_second": 10.181,
2551
  "step": 7872
2552
  },
2553
  {
 
2576
  "eval_overall_f1": 0.9417596034696407,
2577
  "eval_overall_precision": 0.9359605911330049,
2578
  "eval_overall_recall": 0.9476309226932669,
2579
+ "eval_runtime": 0.294,
2580
+ "eval_samples_per_second": 578.264,
2581
+ "eval_steps_per_second": 10.205,
2582
  "step": 7968
2583
  },
2584
  {
 
2607
  "eval_overall_f1": 0.949194547707559,
2608
  "eval_overall_precision": 0.9433497536945813,
2609
  "eval_overall_recall": 0.9551122194513716,
2610
+ "eval_runtime": 0.294,
2611
+ "eval_samples_per_second": 578.246,
2612
+ "eval_steps_per_second": 10.204,
2613
  "step": 8064
2614
  },
2615
  {
 
2638
  "eval_overall_f1": 0.9468479604449938,
2639
  "eval_overall_precision": 0.9387254901960784,
2640
  "eval_overall_recall": 0.9551122194513716,
2641
+ "eval_runtime": 0.2953,
2642
+ "eval_samples_per_second": 575.681,
2643
+ "eval_steps_per_second": 10.159,
2644
  "step": 8160
2645
  },
2646
  {
 
2669
  "eval_overall_f1": 0.9430693069306931,
2670
  "eval_overall_precision": 0.9361179361179361,
2671
  "eval_overall_recall": 0.9501246882793017,
2672
+ "eval_runtime": 0.2949,
2673
+ "eval_samples_per_second": 576.492,
2674
+ "eval_steps_per_second": 10.173,
2675
  "step": 8256
2676
  },
2677
  {
 
2700
  "eval_overall_f1": 0.946583850931677,
2701
  "eval_overall_precision": 0.943069306930693,
2702
  "eval_overall_recall": 0.9501246882793017,
2703
+ "eval_runtime": 0.2934,
2704
+ "eval_samples_per_second": 579.336,
2705
+ "eval_steps_per_second": 10.224,
2706
  "step": 8352
2707
  },
2708
  {
 
2731
  "eval_overall_f1": 0.946716232961586,
2732
  "eval_overall_precision": 0.9408866995073891,
2733
  "eval_overall_recall": 0.9526184538653366,
2734
+ "eval_runtime": 0.2932,
2735
+ "eval_samples_per_second": 579.761,
2736
+ "eval_steps_per_second": 10.231,
2737
  "step": 8448
2738
  },
2739
  {
 
2762
  "eval_overall_f1": 0.9419035846724352,
2763
  "eval_overall_precision": 0.9338235294117647,
2764
  "eval_overall_recall": 0.9501246882793017,
2765
+ "eval_runtime": 0.2968,
2766
+ "eval_samples_per_second": 572.687,
2767
+ "eval_steps_per_second": 10.106,
2768
  "step": 8544
2769
  },
2770
  {
 
2793
  "eval_overall_f1": 0.946583850931677,
2794
  "eval_overall_precision": 0.943069306930693,
2795
  "eval_overall_recall": 0.9501246882793017,
2796
+ "eval_runtime": 0.2948,
2797
+ "eval_samples_per_second": 576.759,
2798
+ "eval_steps_per_second": 10.178,
2799
  "step": 8640
2800
  },
2801
  {
 
2824
  "eval_overall_f1": 0.9419035846724352,
2825
  "eval_overall_precision": 0.9338235294117647,
2826
  "eval_overall_recall": 0.9501246882793017,
2827
+ "eval_runtime": 0.2937,
2828
+ "eval_samples_per_second": 578.886,
2829
+ "eval_steps_per_second": 10.216,
2830
  "step": 8736
2831
  },
2832
  {
 
2855
  "eval_overall_f1": 0.9480198019801981,
2856
  "eval_overall_precision": 0.941031941031941,
2857
  "eval_overall_recall": 0.9551122194513716,
2858
+ "eval_runtime": 0.2932,
2859
+ "eval_samples_per_second": 579.905,
2860
+ "eval_steps_per_second": 10.234,
2861
  "step": 8832
2862
  },
2863
  {
 
2886
  "eval_overall_f1": 0.9371146732429101,
2887
  "eval_overall_precision": 0.926829268292683,
2888
  "eval_overall_recall": 0.9476309226932669,
2889
+ "eval_runtime": 0.2947,
2890
+ "eval_samples_per_second": 576.916,
2891
+ "eval_steps_per_second": 10.181,
2892
  "step": 8928
2893
  },
2894
  {
 
2917
  "eval_overall_f1": 0.9430693069306931,
2918
  "eval_overall_precision": 0.9361179361179361,
2919
  "eval_overall_recall": 0.9501246882793017,
2920
+ "eval_runtime": 0.2937,
2921
+ "eval_samples_per_second": 578.863,
2922
+ "eval_steps_per_second": 10.215,
2923
  "step": 9024
2924
  },
2925
  {
 
2948
  "eval_overall_f1": 0.9419035846724352,
2949
  "eval_overall_precision": 0.9338235294117647,
2950
  "eval_overall_recall": 0.9501246882793017,
2951
+ "eval_runtime": 0.2935,
2952
+ "eval_samples_per_second": 579.128,
2953
+ "eval_steps_per_second": 10.22,
2954
  "step": 9120
2955
  },
2956
  {
 
2979
  "eval_overall_f1": 0.946583850931677,
2980
  "eval_overall_precision": 0.943069306930693,
2981
  "eval_overall_recall": 0.9501246882793017,
2982
+ "eval_runtime": 0.2918,
2983
+ "eval_samples_per_second": 582.535,
2984
+ "eval_steps_per_second": 10.28,
2985
  "step": 9216
2986
  },
2987
  {
 
3010
  "eval_overall_f1": 0.9419035846724352,
3011
  "eval_overall_precision": 0.9338235294117647,
3012
  "eval_overall_recall": 0.9501246882793017,
3013
+ "eval_runtime": 0.2919,
3014
+ "eval_samples_per_second": 582.295,
3015
+ "eval_steps_per_second": 10.276,
3016
  "step": 9312
3017
  },
3018
  {
 
3041
  "eval_overall_f1": 0.9419035846724352,
3042
  "eval_overall_precision": 0.9338235294117647,
3043
  "eval_overall_recall": 0.9501246882793017,
3044
+ "eval_runtime": 0.2941,
3045
+ "eval_samples_per_second": 578.041,
3046
+ "eval_steps_per_second": 10.201,
3047
  "step": 9408
3048
  },
3049
  {
 
3072
  "eval_overall_f1": 0.9419035846724352,
3073
  "eval_overall_precision": 0.9338235294117647,
3074
  "eval_overall_recall": 0.9501246882793017,
3075
+ "eval_runtime": 0.2949,
3076
+ "eval_samples_per_second": 576.383,
3077
+ "eval_steps_per_second": 10.171,
3078
  "step": 9504
3079
  },
3080
  {
 
3103
  "eval_overall_f1": 0.9419035846724352,
3104
  "eval_overall_precision": 0.9338235294117647,
3105
  "eval_overall_recall": 0.9501246882793017,
3106
+ "eval_runtime": 0.2957,
3107
+ "eval_samples_per_second": 574.904,
3108
+ "eval_steps_per_second": 10.145,
3109
  "step": 9600
3110
  },
3111
  {
 
3113
  "step": 9600,
3114
  "total_flos": 4208466347875278.0,
3115
  "train_loss": 0.03501902000978589,
3116
+ "train_runtime": 539.9434,
3117
+ "train_samples_per_second": 283.548,
3118
+ "train_steps_per_second": 17.78
3119
  }
3120
  ],
3121
  "logging_steps": 500,