nyt-ingredient-tagger-gte-small / trainer_state.json
napsternxg's picture
End of training
54f5db1
{
"best_metric": 0.873456597328186,
"best_model_checkpoint": "nyt-ingredient-tagger-gte-small/checkpoint-15000",
"epoch": 5.0,
"eval_steps": 1000,
"global_step": 25255,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.1,
"learning_rate": 4.9010097010492975e-05,
"loss": 1.1066,
"step": 500
},
{
"epoch": 0.2,
"learning_rate": 4.802019402098595e-05,
"loss": 0.9427,
"step": 1000
},
{
"epoch": 0.2,
"eval_COMMENT": {
"f1": 0.6827173347214992,
"number": 6735,
"precision": 0.6076682497393722,
"recall": 0.7789161098737936
},
"eval_NAME": {
"f1": 0.7975022301516503,
"number": 8801,
"precision": 0.7829228243021347,
"recall": 0.8126349278491081
},
"eval_QTY": {
"f1": 0.9832785279507451,
"number": 7088,
"precision": 0.97529493407356,
"recall": 0.9913939051918735
},
"eval_RANGE_END": {
"f1": 0.6793893129770994,
"number": 91,
"precision": 0.52046783625731,
"recall": 0.978021978021978
},
"eval_UNIT": {
"f1": 0.9474663734032653,
"number": 5697,
"precision": 0.914435009797518,
"recall": 0.982973494821836
},
"eval_loss": 0.9320821166038513,
"eval_overall_accuracy": 0.8183442525312686,
"eval_overall_f1": 0.8416219839142092,
"eval_overall_precision": 0.8031853652296277,
"eval_overall_recall": 0.883922286357877,
"eval_runtime": 12.4448,
"eval_samples_per_second": 683.5,
"eval_steps_per_second": 21.374,
"step": 1000
},
{
"epoch": 0.3,
"learning_rate": 4.703029103147892e-05,
"loss": 0.9333,
"step": 1500
},
{
"epoch": 0.4,
"learning_rate": 4.6040388041971886e-05,
"loss": 0.9169,
"step": 2000
},
{
"epoch": 0.4,
"eval_COMMENT": {
"f1": 0.7030077684084721,
"number": 6735,
"precision": 0.6358395387941388,
"recall": 0.7860430586488493
},
"eval_NAME": {
"f1": 0.798910626945309,
"number": 8801,
"precision": 0.781960613643782,
"recall": 0.8166117486649245
},
"eval_QTY": {
"f1": 0.9835744740336898,
"number": 7088,
"precision": 0.9746502285635129,
"recall": 0.9926636568848759
},
"eval_RANGE_END": {
"f1": 0.7543859649122806,
"number": 91,
"precision": 0.6277372262773723,
"recall": 0.945054945054945
},
"eval_UNIT": {
"f1": 0.9503173931443081,
"number": 5697,
"precision": 0.9176201372997712,
"recall": 0.9854309285588907
},
"eval_loss": 0.9112022519111633,
"eval_overall_accuracy": 0.8256066398970201,
"eval_overall_f1": 0.8490143595441308,
"eval_overall_precision": 0.8136878448581847,
"eval_overall_recall": 0.8875475151344502,
"eval_runtime": 12.0886,
"eval_samples_per_second": 703.64,
"eval_steps_per_second": 22.004,
"step": 2000
},
{
"epoch": 0.49,
"learning_rate": 4.505048505246486e-05,
"loss": 0.9126,
"step": 2500
},
{
"epoch": 0.59,
"learning_rate": 4.406058206295783e-05,
"loss": 0.9,
"step": 3000
},
{
"epoch": 0.59,
"eval_COMMENT": {
"f1": 0.7219525171244263,
"number": 6735,
"precision": 0.6538183570224042,
"recall": 0.8059391239792131
},
"eval_NAME": {
"f1": 0.8061383928571427,
"number": 8801,
"precision": 0.7920824651825858,
"recall": 0.8207021929326213
},
"eval_QTY": {
"f1": 0.9870641169853768,
"number": 7088,
"precision": 0.9837443946188341,
"recall": 0.9904063205417607
},
"eval_RANGE_END": {
"f1": 0.7309644670050762,
"number": 91,
"precision": 0.6792452830188679,
"recall": 0.7912087912087912
},
"eval_UNIT": {
"f1": 0.9483108108108108,
"number": 5697,
"precision": 0.9138857235878235,
"recall": 0.9854309285588907
},
"eval_loss": 0.902090847492218,
"eval_overall_accuracy": 0.8302368921593114,
"eval_overall_f1": 0.856395015029214,
"eval_overall_precision": 0.8231188729468285,
"eval_overall_recall": 0.8924750105589188,
"eval_runtime": 14.5748,
"eval_samples_per_second": 583.612,
"eval_steps_per_second": 18.251,
"step": 3000
},
{
"epoch": 0.69,
"learning_rate": 4.3070679073450804e-05,
"loss": 0.9058,
"step": 3500
},
{
"epoch": 0.79,
"learning_rate": 4.208077608394378e-05,
"loss": 0.9061,
"step": 4000
},
{
"epoch": 0.79,
"eval_COMMENT": {
"f1": 0.7202272266179753,
"number": 6735,
"precision": 0.6613263785394933,
"recall": 0.7906458797327395
},
"eval_NAME": {
"f1": 0.8081158124196521,
"number": 8801,
"precision": 0.7952695269526953,
"recall": 0.821383933643904
},
"eval_QTY": {
"f1": 0.9869014084507043,
"number": 7088,
"precision": 0.985236220472441,
"recall": 0.9885722347629797
},
"eval_RANGE_END": {
"f1": 0.7592592592592593,
"number": 91,
"precision": 0.656,
"recall": 0.9010989010989011
},
"eval_UNIT": {
"f1": 0.9522355137015356,
"number": 5697,
"precision": 0.9215106732348112,
"recall": 0.9850798665964543
},
"eval_loss": 0.8911505341529846,
"eval_overall_accuracy": 0.8325616246229515,
"eval_overall_f1": 0.857831898235424,
"eval_overall_precision": 0.8288752502543569,
"eval_overall_recall": 0.8888849781782345,
"eval_runtime": 12.1725,
"eval_samples_per_second": 698.791,
"eval_steps_per_second": 21.853,
"step": 4000
},
{
"epoch": 0.89,
"learning_rate": 4.109087309443675e-05,
"loss": 0.8962,
"step": 4500
},
{
"epoch": 0.99,
"learning_rate": 4.010097010492972e-05,
"loss": 0.8889,
"step": 5000
},
{
"epoch": 0.99,
"eval_COMMENT": {
"f1": 0.7147275101367603,
"number": 6735,
"precision": 0.6653019447287615,
"recall": 0.7720861172976986
},
"eval_NAME": {
"f1": 0.8085439498993513,
"number": 8801,
"precision": 0.7959925134867335,
"recall": 0.8214975570957845
},
"eval_QTY": {
"f1": 0.9872508276396421,
"number": 7088,
"precision": 0.9857926571951048,
"recall": 0.9887133182844243
},
"eval_RANGE_END": {
"f1": 0.7623318385650225,
"number": 91,
"precision": 0.6439393939393939,
"recall": 0.9340659340659341
},
"eval_UNIT": {
"f1": 0.9522514868309261,
"number": 5697,
"precision": 0.9227729293594599,
"recall": 0.9836756187467088
},
"eval_loss": 0.8908107876777649,
"eval_overall_accuracy": 0.8310630367538281,
"eval_overall_f1": 0.8572110874200426,
"eval_overall_precision": 0.8316618674080694,
"eval_overall_recall": 0.8843798395044348,
"eval_runtime": 12.1451,
"eval_samples_per_second": 700.364,
"eval_steps_per_second": 21.902,
"step": 5000
},
{
"epoch": 1.09,
"learning_rate": 3.911106711542269e-05,
"loss": 0.8786,
"step": 5500
},
{
"epoch": 1.19,
"learning_rate": 3.812116412591566e-05,
"loss": 0.88,
"step": 6000
},
{
"epoch": 1.19,
"eval_COMMENT": {
"f1": 0.7254114813327982,
"number": 6735,
"precision": 0.660211910851297,
"recall": 0.8048997772828508
},
"eval_NAME": {
"f1": 0.8067433292397008,
"number": 8801,
"precision": 0.7929331723910896,
"recall": 0.8210430632882627
},
"eval_QTY": {
"f1": 0.9868633649455567,
"number": 7088,
"precision": 0.9827899818105499,
"recall": 0.9909706546275395
},
"eval_RANGE_END": {
"f1": 0.7631578947368421,
"number": 91,
"precision": 0.635036496350365,
"recall": 0.9560439560439561
},
"eval_UNIT": {
"f1": 0.9526315789473684,
"number": 5697,
"precision": 0.9224067072168338,
"recall": 0.984904335615236
},
"eval_loss": 0.8873026371002197,
"eval_overall_accuracy": 0.8337912351822321,
"eval_overall_f1": 0.8584674212814917,
"eval_overall_precision": 0.8265941155387573,
"eval_overall_recall": 0.8928973673095875,
"eval_runtime": 13.0658,
"eval_samples_per_second": 651.014,
"eval_steps_per_second": 20.359,
"step": 6000
},
{
"epoch": 1.29,
"learning_rate": 3.7131261136408633e-05,
"loss": 0.8761,
"step": 6500
},
{
"epoch": 1.39,
"learning_rate": 3.6141358146901606e-05,
"loss": 0.8751,
"step": 7000
},
{
"epoch": 1.39,
"eval_COMMENT": {
"f1": 0.7309149972929073,
"number": 6735,
"precision": 0.6715582638975252,
"recall": 0.8017817371937639
},
"eval_NAME": {
"f1": 0.8121178120617111,
"number": 8801,
"precision": 0.8020833333333334,
"recall": 0.8224065447108283
},
"eval_QTY": {
"f1": 0.9871903153153153,
"number": 7088,
"precision": 0.9849719101123595,
"recall": 0.9894187358916479
},
"eval_RANGE_END": {
"f1": 0.7565217391304349,
"number": 91,
"precision": 0.6258992805755396,
"recall": 0.9560439560439561
},
"eval_UNIT": {
"f1": 0.9523647209203238,
"number": 5697,
"precision": 0.9254720105995363,
"recall": 0.9808671230472178
},
"eval_loss": 0.8865671157836914,
"eval_overall_accuracy": 0.834847931756614,
"eval_overall_f1": 0.8618096437200122,
"eval_overall_precision": 0.8341347737303207,
"eval_overall_recall": 0.8913839222863579,
"eval_runtime": 12.663,
"eval_samples_per_second": 671.721,
"eval_steps_per_second": 21.006,
"step": 7000
},
{
"epoch": 1.48,
"learning_rate": 3.515145515739457e-05,
"loss": 0.8836,
"step": 7500
},
{
"epoch": 1.58,
"learning_rate": 3.416155216788755e-05,
"loss": 0.8816,
"step": 8000
},
{
"epoch": 1.58,
"eval_COMMENT": {
"f1": 0.7336898395721925,
"number": 6735,
"precision": 0.6672340425531915,
"recall": 0.8148478099480326
},
"eval_NAME": {
"f1": 0.8090705487122061,
"number": 8801,
"precision": 0.797549398388343,
"recall": 0.8209294398363822
},
"eval_QTY": {
"f1": 0.9869745828346124,
"number": 7088,
"precision": 0.9851018973998594,
"recall": 0.988854401805869
},
"eval_RANGE_END": {
"f1": 0.7623318385650225,
"number": 91,
"precision": 0.6439393939393939,
"recall": 0.9340659340659341
},
"eval_UNIT": {
"f1": 0.9534507701472215,
"number": 5697,
"precision": 0.9253386190948133,
"recall": 0.9833245567842724
},
"eval_loss": 0.8822705745697021,
"eval_overall_accuracy": 0.835962266325962,
"eval_overall_f1": 0.8613658321609573,
"eval_overall_precision": 0.8307667157103155,
"eval_overall_recall": 0.8943052231451499,
"eval_runtime": 12.6561,
"eval_samples_per_second": 672.089,
"eval_steps_per_second": 21.018,
"step": 8000
},
{
"epoch": 1.68,
"learning_rate": 3.317164917838052e-05,
"loss": 0.8785,
"step": 8500
},
{
"epoch": 1.78,
"learning_rate": 3.218174618887349e-05,
"loss": 0.8756,
"step": 9000
},
{
"epoch": 1.78,
"eval_COMMENT": {
"f1": 0.7321063394683027,
"number": 6735,
"precision": 0.6767485822306238,
"recall": 0.7973273942093542
},
"eval_NAME": {
"f1": 0.8122265844083006,
"number": 8801,
"precision": 0.8019714254070218,
"recall": 0.8227474150664698
},
"eval_QTY": {
"f1": 0.9867829021372329,
"number": 7088,
"precision": 0.9834641255605381,
"recall": 0.9901241534988713
},
"eval_RANGE_END": {
"f1": 0.7864077669902914,
"number": 91,
"precision": 0.7043478260869566,
"recall": 0.8901098901098901
},
"eval_UNIT": {
"f1": 0.9523567310952866,
"number": 5697,
"precision": 0.9209706509263814,
"recall": 0.9859575215025452
},
"eval_loss": 0.8817200660705566,
"eval_overall_accuracy": 0.8375377048550404,
"eval_overall_f1": 0.8625481047576883,
"eval_overall_precision": 0.8354885531437619,
"eval_overall_recall": 0.891419118682247,
"eval_runtime": 13.1407,
"eval_samples_per_second": 647.302,
"eval_steps_per_second": 20.242,
"step": 9000
},
{
"epoch": 1.88,
"learning_rate": 3.119184319936647e-05,
"loss": 0.8739,
"step": 9500
},
{
"epoch": 1.98,
"learning_rate": 3.0201940209859435e-05,
"loss": 0.8695,
"step": 10000
},
{
"epoch": 1.98,
"eval_COMMENT": {
"f1": 0.7372581084764241,
"number": 6735,
"precision": 0.6812743986903412,
"recall": 0.8032665181885672
},
"eval_NAME": {
"f1": 0.8095131505316173,
"number": 8801,
"precision": 0.7975521005623553,
"recall": 0.821838427451426
},
"eval_QTY": {
"f1": 0.9853692684634231,
"number": 7088,
"precision": 0.9779074614422676,
"recall": 0.9929458239277652
},
"eval_RANGE_END": {
"f1": 0.7639484978540774,
"number": 91,
"precision": 0.6267605633802817,
"recall": 0.978021978021978
},
"eval_UNIT": {
"f1": 0.9517510387518019,
"number": 5697,
"precision": 0.9206036745406824,
"recall": 0.9850798665964543
},
"eval_loss": 0.8788286447525024,
"eval_overall_accuracy": 0.8376145555149955,
"eval_overall_f1": 0.8624972390709686,
"eval_overall_precision": 0.8337001149614058,
"eval_overall_recall": 0.8933549204561453,
"eval_runtime": 12.7467,
"eval_samples_per_second": 667.312,
"eval_steps_per_second": 20.868,
"step": 10000
},
{
"epoch": 2.08,
"learning_rate": 2.9212037220352405e-05,
"loss": 0.8595,
"step": 10500
},
{
"epoch": 2.18,
"learning_rate": 2.8222134230845377e-05,
"loss": 0.8537,
"step": 11000
},
{
"epoch": 2.18,
"eval_COMMENT": {
"f1": 0.741655859668282,
"number": 6735,
"precision": 0.6863314805457301,
"recall": 0.8066815144766147
},
"eval_NAME": {
"f1": 0.8129971988795517,
"number": 8801,
"precision": 0.8018565587357719,
"recall": 0.8244517668446767
},
"eval_QTY": {
"f1": 0.9869308600337269,
"number": 7088,
"precision": 0.9830627099664053,
"recall": 0.9908295711060948
},
"eval_RANGE_END": {
"f1": 0.792626728110599,
"number": 91,
"precision": 0.6825396825396826,
"recall": 0.945054945054945
},
"eval_UNIT": {
"f1": 0.9528510638297872,
"number": 5697,
"precision": 0.9248306624814142,
"recall": 0.9826224328593997
},
"eval_loss": 0.8804447650909424,
"eval_overall_accuracy": 0.8384022747795347,
"eval_overall_f1": 0.8652810902896081,
"eval_overall_precision": 0.8384838880084522,
"eval_overall_recall": 0.8938476699985921,
"eval_runtime": 13.7729,
"eval_samples_per_second": 617.589,
"eval_steps_per_second": 19.313,
"step": 11000
},
{
"epoch": 2.28,
"learning_rate": 2.7232231241338353e-05,
"loss": 0.8543,
"step": 11500
},
{
"epoch": 2.38,
"learning_rate": 2.6242328251831323e-05,
"loss": 0.854,
"step": 12000
},
{
"epoch": 2.38,
"eval_COMMENT": {
"f1": 0.7438095238095238,
"number": 6735,
"precision": 0.6863779033270558,
"recall": 0.8117297698589458
},
"eval_NAME": {
"f1": 0.8151350137539999,
"number": 8801,
"precision": 0.8055925432756325,
"recall": 0.8249062606521986
},
"eval_QTY": {
"f1": 0.9872119168071951,
"number": 7088,
"precision": 0.9833426651735723,
"recall": 0.9911117381489842
},
"eval_RANGE_END": {
"f1": 0.7982062780269058,
"number": 91,
"precision": 0.6742424242424242,
"recall": 0.978021978021978
},
"eval_UNIT": {
"f1": 0.9521952873368368,
"number": 5697,
"precision": 0.9206687428290444,
"recall": 0.9859575215025452
},
"eval_loss": 0.8816655278205872,
"eval_overall_accuracy": 0.8389594420642087,
"eval_overall_f1": 0.8664193581322533,
"eval_overall_precision": 0.8387033010476379,
"eval_overall_recall": 0.8960298465437139,
"eval_runtime": 12.7157,
"eval_samples_per_second": 668.937,
"eval_steps_per_second": 20.919,
"step": 12000
},
{
"epoch": 2.47,
"learning_rate": 2.5252425262324292e-05,
"loss": 0.8609,
"step": 12500
},
{
"epoch": 2.57,
"learning_rate": 2.4262522272817265e-05,
"loss": 0.8582,
"step": 13000
},
{
"epoch": 2.57,
"eval_COMMENT": {
"f1": 0.7477459155311504,
"number": 6735,
"precision": 0.6879990019960079,
"recall": 0.8188567186340014
},
"eval_NAME": {
"f1": 0.8148396844049018,
"number": 8801,
"precision": 0.8027563395810364,
"recall": 0.8272923531416885
},
"eval_QTY": {
"f1": 0.9867996067967982,
"number": 7088,
"precision": 0.9822476935979871,
"recall": 0.9913939051918735
},
"eval_RANGE_END": {
"f1": 0.772093023255814,
"number": 91,
"precision": 0.6693548387096774,
"recall": 0.9120879120879121
},
"eval_UNIT": {
"f1": 0.9524215552523875,
"number": 5697,
"precision": 0.9260487481346377,
"recall": 0.9803405301035633
},
"eval_loss": 0.8745654225349426,
"eval_overall_accuracy": 0.8401890526234894,
"eval_overall_f1": 0.8669376094682606,
"eval_overall_precision": 0.8386576739595328,
"eval_overall_recall": 0.897191327608053,
"eval_runtime": 10.2599,
"eval_samples_per_second": 829.055,
"eval_steps_per_second": 25.926,
"step": 13000
},
{
"epoch": 2.67,
"learning_rate": 2.3272619283310237e-05,
"loss": 0.8617,
"step": 13500
},
{
"epoch": 2.77,
"learning_rate": 2.2282716293803206e-05,
"loss": 0.8554,
"step": 14000
},
{
"epoch": 2.77,
"eval_COMMENT": {
"f1": 0.7481907338518768,
"number": 6735,
"precision": 0.6870807453416149,
"recall": 0.8212323682256867
},
"eval_NAME": {
"f1": 0.8165394973070018,
"number": 8801,
"precision": 0.8064945140197274,
"recall": 0.8268378593341665
},
"eval_QTY": {
"f1": 0.9876282862364684,
"number": 7088,
"precision": 0.9841692350798543,
"recall": 0.9911117381489842
},
"eval_RANGE_END": {
"f1": 0.7777777777777778,
"number": 91,
"precision": 0.672,
"recall": 0.9230769230769231
},
"eval_UNIT": {
"f1": 0.9534646739130435,
"number": 5697,
"precision": 0.923507155782201,
"recall": 0.9854309285588907
},
"eval_loss": 0.8742881417274475,
"eval_overall_accuracy": 0.8416107898326577,
"eval_overall_f1": 0.8680027878355177,
"eval_overall_precision": 0.8394213381555153,
"eval_overall_recall": 0.8985991834436153,
"eval_runtime": 10.2908,
"eval_samples_per_second": 826.561,
"eval_steps_per_second": 25.848,
"step": 14000
},
{
"epoch": 2.87,
"learning_rate": 2.129281330429618e-05,
"loss": 0.8553,
"step": 14500
},
{
"epoch": 2.97,
"learning_rate": 2.0302910314789152e-05,
"loss": 0.86,
"step": 15000
},
{
"epoch": 2.97,
"eval_COMMENT": {
"f1": 0.7449105068998496,
"number": 6735,
"precision": 0.6898646083765658,
"recall": 0.8095025983667409
},
"eval_NAME": {
"f1": 0.8143625364104862,
"number": 8801,
"precision": 0.8031156778256546,
"recall": 0.8259288717191229
},
"eval_QTY": {
"f1": 0.9873542222846705,
"number": 7088,
"precision": 0.9833473271760426,
"recall": 0.9913939051918735
},
"eval_RANGE_END": {
"f1": 0.7547169811320755,
"number": 91,
"precision": 0.6611570247933884,
"recall": 0.8791208791208791
},
"eval_UNIT": {
"f1": 0.9538566320449514,
"number": 5697,
"precision": 0.9261034881798644,
"recall": 0.9833245567842724
},
"eval_loss": 0.873456597328186,
"eval_overall_accuracy": 0.8422640204422756,
"eval_overall_f1": 0.866705292934801,
"eval_overall_precision": 0.8401057152296003,
"eval_overall_recall": 0.8950443474588202,
"eval_runtime": 10.9665,
"eval_samples_per_second": 775.635,
"eval_steps_per_second": 24.256,
"step": 15000
},
{
"epoch": 3.07,
"learning_rate": 1.9313007325282124e-05,
"loss": 0.8414,
"step": 15500
},
{
"epoch": 3.17,
"learning_rate": 1.8323104335775097e-05,
"loss": 0.845,
"step": 16000
},
{
"epoch": 3.17,
"eval_COMMENT": {
"f1": 0.7413599325653274,
"number": 6735,
"precision": 0.7035061991734436,
"recall": 0.7835189309576838
},
"eval_NAME": {
"f1": 0.8080446927374302,
"number": 8801,
"precision": 0.7948126167710737,
"recall": 0.8217248039995455
},
"eval_QTY": {
"f1": 0.9871533871533871,
"number": 7088,
"precision": 0.982394858180802,
"recall": 0.9919582392776524
},
"eval_RANGE_END": {
"f1": 0.7777777777777778,
"number": 91,
"precision": 0.719626168224299,
"recall": 0.8461538461538461
},
"eval_UNIT": {
"f1": 0.9531036834924966,
"number": 5697,
"precision": 0.9267119880616813,
"recall": 0.981042654028436
},
"eval_loss": 0.878207266330719,
"eval_overall_accuracy": 0.8396895233337817,
"eval_overall_f1": 0.8645960176308162,
"eval_overall_precision": 0.8431510286001004,
"eval_overall_recall": 0.8871603547796706,
"eval_runtime": 11.5191,
"eval_samples_per_second": 738.424,
"eval_steps_per_second": 23.092,
"step": 16000
},
{
"epoch": 3.27,
"learning_rate": 1.7333201346268066e-05,
"loss": 0.8353,
"step": 16500
},
{
"epoch": 3.37,
"learning_rate": 1.634329835676104e-05,
"loss": 0.846,
"step": 17000
},
{
"epoch": 3.37,
"eval_COMMENT": {
"f1": 0.7456715182451542,
"number": 6735,
"precision": 0.6963411491883535,
"recall": 0.8025241276911655
},
"eval_NAME": {
"f1": 0.8116995693753145,
"number": 8801,
"precision": 0.7992290748898678,
"recall": 0.8245653902965572
},
"eval_QTY": {
"f1": 0.9874859392575928,
"number": 7088,
"precision": 0.984164798206278,
"recall": 0.9908295711060948
},
"eval_RANGE_END": {
"f1": 0.7641509433962264,
"number": 91,
"precision": 0.6694214876033058,
"recall": 0.8901098901098901
},
"eval_UNIT": {
"f1": 0.9531343029684443,
"number": 5697,
"precision": 0.9245874587458746,
"recall": 0.9835000877654906
},
"eval_loss": 0.8758910298347473,
"eval_overall_accuracy": 0.8402659032834444,
"eval_overall_f1": 0.8662648751088423,
"eval_overall_precision": 0.8411751052753739,
"eval_overall_recall": 0.8928973673095875,
"eval_runtime": 12.1757,
"eval_samples_per_second": 698.602,
"eval_steps_per_second": 21.847,
"step": 17000
},
{
"epoch": 3.46,
"learning_rate": 1.535339536725401e-05,
"loss": 0.8452,
"step": 17500
},
{
"epoch": 3.56,
"learning_rate": 1.4363492377746981e-05,
"loss": 0.8392,
"step": 18000
},
{
"epoch": 3.56,
"eval_COMMENT": {
"f1": 0.7475519133273144,
"number": 6735,
"precision": 0.7022442588726514,
"recall": 0.799109131403118
},
"eval_NAME": {
"f1": 0.8129017832187377,
"number": 8801,
"precision": 0.8000660211267606,
"recall": 0.8261561186228837
},
"eval_QTY": {
"f1": 0.987295570997403,
"number": 7088,
"precision": 0.9823997765050985,
"recall": 0.9922404063205418
},
"eval_RANGE_END": {
"f1": 0.7809523809523808,
"number": 91,
"precision": 0.6890756302521008,
"recall": 0.9010989010989011
},
"eval_UNIT": {
"f1": 0.9535298615240847,
"number": 5697,
"precision": 0.9239380968060587,
"recall": 0.9850798665964543
},
"eval_loss": 0.8759370446205139,
"eval_overall_accuracy": 0.8409191338930623,
"eval_overall_f1": 0.8674550550276846,
"eval_overall_precision": 0.8430773319160244,
"eval_overall_recall": 0.8932845276643672,
"eval_runtime": 12.9734,
"eval_samples_per_second": 655.647,
"eval_steps_per_second": 20.503,
"step": 18000
},
{
"epoch": 3.66,
"learning_rate": 1.3373589388239954e-05,
"loss": 0.8436,
"step": 18500
},
{
"epoch": 3.76,
"learning_rate": 1.2383686398732925e-05,
"loss": 0.8375,
"step": 19000
},
{
"epoch": 3.76,
"eval_COMMENT": {
"f1": 0.7500341670083366,
"number": 6735,
"precision": 0.6947714900620332,
"recall": 0.8148478099480326
},
"eval_NAME": {
"f1": 0.8153302283822457,
"number": 8801,
"precision": 0.8054323725055432,
"recall": 0.8254743779116009
},
"eval_QTY": {
"f1": 0.9877046300850137,
"number": 7088,
"precision": 0.9837648705388383,
"recall": 0.991676072234763
},
"eval_RANGE_END": {
"f1": 0.7751196172248803,
"number": 91,
"precision": 0.6864406779661016,
"recall": 0.8901098901098901
},
"eval_UNIT": {
"f1": 0.9524700280588385,
"number": 5697,
"precision": 0.9236477572559367,
"recall": 0.9831490258030542
},
"eval_loss": 0.8779729008674622,
"eval_overall_accuracy": 0.8412841745278488,
"eval_overall_f1": 0.8682191687408367,
"eval_overall_precision": 0.8418964491172386,
"eval_overall_recall": 0.8962410249190483,
"eval_runtime": 12.8106,
"eval_samples_per_second": 663.98,
"eval_steps_per_second": 20.764,
"step": 19000
},
{
"epoch": 3.86,
"learning_rate": 1.1393783409225896e-05,
"loss": 0.8358,
"step": 19500
},
{
"epoch": 3.96,
"learning_rate": 1.0403880419718868e-05,
"loss": 0.8366,
"step": 20000
},
{
"epoch": 3.96,
"eval_COMMENT": {
"f1": 0.7509641873278236,
"number": 6735,
"precision": 0.7003211303789338,
"recall": 0.8095025983667409
},
"eval_NAME": {
"f1": 0.8146694330735154,
"number": 8801,
"precision": 0.804251550044287,
"recall": 0.8253607544597205
},
"eval_QTY": {
"f1": 0.9872137136433891,
"number": 7088,
"precision": 0.9832073887489504,
"recall": 0.9912528216704289
},
"eval_RANGE_END": {
"f1": 0.7783251231527095,
"number": 91,
"precision": 0.7053571428571429,
"recall": 0.8681318681318682
},
"eval_UNIT": {
"f1": 0.9528422125924038,
"number": 5697,
"precision": 0.9234189723320159,
"recall": 0.9842022116903634
},
"eval_loss": 0.8742325305938721,
"eval_overall_accuracy": 0.841668427827624,
"eval_overall_f1": 0.8684574531668914,
"eval_overall_precision": 0.8434670116429496,
"eval_overall_recall": 0.8949739546670421,
"eval_runtime": 12.4853,
"eval_samples_per_second": 681.281,
"eval_steps_per_second": 21.305,
"step": 20000
},
{
"epoch": 4.06,
"learning_rate": 9.41397743021184e-06,
"loss": 0.8274,
"step": 20500
},
{
"epoch": 4.16,
"learning_rate": 8.424074440704812e-06,
"loss": 0.8189,
"step": 21000
},
{
"epoch": 4.16,
"eval_COMMENT": {
"f1": 0.7531697905181918,
"number": 6735,
"precision": 0.7027131284557027,
"recall": 0.8114328136599851
},
"eval_NAME": {
"f1": 0.8157082748948107,
"number": 8801,
"precision": 0.8056294326241135,
"recall": 0.8260424951710033
},
"eval_QTY": {
"f1": 0.9872937872937874,
"number": 7088,
"precision": 0.9825345815285734,
"recall": 0.9920993227990971
},
"eval_RANGE_END": {
"f1": 0.7751196172248803,
"number": 91,
"precision": 0.6864406779661016,
"recall": 0.8901098901098901
},
"eval_UNIT": {
"f1": 0.9539115646258504,
"number": 5697,
"precision": 0.9251195777667821,
"recall": 0.9845532736527998
},
"eval_loss": 0.8799063563346863,
"eval_overall_accuracy": 0.8425137850871295,
"eval_overall_f1": 0.8695667025328346,
"eval_overall_precision": 0.8446531072696506,
"eval_overall_recall": 0.8959946501478249,
"eval_runtime": 14.411,
"eval_samples_per_second": 590.242,
"eval_steps_per_second": 18.458,
"step": 21000
},
{
"epoch": 4.26,
"learning_rate": 7.434171451197783e-06,
"loss": 0.8352,
"step": 21500
},
{
"epoch": 4.36,
"learning_rate": 6.444268461690754e-06,
"loss": 0.8269,
"step": 22000
},
{
"epoch": 4.36,
"eval_COMMENT": {
"f1": 0.7478056534660309,
"number": 6735,
"precision": 0.6995086630462891,
"recall": 0.8032665181885672
},
"eval_NAME": {
"f1": 0.8122026308424294,
"number": 8801,
"precision": 0.8004192409532216,
"recall": 0.8243381433927963
},
"eval_QTY": {
"f1": 0.987140749068934,
"number": 7088,
"precision": 0.9833403331933361,
"recall": 0.9909706546275395
},
"eval_RANGE_END": {
"f1": 0.7843137254901961,
"number": 91,
"precision": 0.7079646017699115,
"recall": 0.8791208791208791
},
"eval_UNIT": {
"f1": 0.9531422740028915,
"number": 5697,
"precision": 0.9244473771032663,
"recall": 0.9836756187467088
},
"eval_loss": 0.87808758020401,
"eval_overall_accuracy": 0.8418029164825453,
"eval_overall_f1": 0.8670379989065063,
"eval_overall_precision": 0.8425089653340417,
"eval_overall_recall": 0.8930381528931437,
"eval_runtime": 13.8025,
"eval_samples_per_second": 616.264,
"eval_steps_per_second": 19.272,
"step": 22000
},
{
"epoch": 4.45,
"learning_rate": 5.4543654721837265e-06,
"loss": 0.8231,
"step": 22500
},
{
"epoch": 4.55,
"learning_rate": 4.4644624826766974e-06,
"loss": 0.829,
"step": 23000
},
{
"epoch": 4.55,
"eval_COMMENT": {
"f1": 0.7491170971539367,
"number": 6735,
"precision": 0.70192058136517,
"recall": 0.8031180400890868
},
"eval_NAME": {
"f1": 0.8114726601811473,
"number": 8801,
"precision": 0.7987892129884425,
"recall": 0.8245653902965572
},
"eval_QTY": {
"f1": 0.9874929735806632,
"number": 7088,
"precision": 0.9836226203807391,
"recall": 0.9913939051918735
},
"eval_RANGE_END": {
"f1": 0.7745098039215685,
"number": 91,
"precision": 0.6991150442477876,
"recall": 0.8681318681318682
},
"eval_UNIT": {
"f1": 0.9533855052739026,
"number": 5697,
"precision": 0.9249050998514606,
"recall": 0.9836756187467088
},
"eval_loss": 0.8793897032737732,
"eval_overall_accuracy": 0.8421679571173317,
"eval_overall_f1": 0.8672738768605068,
"eval_overall_precision": 0.8428604643438403,
"eval_overall_recall": 0.8931437420808109,
"eval_runtime": 11.6472,
"eval_samples_per_second": 730.305,
"eval_steps_per_second": 22.838,
"step": 23000
},
{
"epoch": 4.65,
"learning_rate": 3.4745594931696697e-06,
"loss": 0.8202,
"step": 23500
},
{
"epoch": 4.75,
"learning_rate": 2.484656503662641e-06,
"loss": 0.8183,
"step": 24000
},
{
"epoch": 4.75,
"eval_COMMENT": {
"f1": 0.7519550006859651,
"number": 6735,
"precision": 0.6988397296952696,
"recall": 0.8138084632516703
},
"eval_NAME": {
"f1": 0.8162898973467212,
"number": 8801,
"precision": 0.806115665854199,
"recall": 0.826724235882286
},
"eval_QTY": {
"f1": 0.9871389415981446,
"number": 7088,
"precision": 0.9834757036829576,
"recall": 0.9908295711060948
},
"eval_RANGE_END": {
"f1": 0.7692307692307692,
"number": 91,
"precision": 0.6837606837606838,
"recall": 0.8791208791208791
},
"eval_UNIT": {
"f1": 0.9531422740028915,
"number": 5697,
"precision": 0.9244473771032663,
"recall": 0.9836756187467088
},
"eval_loss": 0.8815182447433472,
"eval_overall_accuracy": 0.8428019750619609,
"eval_overall_f1": 0.8690636678554975,
"eval_overall_precision": 0.8434860379608466,
"eval_overall_recall": 0.8962410249190483,
"eval_runtime": 10.2447,
"eval_samples_per_second": 830.287,
"eval_steps_per_second": 25.965,
"step": 24000
},
{
"epoch": 4.85,
"learning_rate": 1.4947535141556129e-06,
"loss": 0.8271,
"step": 24500
},
{
"epoch": 4.95,
"learning_rate": 5.048505246485845e-07,
"loss": 0.8201,
"step": 25000
},
{
"epoch": 4.95,
"eval_COMMENT": {
"f1": 0.7506890848952591,
"number": 6735,
"precision": 0.7003986112897004,
"recall": 0.8087602078693392
},
"eval_NAME": {
"f1": 0.8135612216307089,
"number": 8801,
"precision": 0.8026315789473685,
"recall": 0.8247926372003181
},
"eval_QTY": {
"f1": 0.9874235930583853,
"number": 7088,
"precision": 0.9834849545136459,
"recall": 0.9913939051918735
},
"eval_RANGE_END": {
"f1": 0.7788461538461537,
"number": 91,
"precision": 0.6923076923076923,
"recall": 0.8901098901098901
},
"eval_UNIT": {
"f1": 0.9532153793807416,
"number": 5697,
"precision": 0.9247400561148704,
"recall": 0.9835000877654906
},
"eval_loss": 0.8807578682899475,
"eval_overall_accuracy": 0.8429172510518934,
"eval_overall_f1": 0.8681558902893056,
"eval_overall_precision": 0.8432419879238272,
"eval_overall_recall": 0.8945867943122624,
"eval_runtime": 10.211,
"eval_samples_per_second": 833.024,
"eval_steps_per_second": 26.05,
"step": 25000
},
{
"epoch": 5.0,
"step": 25255,
"total_flos": 3120524263271436.0,
"train_loss": 0.8656694423182368,
"train_runtime": 2424.3674,
"train_samples_per_second": 333.289,
"train_steps_per_second": 10.417
}
],
"logging_steps": 500,
"max_steps": 25255,
"num_train_epochs": 5,
"save_steps": 1000,
"total_flos": 3120524263271436.0,
"trial_name": null,
"trial_params": null
}