Theoreticallyhugo's picture
Training in progress, epoch 16, checkpoint
d22008d verified
raw
history blame
30.2 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 16.0,
"eval_steps": 500,
"global_step": 1296,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_B-Claim": {
"f1-score": 0.17153996101364524,
"precision": 0.25287356321839083,
"recall": 0.12979351032448377,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.08383233532934131,
"precision": 1.0,
"recall": 0.04375,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.8469620831429876,
"precision": 0.7427884615384616,
"recall": 0.9851222104144527,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.5420081967213116,
"precision": 0.6803858520900321,
"recall": 0.4504044274159217,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.8343351767251743,
"precision": 0.8141717503519474,
"recall": 0.8555226824457594,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.9004323458767015,
"precision": 0.8590809093131264,
"recall": 0.9459659511472983,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9988389078242631,
"precision": 0.9991008541885209,
"recall": 0.9985770987793006,
"support": 13353.0
},
"eval_accuracy": 0.8856789444749863,
"eval_loss": 0.28347474336624146,
"eval_macro avg": {
"f1-score": 0.6254212866619178,
"precision": 0.76405734152864,
"recall": 0.629876554361031,
"support": 36380.0
},
"eval_runtime": 5.0448,
"eval_samples_per_second": 16.056,
"eval_steps_per_second": 2.18,
"eval_weighted avg": {
"f1-score": 0.8748148382495958,
"precision": 0.8768575102351055,
"recall": 0.8856789444749863,
"support": 36380.0
},
"step": 81
},
{
"epoch": 2.0,
"eval_B-Claim": {
"f1-score": 0.5137931034482759,
"precision": 0.6182572614107884,
"recall": 0.43952802359882004,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.7622641509433963,
"precision": 0.9619047619047619,
"recall": 0.63125,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.8853910477127397,
"precision": 0.8241758241758241,
"recall": 0.9564293304994687,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.5413588470388762,
"precision": 0.6279853891542568,
"recall": 0.47573435504469985,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.7949260042283298,
"precision": 0.856492027334852,
"recall": 0.7416173570019724,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.9007064868336545,
"precision": 0.8614779777627618,
"recall": 0.9436780835744566,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9988389947942025,
"precision": 0.9990260713215463,
"recall": 0.9986519883172321,
"support": 13353.0
},
"eval_accuracy": 0.8864211105002748,
"eval_loss": 0.2809496521949768,
"eval_macro avg": {
"f1-score": 0.7710398049999251,
"precision": 0.8213313304378275,
"recall": 0.7409841625766643,
"support": 36380.0
},
"eval_runtime": 5.0579,
"eval_samples_per_second": 16.014,
"eval_steps_per_second": 2.175,
"eval_weighted avg": {
"f1-score": 0.8798131143596267,
"precision": 0.8787439244541853,
"recall": 0.8864211105002748,
"support": 36380.0
},
"step": 162
},
{
"epoch": 3.0,
"eval_B-Claim": {
"f1-score": 0.6401137980085349,
"precision": 0.6181318681318682,
"recall": 0.6637168141592921,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.7918781725888324,
"precision": 0.6666666666666666,
"recall": 0.975,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.8866442199775534,
"precision": 0.93935790725327,
"recall": 0.8395324123273114,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.6254390633315594,
"precision": 0.6255056418990845,
"recall": 0.6253724989357173,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.76480605487228,
"precision": 0.6205096714768191,
"recall": 0.9965483234714004,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.9049205625504156,
"precision": 0.9449897450922942,
"recall": 0.868111163447951,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9988758992805756,
"precision": 0.9995500562429697,
"recall": 0.9982026510896428,
"support": 13353.0
},
"eval_accuracy": 0.8894997251236944,
"eval_loss": 0.318760484457016,
"eval_macro avg": {
"f1-score": 0.8018111100871074,
"precision": 0.7735302223947104,
"recall": 0.852354837633045,
"support": 36380.0
},
"eval_runtime": 5.0862,
"eval_samples_per_second": 15.925,
"eval_steps_per_second": 2.163,
"eval_weighted avg": {
"f1-score": 0.8920666591013163,
"precision": 0.9012548868310761,
"recall": 0.8894997251236944,
"support": 36380.0
},
"step": 243
},
{
"epoch": 4.0,
"eval_B-Claim": {
"f1-score": 0.7034883720930232,
"precision": 0.6934097421203438,
"recall": 0.7138643067846607,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.8958990536277602,
"precision": 0.9044585987261147,
"recall": 0.8875,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.9051172707889126,
"precision": 0.9080213903743316,
"recall": 0.9022316684378321,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.6932699265998139,
"precision": 0.6739698492462312,
"recall": 0.7137079608343976,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.8904009720534629,
"precision": 0.877815045519885,
"recall": 0.903353057199211,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.9127480293558032,
"precision": 0.9218310342461052,
"recall": 0.9038422717179194,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9981619715668254,
"precision": 0.9999248459341651,
"recall": 0.9964053021792856,
"support": 13353.0
},
"eval_accuracy": 0.9113523914238593,
"eval_loss": 0.2517726719379425,
"eval_macro avg": {
"f1-score": 0.8570122280122289,
"precision": 0.8542043580238825,
"recall": 0.8601292238790438,
"support": 36380.0
},
"eval_runtime": 5.062,
"eval_samples_per_second": 16.002,
"eval_steps_per_second": 2.173,
"eval_weighted avg": {
"f1-score": 0.9122886837716081,
"precision": 0.9134709768686261,
"recall": 0.9113523914238593,
"support": 36380.0
},
"step": 324
},
{
"epoch": 5.0,
"eval_B-Claim": {
"f1-score": 0.6590538336052201,
"precision": 0.7372262773722628,
"recall": 0.5958702064896755,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.9078947368421054,
"precision": 0.9583333333333334,
"recall": 0.8625,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.9066802651708312,
"precision": 0.8715686274509804,
"recall": 0.944739638682253,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.6513589503280225,
"precision": 0.7243355914538823,
"recall": 0.5917411664538101,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.8981975120588981,
"precision": 0.9256933542647828,
"recall": 0.8722879684418146,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.9158848058378942,
"precision": 0.8877170824123777,
"recall": 0.9458986609245676,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9994384336041331,
"precision": 0.9992513849378649,
"recall": 0.9996255523103422,
"support": 13353.0
},
"eval_accuracy": 0.9121220450797142,
"eval_loss": 0.2739432156085968,
"eval_macro avg": {
"f1-score": 0.8483583624924435,
"precision": 0.8720179501750691,
"recall": 0.8303804561860663,
"support": 36380.0
},
"eval_runtime": 5.0932,
"eval_samples_per_second": 15.904,
"eval_steps_per_second": 2.16,
"eval_weighted avg": {
"f1-score": 0.9087400479269403,
"precision": 0.9081638580455985,
"recall": 0.9121220450797142,
"support": 36380.0
},
"step": 405
},
{
"epoch": 6.0,
"eval_B-Claim": {
"f1-score": 0.6675461741424802,
"precision": 0.60381861575179,
"recall": 0.7463126843657817,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.887608069164265,
"precision": 0.8235294117647058,
"recall": 0.9625,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.8737316798196167,
"precision": 0.9303721488595438,
"recall": 0.8235919234856536,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.6529236868186323,
"precision": 0.6109050445103857,
"recall": 0.7011494252873564,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.8689320388349515,
"precision": 0.7863418530351438,
"recall": 0.9709072978303748,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.8937734066010992,
"precision": 0.9312910284463894,
"recall": 0.8591615638247763,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9988009592326139,
"precision": 0.9994750656167979,
"recall": 0.9981277615517112,
"support": 13353.0
},
"eval_accuracy": 0.8944749862561847,
"eval_loss": 0.37784042954444885,
"eval_macro avg": {
"f1-score": 0.8347594306590942,
"precision": 0.8122475954263937,
"recall": 0.8659643794779507,
"support": 36380.0
},
"eval_runtime": 5.0734,
"eval_samples_per_second": 15.966,
"eval_steps_per_second": 2.168,
"eval_weighted avg": {
"f1-score": 0.8971820344797716,
"precision": 0.9033144340485707,
"recall": 0.8944749862561847,
"support": 36380.0
},
"step": 486
},
{
"epoch": 6.17,
"grad_norm": 21.778270721435547,
"learning_rate": 1.7530864197530865e-05,
"loss": 0.2481,
"step": 500
},
{
"epoch": 7.0,
"eval_B-Claim": {
"f1-score": 0.6489859594383774,
"precision": 0.6887417218543046,
"recall": 0.6135693215339233,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.8852459016393444,
"precision": 0.9310344827586207,
"recall": 0.84375,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.9011898603207449,
"precision": 0.8780241935483871,
"recall": 0.9256110520722636,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.626564114338193,
"precision": 0.6800398704211313,
"recall": 0.5808854831843338,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.8813559322033898,
"precision": 0.9049350649350649,
"recall": 0.8589743589743589,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.9073595340161655,
"precision": 0.8831698305516626,
"recall": 0.9329116479375547,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9981994148098132,
"precision": 1.0,
"recall": 0.9964053021792856,
"support": 13353.0
},
"eval_accuracy": 0.9030786146234194,
"eval_loss": 0.4109443426132202,
"eval_macro avg": {
"f1-score": 0.8355572452522898,
"precision": 0.8522778805813102,
"recall": 0.8217295951259599,
"support": 36380.0
},
"eval_runtime": 5.0454,
"eval_samples_per_second": 16.054,
"eval_steps_per_second": 2.18,
"eval_weighted avg": {
"f1-score": 0.9003265559019435,
"precision": 0.8992988510674564,
"recall": 0.9030786146234194,
"support": 36380.0
},
"step": 567
},
{
"epoch": 8.0,
"eval_B-Claim": {
"f1-score": 0.7029972752043596,
"precision": 0.6531645569620254,
"recall": 0.7610619469026548,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.9134328358208955,
"precision": 0.8742857142857143,
"recall": 0.95625,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.8914728682170544,
"precision": 0.930635838150289,
"recall": 0.8554729011689692,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.6790487421383647,
"precision": 0.6307046367287331,
"recall": 0.7354193273733504,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.8939393939393939,
"precision": 0.836340206185567,
"recall": 0.9600591715976331,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.8993180625983564,
"precision": 0.9362166885102665,
"recall": 0.8652176838705337,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9979819119515658,
"precision": 0.9960462513987318,
"recall": 0.9999251104620684,
"support": 13353.0
},
"eval_accuracy": 0.902363936228697,
"eval_loss": 0.4763801097869873,
"eval_macro avg": {
"f1-score": 0.8540272985528559,
"precision": 0.8367705560316182,
"recall": 0.8762008773393156,
"support": 36380.0
},
"eval_runtime": 5.0791,
"eval_samples_per_second": 15.948,
"eval_steps_per_second": 2.166,
"eval_weighted avg": {
"f1-score": 0.9048169208096876,
"precision": 0.9101018951943243,
"recall": 0.902363936228697,
"support": 36380.0
},
"step": 648
},
{
"epoch": 9.0,
"eval_B-Claim": {
"f1-score": 0.6884779516358464,
"precision": 0.6648351648351648,
"recall": 0.7138643067846607,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.8860759493670887,
"precision": 0.8974358974358975,
"recall": 0.875,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.8984416980118215,
"precision": 0.908695652173913,
"recall": 0.8884165781083954,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.6685829873309911,
"precision": 0.6687965921192758,
"recall": 0.6683695189442316,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.8819011041766683,
"precision": 0.8592142188961647,
"recall": 0.9058185404339251,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.9072658065820057,
"precision": 0.9083367057871308,
"recall": 0.9061974295134917,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9971465044679734,
"precision": 0.9998494089300505,
"recall": 0.9944581741930653,
"support": 13353.0
},
"eval_accuracy": 0.9054700384826828,
"eval_loss": 0.43875375390052795,
"eval_macro avg": {
"f1-score": 0.8468417145103421,
"precision": 0.843880520025371,
"recall": 0.8503035068539672,
"support": 36380.0
},
"eval_runtime": 5.0863,
"eval_samples_per_second": 15.925,
"eval_steps_per_second": 2.163,
"eval_weighted avg": {
"f1-score": 0.9056589487317133,
"precision": 0.9059462683069767,
"recall": 0.9054700384826828,
"support": 36380.0
},
"step": 729
},
{
"epoch": 10.0,
"eval_B-Claim": {
"f1-score": 0.6910569105691057,
"precision": 0.6390977443609023,
"recall": 0.7522123893805309,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.9046153846153846,
"precision": 0.8909090909090909,
"recall": 0.91875,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.8888888888888888,
"precision": 0.9213226909920182,
"recall": 0.8586609989373007,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.6645316253002403,
"precision": 0.6271250472232717,
"recall": 0.7066836951894423,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.886980737990253,
"precision": 0.8377904427882508,
"recall": 0.9423076923076923,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.8983343700324833,
"precision": 0.9233501456276195,
"recall": 0.8746383150528229,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9975225225225225,
"precision": 1.0,
"recall": 0.9950572904965176,
"support": 13353.0
},
"eval_accuracy": 0.8995601979109401,
"eval_loss": 0.5381875038146973,
"eval_macro avg": {
"f1-score": 0.8474186342741253,
"precision": 0.8342278802715933,
"recall": 0.8640443401949011,
"support": 36380.0
},
"eval_runtime": 5.099,
"eval_samples_per_second": 15.885,
"eval_steps_per_second": 2.157,
"eval_weighted avg": {
"f1-score": 0.9017669881051834,
"precision": 0.9056169116577473,
"recall": 0.8995601979109401,
"support": 36380.0
},
"step": 810
},
{
"epoch": 11.0,
"eval_B-Claim": {
"f1-score": 0.7103825136612023,
"precision": 0.6615776081424937,
"recall": 0.7669616519174042,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.9032258064516129,
"precision": 0.850828729281768,
"recall": 0.9625,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.8955223880597015,
"precision": 0.9331797235023042,
"recall": 0.8607863974495218,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.685932169375878,
"precision": 0.6488230827638573,
"recall": 0.7275436355896125,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.8921899617375647,
"precision": 0.820703933747412,
"recall": 0.9773175542406312,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.9036754507628294,
"precision": 0.932183990271121,
"recall": 0.8768588924029338,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9971084156370874,
"precision": 1.0,
"recall": 0.9942335055792706,
"support": 13353.0
},
"eval_accuracy": 0.9051951621770203,
"eval_loss": 0.5869538187980652,
"eval_macro avg": {
"f1-score": 0.8554338150979823,
"precision": 0.8353281525298509,
"recall": 0.880885948168482,
"support": 36380.0
},
"eval_runtime": 5.0923,
"eval_samples_per_second": 15.906,
"eval_steps_per_second": 2.16,
"eval_weighted avg": {
"f1-score": 0.9071963301332511,
"precision": 0.9114149044954519,
"recall": 0.9051951621770203,
"support": 36380.0
},
"step": 891
},
{
"epoch": 12.0,
"eval_B-Claim": {
"f1-score": 0.6758409785932722,
"precision": 0.7015873015873015,
"recall": 0.6519174041297935,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.916923076923077,
"precision": 0.9030303030303031,
"recall": 0.93125,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.8989473684210527,
"precision": 0.8905109489051095,
"recall": 0.9075451647183846,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.6533197602081212,
"precision": 0.6970794110547912,
"recall": 0.6147296722009365,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.9200480192076831,
"precision": 0.8965839962564343,
"recall": 0.9447731755424064,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.9082653940478558,
"precision": 0.8948605759811924,
"recall": 0.922077922077922,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9988389947942025,
"precision": 0.9990260713215463,
"recall": 0.9986519883172321,
"support": 13353.0
},
"eval_accuracy": 0.9089059923034635,
"eval_loss": 0.5580677390098572,
"eval_macro avg": {
"f1-score": 0.8531690845993235,
"precision": 0.854668372590954,
"recall": 0.852992189569525,
"support": 36380.0
},
"eval_runtime": 5.0574,
"eval_samples_per_second": 16.016,
"eval_steps_per_second": 2.175,
"eval_weighted avg": {
"f1-score": 0.9068749310769137,
"precision": 0.9057713940131727,
"recall": 0.9089059923034635,
"support": 36380.0
},
"step": 972
},
{
"epoch": 12.35,
"grad_norm": 0.45772114396095276,
"learning_rate": 1.506172839506173e-05,
"loss": 0.0314,
"step": 1000
},
{
"epoch": 13.0,
"eval_B-Claim": {
"f1-score": 0.6760563380281691,
"precision": 0.72,
"recall": 0.6371681415929203,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.9171974522292993,
"precision": 0.935064935064935,
"recall": 0.9,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.905503634475597,
"precision": 0.8852791878172589,
"recall": 0.926673751328374,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.6522588803310726,
"precision": 0.7090727318170458,
"recall": 0.6038739889314602,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.9228121927236971,
"precision": 0.9200980392156862,
"recall": 0.9255424063116371,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.9102441910145594,
"precision": 0.8896312475909033,
"recall": 0.9318350043738645,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9992880428673137,
"precision": 1.0,
"recall": 0.9985770987793006,
"support": 13353.0
},
"eval_accuracy": 0.9106102253985706,
"eval_loss": 0.5264647603034973,
"eval_macro avg": {
"f1-score": 0.8547658188099584,
"precision": 0.8655923059294041,
"recall": 0.8462386273310795,
"support": 36380.0
},
"eval_runtime": 5.0562,
"eval_samples_per_second": 16.02,
"eval_steps_per_second": 2.176,
"eval_weighted avg": {
"f1-score": 0.9080379636257123,
"precision": 0.9070294280758862,
"recall": 0.9106102253985706,
"support": 36380.0
},
"step": 1053
},
{
"epoch": 14.0,
"eval_B-Claim": {
"f1-score": 0.6980609418282548,
"precision": 0.6579634464751958,
"recall": 0.7433628318584071,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.9226006191950465,
"precision": 0.9141104294478528,
"recall": 0.93125,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.8921568627450981,
"precision": 0.9150837988826815,
"recall": 0.8703506907545164,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.6821321785751109,
"precision": 0.6614677064587082,
"recall": 0.7041294167730949,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.9124910093502757,
"precision": 0.8880074661689221,
"recall": 0.9383629191321499,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.9052323204796293,
"precision": 0.9166609175577786,
"recall": 0.894085189421977,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9980114808839531,
"precision": 1.0,
"recall": 0.9960308544896278,
"support": 13353.0
},
"eval_accuracy": 0.9075865860362837,
"eval_loss": 0.6585939526557922,
"eval_macro avg": {
"f1-score": 0.8586693447224812,
"precision": 0.850470537855877,
"recall": 0.8682245574899676,
"support": 36380.0
},
"eval_runtime": 5.0606,
"eval_samples_per_second": 16.006,
"eval_steps_per_second": 2.174,
"eval_weighted avg": {
"f1-score": 0.9086880683615599,
"precision": 0.9102351141829325,
"recall": 0.9075865860362837,
"support": 36380.0
},
"step": 1134
},
{
"epoch": 15.0,
"eval_B-Claim": {
"f1-score": 0.6920731707317073,
"precision": 0.7160883280757098,
"recall": 0.6696165191740413,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.90282131661442,
"precision": 0.9056603773584906,
"recall": 0.9,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.9076600209863588,
"precision": 0.8963730569948186,
"recall": 0.9192348565356004,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.6644877718922575,
"precision": 0.7061077844311378,
"recall": 0.6275010642826735,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.9016511127063891,
"precision": 0.8758716875871687,
"recall": 0.9289940828402367,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.9134082844161443,
"precision": 0.9005362280931206,
"recall": 0.9266536572236054,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9987253505286046,
"precision": 0.9999249305607687,
"recall": 0.9975286452482588,
"support": 13353.0
},
"eval_accuracy": 0.9114623419461243,
"eval_loss": 0.6387954950332642,
"eval_macro avg": {
"f1-score": 0.854403861125126,
"precision": 0.8572231990144593,
"recall": 0.8527898321863451,
"support": 36380.0
},
"eval_runtime": 5.0835,
"eval_samples_per_second": 15.934,
"eval_steps_per_second": 2.164,
"eval_weighted avg": {
"f1-score": 0.9096653222792656,
"precision": 0.9087293921765042,
"recall": 0.9114623419461243,
"support": 36380.0
},
"step": 1215
},
{
"epoch": 16.0,
"eval_B-Claim": {
"f1-score": 0.6602254428341385,
"precision": 0.7269503546099291,
"recall": 0.6047197640117994,
"support": 339.0
},
"eval_B-MajorClaim": {
"f1-score": 0.8903225806451613,
"precision": 0.92,
"recall": 0.8625,
"support": 160.0
},
"eval_B-Premise": {
"f1-score": 0.9055441478439425,
"precision": 0.8758689175769613,
"recall": 0.9373007438894793,
"support": 941.0
},
"eval_I-Claim": {
"f1-score": 0.6361776387050188,
"precision": 0.7319302132373304,
"recall": 0.5625798212005109,
"support": 4698.0
},
"eval_I-MajorClaim": {
"f1-score": 0.9097614949594295,
"precision": 0.9073075036782736,
"recall": 0.9122287968441815,
"support": 2028.0
},
"eval_I-Premise": {
"f1-score": 0.9127908863717504,
"precision": 0.8816300940438871,
"recall": 0.9462351120382209,
"support": 14861.0
},
"eval_O": {
"f1-score": 0.9993256911665542,
"precision": 0.9997751293006522,
"recall": 0.9988766569310268,
"support": 13353.0
},
"eval_accuracy": 0.9103353490929081,
"eval_loss": 0.6975058317184448,
"eval_macro avg": {
"f1-score": 0.844878268932285,
"precision": 0.8633517446352906,
"recall": 0.8320629849878884,
"support": 36380.0
},
"eval_runtime": 5.0731,
"eval_samples_per_second": 15.967,
"eval_steps_per_second": 2.168,
"eval_weighted avg": {
"f1-score": 0.9060232340867683,
"precision": 0.9056723119856793,
"recall": 0.9103353490929081,
"support": 36380.0
},
"step": 1296
}
],
"logging_steps": 500,
"max_steps": 4050,
"num_input_tokens_seen": 0,
"num_train_epochs": 50,
"save_steps": 500,
"total_flos": 2293508118384000.0,
"train_batch_size": 4,
"trial_name": null,
"trial_params": null
}