{ "best_metric": 0.276384562253952, "best_model_checkpoint": "longformer-sep_tok_full_labels/checkpoint-324", "epoch": 16.0, "eval_steps": 500, "global_step": 1296, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_B-Claim": { "f1-score": 0.21800947867298578, "precision": 0.3333333333333333, "recall": 0.1619718309859155, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8305489260143198, "precision": 0.71900826446281, "recall": 0.9830508474576272, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.5590492696211935, "precision": 0.5643589102724319, "recall": 0.5538386068187393, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.7399038461538461, "precision": 0.7205056179775281, "recall": 0.7603754940711462, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.8867229093291834, "precision": 0.8883965205974068, "recall": 0.8850555918901243, "support": 12232.0 }, "eval_O": { "f1-score": 0.9976548035383666, "precision": 0.9961383616794018, "recall": 0.9991758694577221, "support": 12134.0 }, "eval_accuracy": 0.8699050632911393, "eval_loss": 0.32671716809272766, "eval_macro avg": { "f1-score": 0.6045556047614136, "precision": 0.6031058583318446, "recall": 0.6204954629544678, "support": 31600.0 }, "eval_runtime": 6.234, "eval_samples_per_second": 12.833, "eval_steps_per_second": 1.604, "eval_weighted avg": { "f1-score": 0.8664142595402331, "precision": 0.8644597558999653, "recall": 0.8699050632911393, "support": 31600.0 }, "step": 81 }, { "epoch": 2.0, "eval_B-Claim": { "f1-score": 0.5352697095435685, "precision": 0.6515151515151515, "recall": 0.45422535211267606, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.7766990291262136, "precision": 0.7142857142857143, "recall": 0.851063829787234, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8802721088435375, "precision": 0.8490813648293963, "recall": 0.9138418079096046, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.5747557221255521, "precision": 0.6325869180907484, "recall": 0.5266127054206524, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.7833260963960051, "precision": 0.6986831913245546, "recall": 0.8913043478260869, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.8995515695067264, "precision": 0.8971377459749553, "recall": 0.9019784172661871, "support": 12232.0 }, "eval_O": { "f1-score": 0.9971231300345225, "precision": 0.9945072962780783, "recall": 0.9997527608373167, "support": 12134.0 }, "eval_accuracy": 0.8864240506329114, "eval_loss": 0.28716403245925903, "eval_macro avg": { "f1-score": 0.7781424807965893, "precision": 0.7768281974712284, "recall": 0.791254174451394, "support": 31600.0 }, "eval_runtime": 6.2816, "eval_samples_per_second": 12.736, "eval_steps_per_second": 1.592, "eval_weighted avg": { "f1-score": 0.8834146129726252, "precision": 0.8835831101628018, "recall": 0.8864240506329114, "support": 31600.0 }, "step": 162 }, { "epoch": 3.0, "eval_B-Claim": { "f1-score": 0.5580448065173116, "precision": 0.6618357487922706, "recall": 0.4823943661971831, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.8046875, "precision": 0.8956521739130435, "recall": 0.7304964539007093, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8868421052631579, "precision": 0.8300492610837439, "recall": 0.9519774011299436, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.5488426262920367, "precision": 0.6751432664756447, "recall": 0.4623497669855286, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.8110936682365254, "precision": 0.8620689655172413, "recall": 0.7658102766798419, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.9039491427470623, "precision": 0.854842235662756, "recall": 0.9590418574231524, "support": 12232.0 }, "eval_O": { "f1-score": 0.9979824597521307, "precision": 0.9972023368715544, "recall": 0.9987638041865832, "support": 12134.0 }, "eval_accuracy": 0.892373417721519, "eval_loss": 0.28271517157554626, "eval_macro avg": { "f1-score": 0.7873489012583177, "precision": 0.825256284045179, "recall": 0.7644048466432775, "support": 31600.0 }, "eval_runtime": 6.2071, "eval_samples_per_second": 12.888, "eval_steps_per_second": 1.611, "eval_weighted avg": { "f1-score": 0.88435885840807, "precision": 0.8846770016417851, "recall": 0.892373417721519, "support": 31600.0 }, "step": 243 }, { "epoch": 4.0, "eval_B-Claim": { "f1-score": 0.659016393442623, "precision": 0.6165644171779141, "recall": 0.7077464788732394, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.8675496688741722, "precision": 0.8136645962732919, "recall": 0.9290780141843972, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8698224852071005, "precision": 0.9130434782608695, "recall": 0.8305084745762712, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.6472172351885099, "precision": 0.5964839710444674, "recall": 0.70738287956831, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.8549332083430982, "precision": 0.8131966116807846, "recall": 0.9011857707509882, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.8876102800153433, "precision": 0.9271658801531475, "recall": 0.8512916939175932, "support": 12232.0 }, "eval_O": { "f1-score": 0.9981065283609122, "precision": 0.9970394736842105, "recall": 0.9991758694577221, "support": 12134.0 }, "eval_accuracy": 0.8912974683544304, "eval_loss": 0.276384562253952, "eval_macro avg": { "f1-score": 0.8263222570616798, "precision": 0.8110226326106693, "recall": 0.8466241687612174, "support": 31600.0 }, "eval_runtime": 6.2529, "eval_samples_per_second": 12.794, "eval_steps_per_second": 1.599, "eval_weighted avg": { "f1-score": 0.8943886873545748, "precision": 0.9004180663566287, "recall": 0.8912974683544304, "support": 31600.0 }, "step": 324 }, { "epoch": 5.0, "eval_B-Claim": { "f1-score": 0.665474060822898, "precision": 0.6763636363636364, "recall": 0.6549295774647887, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.8896551724137931, "precision": 0.8657718120805369, "recall": 0.9148936170212766, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8843441466854725, "precision": 0.8830985915492958, "recall": 0.885593220338983, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.6698067632850242, "precision": 0.6597668332143707, "recall": 0.6801569781702232, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.8809815950920246, "precision": 0.8751828376401756, "recall": 0.8868577075098815, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.9024631353488756, "precision": 0.9094305163539764, "recall": 0.8956017004578156, "support": 12232.0 }, "eval_O": { "f1-score": 0.9980246913580246, "precision": 0.9967121486108828, "recall": 0.9993406955661777, "support": 12134.0 }, "eval_accuracy": 0.9047784810126582, "eval_loss": 0.2893199920654297, "eval_macro avg": { "f1-score": 0.8415356521437304, "precision": 0.838046625116125, "recall": 0.8453390709327352, "support": 31600.0 }, "eval_runtime": 6.2466, "eval_samples_per_second": 12.807, "eval_steps_per_second": 1.601, "eval_weighted avg": { "f1-score": 0.9051715590931133, "precision": 0.9056611908459661, "recall": 0.9047784810126582, "support": 31600.0 }, "step": 405 }, { "epoch": 6.0, "eval_B-Claim": { "f1-score": 0.6263345195729537, "precision": 0.6330935251798561, "recall": 0.6197183098591549, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.8372093023255814, "precision": 0.9230769230769231, "recall": 0.7659574468085106, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8784530386740332, "precision": 0.8594594594594595, "recall": 0.8983050847457628, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.6109127995920448, "precision": 0.6360499070878683, "recall": 0.5876870247731175, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.8409272581934453, "precision": 0.9126662810873337, "recall": 0.7796442687747036, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.8964938902643559, "precision": 0.8762685402029664, "recall": 0.9176749509483323, "support": 12232.0 }, "eval_O": { "f1-score": 0.9987239122380934, "precision": 0.9976971790443293, "recall": 0.9997527608373167, "support": 12134.0 }, "eval_accuracy": 0.8939873417721519, "eval_loss": 0.33532533049583435, "eval_macro avg": { "f1-score": 0.8127221029800725, "precision": 0.8340445450198194, "recall": 0.7955342638209855, "support": 31600.0 }, "eval_runtime": 6.2278, "eval_samples_per_second": 12.846, "eval_steps_per_second": 1.606, "eval_weighted avg": { "f1-score": 0.8922477132246446, "precision": 0.891880888702747, "recall": 0.8939873417721519, "support": 31600.0 }, "step": 486 }, { "epoch": 6.17, "grad_norm": 4.557807445526123, "learning_rate": 1.3827160493827162e-05, "loss": 0.2608, "step": 500 }, { "epoch": 7.0, "eval_B-Claim": { "f1-score": 0.5553235908141962, "precision": 0.6820512820512821, "recall": 0.46830985915492956, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.8412698412698413, "precision": 0.954954954954955, "recall": 0.75177304964539, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8846905537459283, "precision": 0.8210399032648126, "recall": 0.9590395480225988, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.5484584747012834, "precision": 0.6880088823094005, "recall": 0.45597252882021094, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.8530857454942655, "precision": 0.9536019536019537, "recall": 0.7717391304347826, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.900171657448026, "precision": 0.8438103411285132, "recall": 0.9646010464355788, "support": 12232.0 }, "eval_O": { "f1-score": 0.9986819342614713, "precision": 0.9982707509881423, "recall": 0.9990934564034943, "support": 12134.0 }, "eval_accuracy": 0.8943354430379746, "eval_loss": 0.45137375593185425, "eval_macro avg": { "f1-score": 0.7973831139621446, "precision": 0.8488197240427228, "recall": 0.7672183741309979, "support": 31600.0 }, "eval_runtime": 6.1951, "eval_samples_per_second": 12.913, "eval_steps_per_second": 1.614, "eval_weighted avg": { "f1-score": 0.8858958517067363, "precision": 0.8885840321741321, "recall": 0.8943354430379746, "support": 31600.0 }, "step": 567 }, { "epoch": 8.0, "eval_B-Claim": { "f1-score": 0.6642599277978338, "precision": 0.6814814814814815, "recall": 0.647887323943662, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.9015151515151516, "precision": 0.967479674796748, "recall": 0.8439716312056738, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8873531444367657, "precision": 0.8687415426251691, "recall": 0.9067796610169492, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.6521516393442622, "precision": 0.6823907799517556, "recall": 0.6244787834191807, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.8962213943587014, "precision": 0.9711649365628604, "recall": 0.8320158102766798, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.9046460618145563, "precision": 0.8831269952503309, "recall": 0.9272400261608895, "support": 12232.0 }, "eval_O": { "f1-score": 0.9979418786531653, "precision": 0.996875, "recall": 0.9990110433492665, "support": 12134.0 }, "eval_accuracy": 0.9062974683544304, "eval_loss": 0.40965867042541504, "eval_macro avg": { "f1-score": 0.8434413139886338, "precision": 0.8644657729526208, "recall": 0.8259120399103289, "support": 31600.0 }, "eval_runtime": 6.2033, "eval_samples_per_second": 12.896, "eval_steps_per_second": 1.612, "eval_weighted avg": { "f1-score": 0.9047924430886448, "precision": 0.9047867115327305, "recall": 0.9062974683544304, "support": 31600.0 }, "step": 648 }, { "epoch": 9.0, "eval_B-Claim": { "f1-score": 0.6900175131348512, "precision": 0.686411149825784, "recall": 0.6936619718309859, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.9064748201438848, "precision": 0.9197080291970803, "recall": 0.8936170212765957, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8892025405786873, "precision": 0.8885754583921015, "recall": 0.8898305084745762, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.6670815183571872, "precision": 0.6771096513390601, "recall": 0.657346087809664, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.8905813658288906, "precision": 0.9159268929503916, "recall": 0.866600790513834, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.9051692681937971, "precision": 0.8978524893428779, "recall": 0.9126062786134729, "support": 12232.0 }, "eval_O": { "f1-score": 0.9987240172875077, "precision": 0.9976153276868679, "recall": 0.9998351738915444, "support": 12134.0 }, "eval_accuracy": 0.9076582278481012, "eval_loss": 0.44169458746910095, "eval_macro avg": { "f1-score": 0.849607291932115, "precision": 0.8547427141048803, "recall": 0.8447854046300962, "support": 31600.0 }, "eval_runtime": 6.2166, "eval_samples_per_second": 12.869, "eval_steps_per_second": 1.609, "eval_weighted avg": { "f1-score": 0.9071553503542205, "precision": 0.9068271879381139, "recall": 0.9076582278481012, "support": 31600.0 }, "step": 729 }, { "epoch": 10.0, "eval_B-Claim": { "f1-score": 0.6761565836298933, "precision": 0.6834532374100719, "recall": 0.6690140845070423, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.8872727272727273, "precision": 0.9104477611940298, "recall": 0.8652482269503546, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8901329601119664, "precision": 0.8821081830790569, "recall": 0.8983050847457628, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.6512742871561948, "precision": 0.6705637828007275, "recall": 0.6330635271032622, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.8682926829268293, "precision": 0.9037947621592731, "recall": 0.8354743083003953, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.905623866156017, "precision": 0.8933428775948461, "recall": 0.9182472204054938, "support": 12232.0 }, "eval_O": { "f1-score": 0.9981898963304262, "precision": 0.9965500246426812, "recall": 0.9998351738915444, "support": 12134.0 }, "eval_accuracy": 0.9045569620253164, "eval_loss": 0.45926380157470703, "eval_macro avg": { "f1-score": 0.8395632862262934, "precision": 0.8486086612686695, "recall": 0.8313125179862652, "support": 31600.0 }, "eval_runtime": 6.2031, "eval_samples_per_second": 12.897, "eval_steps_per_second": 1.612, "eval_weighted avg": { "f1-score": 0.9034697801243392, "precision": 0.9028380907030437, "recall": 0.9045569620253164, "support": 31600.0 }, "step": 810 }, { "epoch": 11.0, "eval_B-Claim": { "f1-score": 0.6407766990291263, "precision": 0.7142857142857143, "recall": 0.5809859154929577, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.9032258064516129, "precision": 0.9130434782608695, "recall": 0.8936170212765957, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8872282608695653, "precision": 0.8547120418848168, "recall": 0.922316384180791, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.5974395448079659, "precision": 0.7111412123264477, "recall": 0.515084621044886, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.8862901219208758, "precision": 0.8927318295739348, "recall": 0.8799407114624506, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.9007579901539423, "precision": 0.862670258943272, "recall": 0.9423642903858731, "support": 12232.0 }, "eval_O": { "f1-score": 0.9989708122349842, "precision": 0.9980258287406433, "recall": 0.9999175869457723, "support": 12134.0 }, "eval_accuracy": 0.9014240506329114, "eval_loss": 0.5345993638038635, "eval_macro avg": { "f1-score": 0.8306698907811532, "precision": 0.8495157662879569, "recall": 0.8191752186841895, "support": 31600.0 }, "eval_runtime": 6.2101, "eval_samples_per_second": 12.882, "eval_steps_per_second": 1.61, "eval_weighted avg": { "f1-score": 0.8957812921551218, "precision": 0.8957333024681017, "recall": 0.9014240506329114, "support": 31600.0 }, "step": 891 }, { "epoch": 12.0, "eval_B-Claim": { "f1-score": 0.6859083191850596, "precision": 0.6622950819672131, "recall": 0.7112676056338029, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.8921933085501859, "precision": 0.9375, "recall": 0.851063829787234, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8863636363636365, "precision": 0.8914285714285715, "recall": 0.8813559322033898, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.6563715953307394, "precision": 0.6508319266939957, "recall": 0.6620063772381654, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.8721605916534602, "precision": 0.9370034052213394, "recall": 0.8157114624505929, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.9015022330491272, "precision": 0.8954670108081949, "recall": 0.907619359058208, "support": 12232.0 }, "eval_O": { "f1-score": 0.9988474520457726, "precision": 0.9977796052631579, "recall": 0.9999175869457723, "support": 12134.0 }, "eval_accuracy": 0.902879746835443, "eval_loss": 0.6067038774490356, "eval_macro avg": { "f1-score": 0.8419067337397116, "precision": 0.8531865144832105, "recall": 0.8327060219024521, "support": 31600.0 }, "eval_runtime": 6.2295, "eval_samples_per_second": 12.842, "eval_steps_per_second": 1.605, "eval_weighted avg": { "f1-score": 0.9030573735174033, "precision": 0.9038530884689406, "recall": 0.902879746835443, "support": 31600.0 }, "step": 972 }, { "epoch": 12.35, "grad_norm": 0.581019937992096, "learning_rate": 7.654320987654322e-06, "loss": 0.0322, "step": 1000 }, { "epoch": 13.0, "eval_B-Claim": { "f1-score": 0.6728624535315986, "precision": 0.7125984251968503, "recall": 0.6373239436619719, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.9154929577464789, "precision": 0.9090909090909091, "recall": 0.9219858156028369, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8905817174515235, "precision": 0.873641304347826, "recall": 0.9081920903954802, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.6460571129159025, "precision": 0.6932808546527973, "recall": 0.6048565121412803, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.9011916583912611, "precision": 0.905688622754491, "recall": 0.8967391304347826, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.9046914370275567, "precision": 0.8856001879257693, "recall": 0.9246239372138653, "support": 12232.0 }, "eval_O": { "f1-score": 0.9991346985866744, "precision": 0.9990935311083642, "recall": 0.9991758694577221, "support": 12134.0 }, "eval_accuracy": 0.907246835443038, "eval_loss": 0.5913504362106323, "eval_macro avg": { "f1-score": 0.8471445765215709, "precision": 0.8541419764395725, "recall": 0.8418424712725627, "support": 31600.0 }, "eval_runtime": 6.2496, "eval_samples_per_second": 12.801, "eval_steps_per_second": 1.6, "eval_weighted avg": { "f1-score": 0.9050120935479347, "precision": 0.9039360771033997, "recall": 0.907246835443038, "support": 31600.0 }, "step": 1053 }, { "epoch": 14.0, "eval_B-Claim": { "f1-score": 0.6717267552182163, "precision": 0.7283950617283951, "recall": 0.6232394366197183, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.9175627240143368, "precision": 0.927536231884058, "recall": 0.9078014184397163, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8917808219178082, "precision": 0.8656914893617021, "recall": 0.9194915254237288, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.6362775598539159, "precision": 0.7092882991556092, "recall": 0.5768947755702722, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.8989160574741618, "precision": 0.9176531137416366, "recall": 0.8809288537549407, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.9050800553469064, "precision": 0.8762918165811835, "recall": 0.9358240680183126, "support": 12232.0 }, "eval_O": { "f1-score": 0.9993821821327072, "precision": 0.9989296006587073, "recall": 0.9998351738915444, "support": 12134.0 }, "eval_accuracy": 0.9072784810126582, "eval_loss": 0.6610221862792969, "eval_macro avg": { "f1-score": 0.8458180222797218, "precision": 0.8605408018730417, "recall": 0.8348593216740333, "support": 31600.0 }, "eval_runtime": 6.2362, "eval_samples_per_second": 12.828, "eval_steps_per_second": 1.604, "eval_weighted avg": { "f1-score": 0.9038759465613782, "precision": 0.9031477200436355, "recall": 0.9072784810126582, "support": 31600.0 }, "step": 1134 }, { "epoch": 15.0, "eval_B-Claim": { "f1-score": 0.70223752151463, "precision": 0.6868686868686869, "recall": 0.7183098591549296, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.9064748201438848, "precision": 0.9197080291970803, "recall": 0.8936170212765957, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8898365316275765, "precision": 0.8955650929899857, "recall": 0.884180790960452, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.6806321205439176, "precision": 0.6798825256975036, "recall": 0.681383370125092, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.9012658227848102, "precision": 0.9241952232606438, "recall": 0.8794466403162056, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.906661234467305, "precision": 0.9036790384146837, "recall": 0.9096631785480707, "support": 12232.0 }, "eval_O": { "f1-score": 0.9995056846267919, "precision": 0.9991764124526438, "recall": 0.9998351738915444, "support": 12134.0 }, "eval_accuracy": 0.9105379746835442, "eval_loss": 0.6556717157363892, "eval_macro avg": { "f1-score": 0.8552305336727023, "precision": 0.8584392869830325, "recall": 0.8523480048961273, "support": 31600.0 }, "eval_runtime": 6.2042, "eval_samples_per_second": 12.894, "eval_steps_per_second": 1.612, "eval_weighted avg": { "f1-score": 0.9105896850690615, "precision": 0.910730075973464, "recall": 0.9105379746835442, "support": 31600.0 }, "step": 1215 }, { "epoch": 16.0, "eval_B-Claim": { "f1-score": 0.6605504587155964, "precision": 0.6896551724137931, "recall": 0.6338028169014085, "support": 284.0 }, "eval_B-MajorClaim": { "f1-score": 0.8996282527881041, "precision": 0.9453125, "recall": 0.8581560283687943, "support": 141.0 }, "eval_B-Premise": { "f1-score": 0.8884297520661157, "precision": 0.8669354838709677, "recall": 0.9110169491525424, "support": 708.0 }, "eval_I-Claim": { "f1-score": 0.6305857685755472, "precision": 0.6769836803601575, "recall": 0.5901398086828551, "support": 4077.0 }, "eval_I-MajorClaim": { "f1-score": 0.8995610637748515, "precision": 0.9421308815575987, "recall": 0.8606719367588933, "support": 2024.0 }, "eval_I-Premise": { "f1-score": 0.9012483104078874, "precision": 0.8771861940876026, "recall": 0.9266677567037279, "support": 12232.0 }, "eval_O": { "f1-score": 0.9995056846267919, "precision": 0.9991764124526438, "recall": 0.9998351738915444, "support": 12134.0 }, "eval_accuracy": 0.9038291139240506, "eval_loss": 0.6791273951530457, "eval_macro avg": { "f1-score": 0.8399298987078421, "precision": 0.8567686178203948, "recall": 0.8257557814942523, "support": 31600.0 }, "eval_runtime": 6.2596, "eval_samples_per_second": 12.78, "eval_steps_per_second": 1.598, "eval_weighted avg": { "f1-score": 0.9014915588643904, "precision": 0.9007476246179443, "recall": 0.9038291139240506, "support": 31600.0 }, "step": 1296 } ], "logging_steps": 500, "max_steps": 1620, "num_input_tokens_seen": 0, "num_train_epochs": 20, "save_steps": 500, "total_flos": 2300653003488000.0, "train_batch_size": 4, "trial_name": null, "trial_params": null }