|
{ |
|
"best_metric": 0.1991778548194697, |
|
"best_model_checkpoint": "/content/drive/MyDrive/model_outputs/trial_5/checkpoint-146", |
|
"epoch": 1.0, |
|
"eval_steps": 500, |
|
"global_step": 146, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.0684931506849315, |
|
"grad_norm": 5.608231067657471, |
|
"learning_rate": 3.6003360497121445e-06, |
|
"loss": 2.2214, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 0.136986301369863, |
|
"grad_norm": 5.646218776702881, |
|
"learning_rate": 7.200672099424289e-06, |
|
"loss": 2.1624, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 0.2054794520547945, |
|
"grad_norm": 5.6624908447265625, |
|
"learning_rate": 1.041544648904501e-05, |
|
"loss": 2.1074, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 0.273972602739726, |
|
"grad_norm": 5.1634697914123535, |
|
"learning_rate": 1.0160165937842927e-05, |
|
"loss": 2.0965, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 0.3424657534246575, |
|
"grad_norm": 4.445455551147461, |
|
"learning_rate": 9.904885386640843e-06, |
|
"loss": 2.0527, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 0.410958904109589, |
|
"grad_norm": 4.640649795532227, |
|
"learning_rate": 9.64960483543876e-06, |
|
"loss": 2.0678, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 0.4794520547945205, |
|
"grad_norm": 5.322652816772461, |
|
"learning_rate": 9.394324284236676e-06, |
|
"loss": 2.0892, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 0.547945205479452, |
|
"grad_norm": 5.406436443328857, |
|
"learning_rate": 9.139043733034592e-06, |
|
"loss": 2.0179, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 0.6164383561643836, |
|
"grad_norm": 4.761965751647949, |
|
"learning_rate": 8.883763181832509e-06, |
|
"loss": 2.0074, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 0.684931506849315, |
|
"grad_norm": 4.901184558868408, |
|
"learning_rate": 8.628482630630425e-06, |
|
"loss": 2.0241, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.7534246575342466, |
|
"grad_norm": 5.2895941734313965, |
|
"learning_rate": 8.373202079428341e-06, |
|
"loss": 2.0019, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 0.821917808219178, |
|
"grad_norm": 4.653793811798096, |
|
"learning_rate": 8.117921528226258e-06, |
|
"loss": 2.0277, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 0.8904109589041096, |
|
"grad_norm": 5.342679977416992, |
|
"learning_rate": 7.862640977024174e-06, |
|
"loss": 1.9835, |
|
"step": 130 |
|
}, |
|
{ |
|
"epoch": 0.958904109589041, |
|
"grad_norm": 5.529128074645996, |
|
"learning_rate": 7.607360425822091e-06, |
|
"loss": 2.0019, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_classification_report": { |
|
"accuracy": 0.2285, |
|
"ar": { |
|
"f1-score": 0.0547945205479452, |
|
"precision": 0.46153846153846156, |
|
"recall": 0.02912621359223301, |
|
"support": 206.0 |
|
}, |
|
"cl": { |
|
"f1-score": 0.2222222222222222, |
|
"precision": 0.18932038834951456, |
|
"recall": 0.2689655172413793, |
|
"support": 290.0 |
|
}, |
|
"co": { |
|
"f1-score": 0.2832980972515856, |
|
"precision": 0.20458015267175572, |
|
"recall": 0.46048109965635736, |
|
"support": 291.0 |
|
}, |
|
"es": { |
|
"f1-score": 0.2547993019197208, |
|
"precision": 0.24829931972789115, |
|
"recall": 0.2616487455197133, |
|
"support": 279.0 |
|
}, |
|
"macro avg": { |
|
"f1-score": 0.1991778548194697, |
|
"precision": 0.27210428357115557, |
|
"recall": 0.2048681078220834, |
|
"support": 2000.0 |
|
}, |
|
"mx": { |
|
"f1-score": 0.23859649122807017, |
|
"precision": 0.24372759856630824, |
|
"recall": 0.23367697594501718, |
|
"support": 291.0 |
|
}, |
|
"pe": { |
|
"f1-score": 0.174573055028463, |
|
"precision": 0.19491525423728814, |
|
"recall": 0.15807560137457044, |
|
"support": 291.0 |
|
}, |
|
"pr": { |
|
"f1-score": 0.4567901234567901, |
|
"precision": 0.6065573770491803, |
|
"recall": 0.36633663366336633, |
|
"support": 101.0 |
|
}, |
|
"uy": { |
|
"f1-score": 0.10752688172043011, |
|
"precision": 0.3, |
|
"recall": 0.06550218340611354, |
|
"support": 229.0 |
|
}, |
|
"ve": { |
|
"f1-score": 0.0, |
|
"precision": 0.0, |
|
"recall": 0.0, |
|
"support": 22.0 |
|
}, |
|
"weighted avg": { |
|
"f1-score": 0.21012633177845003, |
|
"precision": 0.2681977677888293, |
|
"recall": 0.2285, |
|
"support": 2000.0 |
|
} |
|
}, |
|
"eval_f1": 0.1991778548194697, |
|
"eval_loss": 1.9731428623199463, |
|
"eval_runtime": 3.5688, |
|
"eval_samples_per_second": 560.405, |
|
"eval_steps_per_second": 17.653, |
|
"step": 146 |
|
} |
|
], |
|
"logging_steps": 10, |
|
"max_steps": 438, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 3, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": false |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 306938335993344.0, |
|
"train_batch_size": 32, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|