deepseek_classifier / training_metrics /training_metrics.json
t8ix's picture
Upload folder using huggingface_hub
bfd111a verified
{
"training_sessions": [
{
"session_id": 1,
"epochs": [],
"parameters": {
"learning_rate": 0.0002,
"batch_size": 4,
"num_epochs": 3,
"warmup_steps": 0,
"gradient_accumulation_steps": 2,
"weight_decay": 0.01,
"lr_scheduler_type": "cosine",
"clip_grad_norm": 1.0,
"save_path": "/content/drive/MyDrive/deepseek_txt_classifier"
},
"training_started": "2025-01-30T19:27:27.458361",
"training_ended": null
},
{
"session_id": 2,
"epochs": [
{
"epoch": 1,
"timestamp": "2025-01-30T19:33:18.075195",
"train_loss": 4.0756168969514865,
"val_loss": 3.061457032888708,
"val_accuracy": 0.26017699115044246,
"f1_weighted": 0.2289007857934706,
"precision_weighted": 0.3235188957013108,
"recall_weighted": 0.26017699115044246
},
{
"epoch": 2,
"timestamp": "2025-01-30T19:33:18.075195",
"train_loss": 2.3547961317182544,
"val_loss": 2.5218266886724554,
"val_accuracy": 0.4088495575221239,
"f1_weighted": 0.3899156502168876,
"precision_weighted": 0.4584804625070112,
"recall_weighted": 0.4088495575221239
},
{
"epoch": 3,
"timestamp": "2025-01-30T19:33:18.075195",
"train_loss": 1.879219204586888,
"val_loss": 2.4548432421936117,
"val_accuracy": 0.42123893805309737,
"f1_weighted": 0.40484596795481426,
"precision_weighted": 0.4437322769455818,
"recall_weighted": 0.42123893805309737
}
],
"parameters": {
"learning_rate": 0.0002,
"batch_size": 4,
"num_epochs": 3,
"warmup_steps": 0,
"gradient_accumulation_steps": 2,
"weight_decay": 0.01,
"lr_scheduler_type": "cosine",
"clip_grad_norm": 1.0,
"save_path": "/content/drive/MyDrive/deepseek_txt_classifier"
},
"training_started": "2025-01-30T19:33:18.075195",
"training_ended": "2025-01-30T19:33:18.075195",
"final_metrics": {
"best_val_loss": 2.4548432421936117,
"total_epochs": 3,
"early_stopped": false
}
}
],
"current_session": null
}