catppt-7b-onc-v1 / trainer_log.jsonl
chenhugging's picture
Upload folder using huggingface_hub
b434d57 verified
{"current_steps": 10, "total_steps": 203, "loss": 0.5873, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00025, "epoch": 0.05, "percentage": 4.93, "elapsed_time": "0:00:43", "remaining_time": "0:14:00"}
{"current_steps": 20, "total_steps": 203, "loss": 0.18, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.0005, "epoch": 0.1, "percentage": 9.85, "elapsed_time": "0:01:25", "remaining_time": "0:13:01"}
{"current_steps": 30, "total_steps": 203, "loss": 0.1853, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.0004963251406715272, "epoch": 0.15, "percentage": 14.78, "elapsed_time": "0:02:06", "remaining_time": "0:12:10"}
{"current_steps": 40, "total_steps": 203, "loss": 0.1675, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.0004854085994147815, "epoch": 0.2, "percentage": 19.7, "elapsed_time": "0:02:50", "remaining_time": "0:11:33"}
{"current_steps": 50, "total_steps": 203, "loss": 0.1538, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00046757131025753886, "epoch": 0.25, "percentage": 24.63, "elapsed_time": "0:03:33", "remaining_time": "0:10:51"}
{"current_steps": 60, "total_steps": 203, "loss": 0.1566, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00044333766942743246, "epoch": 0.29, "percentage": 29.56, "elapsed_time": "0:04:17", "remaining_time": "0:10:12"}
{"current_steps": 70, "total_steps": 203, "loss": 0.1319, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.0004134201186930015, "epoch": 0.34, "percentage": 34.48, "elapsed_time": "0:05:01", "remaining_time": "0:09:32"}
{"current_steps": 80, "total_steps": 203, "loss": 0.1561, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00037869820037745775, "epoch": 0.39, "percentage": 39.41, "elapsed_time": "0:05:44", "remaining_time": "0:08:50"}
{"current_steps": 90, "total_steps": 203, "loss": 0.151, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.0003401926998041959, "epoch": 0.44, "percentage": 44.33, "elapsed_time": "0:06:26", "remaining_time": "0:08:05"}
{"current_steps": 100, "total_steps": 203, "loss": 0.1364, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00029903563535704927, "epoch": 0.49, "percentage": 49.26, "elapsed_time": "0:07:07", "remaining_time": "0:07:20"}
{"current_steps": 110, "total_steps": 203, "loss": 0.1346, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.0002564369784137472, "epoch": 0.54, "percentage": 54.19, "elapsed_time": "0:07:50", "remaining_time": "0:06:37"}
{"current_steps": 120, "total_steps": 203, "loss": 0.1329, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00021364908154907752, "epoch": 0.59, "percentage": 59.11, "elapsed_time": "0:08:37", "remaining_time": "0:05:57"}
{"current_steps": 130, "total_steps": 203, "loss": 0.1321, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.00017192986077855136, "epoch": 0.64, "percentage": 64.04, "elapsed_time": "0:09:20", "remaining_time": "0:05:14"}
{"current_steps": 140, "total_steps": 203, "loss": 0.142, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.0001325058142431701, "epoch": 0.69, "percentage": 68.97, "elapsed_time": "0:10:04", "remaining_time": "0:04:31"}
{"current_steps": 150, "total_steps": 203, "loss": 0.1461, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.653596454434699e-05, "epoch": 0.74, "percentage": 73.89, "elapsed_time": "0:10:47", "remaining_time": "0:03:48"}
{"current_steps": 160, "total_steps": 203, "loss": 0.1352, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.507778478375834e-05, "epoch": 0.79, "percentage": 78.82, "elapsed_time": "0:11:32", "remaining_time": "0:03:05"}
{"current_steps": 170, "total_steps": 203, "loss": 0.1247, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.905611004420359e-05, "epoch": 0.84, "percentage": 83.74, "elapsed_time": "0:12:15", "remaining_time": "0:02:22"}
{"current_steps": 180, "total_steps": 203, "loss": 0.1318, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.9235948278956e-05, "epoch": 0.88, "percentage": 88.67, "elapsed_time": "0:12:59", "remaining_time": "0:01:39"}
{"current_steps": 190, "total_steps": 203, "loss": 0.1373, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.199989938854372e-06, "epoch": 0.93, "percentage": 93.6, "elapsed_time": "0:13:41", "remaining_time": "0:00:56"}
{"current_steps": 200, "total_steps": 203, "loss": 0.1067, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.314775287923677e-07, "epoch": 0.98, "percentage": 98.52, "elapsed_time": "0:14:24", "remaining_time": "0:00:12"}
{"current_steps": 203, "total_steps": 203, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:14:38", "remaining_time": "0:00:00"}