Gemma-7B-It-ORPO-SFT / trainer_log.jsonl
chchen's picture
Model save
f651cd7 verified
raw
history blame contribute delete
No virus
3.41 kB
{"current_steps": 10, "total_steps": 168, "loss": 0.7526, "learning_rate": 4.957230266673969e-06, "epoch": 0.17777777777777778, "percentage": 5.95, "elapsed_time": "0:00:42", "remaining_time": "0:11:14"}
{"current_steps": 20, "total_steps": 168, "loss": 0.4679, "learning_rate": 4.828686741593921e-06, "epoch": 0.35555555555555557, "percentage": 11.9, "elapsed_time": "0:01:24", "remaining_time": "0:10:23"}
{"current_steps": 30, "total_steps": 168, "loss": 0.2544, "learning_rate": 4.618852307232078e-06, "epoch": 0.5333333333333333, "percentage": 17.86, "elapsed_time": "0:02:04", "remaining_time": "0:09:32"}
{"current_steps": 40, "total_steps": 168, "loss": 0.1482, "learning_rate": 4.335051964269395e-06, "epoch": 0.7111111111111111, "percentage": 23.81, "elapsed_time": "0:02:44", "remaining_time": "0:08:46"}
{"current_steps": 50, "total_steps": 168, "loss": 0.1171, "learning_rate": 3.987192750660719e-06, "epoch": 0.8888888888888888, "percentage": 29.76, "elapsed_time": "0:03:25", "remaining_time": "0:08:05"}
{"current_steps": 60, "total_steps": 168, "loss": 0.1406, "learning_rate": 3.587417902020876e-06, "epoch": 1.0666666666666667, "percentage": 35.71, "elapsed_time": "0:04:07", "remaining_time": "0:07:25"}
{"current_steps": 70, "total_steps": 168, "loss": 0.0862, "learning_rate": 3.1496829497545268e-06, "epoch": 1.2444444444444445, "percentage": 41.67, "elapsed_time": "0:04:47", "remaining_time": "0:06:42"}
{"current_steps": 80, "total_steps": 168, "loss": 0.0944, "learning_rate": 2.6892685546987724e-06, "epoch": 1.4222222222222223, "percentage": 47.62, "elapsed_time": "0:05:28", "remaining_time": "0:06:01"}
{"current_steps": 90, "total_steps": 168, "loss": 0.1177, "learning_rate": 2.2222470825144806e-06, "epoch": 1.6, "percentage": 53.57, "elapsed_time": "0:06:09", "remaining_time": "0:05:20"}
{"current_steps": 100, "total_steps": 168, "loss": 0.0735, "learning_rate": 1.7649215418673847e-06, "epoch": 1.7777777777777777, "percentage": 59.52, "elapsed_time": "0:06:51", "remaining_time": "0:04:39"}
{"current_steps": 110, "total_steps": 168, "loss": 0.1145, "learning_rate": 1.3332564712129845e-06, "epoch": 1.9555555555555557, "percentage": 65.48, "elapsed_time": "0:07:31", "remaining_time": "0:03:58"}
{"current_steps": 120, "total_steps": 168, "loss": 0.0876, "learning_rate": 9.423206410612498e-07, "epoch": 2.1333333333333333, "percentage": 71.43, "elapsed_time": "0:08:12", "remaining_time": "0:03:16"}
{"current_steps": 130, "total_steps": 168, "loss": 0.0931, "learning_rate": 6.057610261367044e-07, "epoch": 2.311111111111111, "percentage": 77.38, "elapsed_time": "0:08:53", "remaining_time": "0:02:35"}
{"current_steps": 140, "total_steps": 168, "loss": 0.1052, "learning_rate": 3.3532641026504415e-07, "epoch": 2.488888888888889, "percentage": 83.33, "elapsed_time": "0:09:33", "remaining_time": "0:01:54"}
{"current_steps": 150, "total_steps": 168, "loss": 0.0899, "learning_rate": 1.4045725421448332e-07, "epoch": 2.6666666666666665, "percentage": 89.29, "elapsed_time": "0:10:14", "remaining_time": "0:01:13"}
{"current_steps": 160, "total_steps": 168, "loss": 0.0744, "learning_rate": 2.7956143581177874e-08, "epoch": 2.8444444444444446, "percentage": 95.24, "elapsed_time": "0:10:56", "remaining_time": "0:00:32"}
{"current_steps": 168, "total_steps": 168, "epoch": 2.986666666666667, "percentage": 100.0, "elapsed_time": "0:11:29", "remaining_time": "0:00:00"}