Falcon-7B-Instruct-ORPO-SFT / trainer_log.jsonl
chchen's picture
Model save
3142e70 verified
raw
history blame contribute delete
No virus
3.41 kB
{"current_steps": 10, "total_steps": 168, "loss": 0.8422, "learning_rate": 4.957230266673969e-06, "epoch": 0.17777777777777778, "percentage": 5.95, "elapsed_time": "0:00:16", "remaining_time": "0:04:23"}
{"current_steps": 20, "total_steps": 168, "loss": 0.7171, "learning_rate": 4.828686741593921e-06, "epoch": 0.35555555555555557, "percentage": 11.9, "elapsed_time": "0:00:32", "remaining_time": "0:04:00"}
{"current_steps": 30, "total_steps": 168, "loss": 0.5551, "learning_rate": 4.618852307232078e-06, "epoch": 0.5333333333333333, "percentage": 17.86, "elapsed_time": "0:00:48", "remaining_time": "0:03:42"}
{"current_steps": 40, "total_steps": 168, "loss": 0.4059, "learning_rate": 4.335051964269395e-06, "epoch": 0.7111111111111111, "percentage": 23.81, "elapsed_time": "0:01:04", "remaining_time": "0:03:24"}
{"current_steps": 50, "total_steps": 168, "loss": 0.3053, "learning_rate": 3.987192750660719e-06, "epoch": 0.8888888888888888, "percentage": 29.76, "elapsed_time": "0:01:19", "remaining_time": "0:03:08"}
{"current_steps": 60, "total_steps": 168, "loss": 0.2825, "learning_rate": 3.587417902020876e-06, "epoch": 1.0666666666666667, "percentage": 35.71, "elapsed_time": "0:01:35", "remaining_time": "0:02:52"}
{"current_steps": 70, "total_steps": 168, "loss": 0.2082, "learning_rate": 3.1496829497545268e-06, "epoch": 1.2444444444444445, "percentage": 41.67, "elapsed_time": "0:01:51", "remaining_time": "0:02:35"}
{"current_steps": 80, "total_steps": 168, "loss": 0.1955, "learning_rate": 2.6892685546987724e-06, "epoch": 1.4222222222222223, "percentage": 47.62, "elapsed_time": "0:02:07", "remaining_time": "0:02:19"}
{"current_steps": 90, "total_steps": 168, "loss": 0.2161, "learning_rate": 2.2222470825144806e-06, "epoch": 1.6, "percentage": 53.57, "elapsed_time": "0:02:22", "remaining_time": "0:02:03"}
{"current_steps": 100, "total_steps": 168, "loss": 0.169, "learning_rate": 1.7649215418673847e-06, "epoch": 1.7777777777777777, "percentage": 59.52, "elapsed_time": "0:02:38", "remaining_time": "0:01:47"}
{"current_steps": 110, "total_steps": 168, "loss": 0.2051, "learning_rate": 1.3332564712129845e-06, "epoch": 1.9555555555555557, "percentage": 65.48, "elapsed_time": "0:02:54", "remaining_time": "0:01:31"}
{"current_steps": 120, "total_steps": 168, "loss": 0.2007, "learning_rate": 9.423206410612498e-07, "epoch": 2.1333333333333333, "percentage": 71.43, "elapsed_time": "0:03:09", "remaining_time": "0:01:15"}
{"current_steps": 130, "total_steps": 168, "loss": 0.1866, "learning_rate": 6.057610261367044e-07, "epoch": 2.311111111111111, "percentage": 77.38, "elapsed_time": "0:03:25", "remaining_time": "0:01:00"}
{"current_steps": 140, "total_steps": 168, "loss": 0.2212, "learning_rate": 3.3532641026504415e-07, "epoch": 2.488888888888889, "percentage": 83.33, "elapsed_time": "0:03:41", "remaining_time": "0:00:44"}
{"current_steps": 150, "total_steps": 168, "loss": 0.1776, "learning_rate": 1.4045725421448332e-07, "epoch": 2.6666666666666665, "percentage": 89.29, "elapsed_time": "0:03:56", "remaining_time": "0:00:28"}
{"current_steps": 160, "total_steps": 168, "loss": 0.1686, "learning_rate": 2.7956143581177874e-08, "epoch": 2.8444444444444446, "percentage": 95.24, "elapsed_time": "0:04:11", "remaining_time": "0:00:12"}
{"current_steps": 168, "total_steps": 168, "epoch": 2.986666666666667, "percentage": 100.0, "elapsed_time": "0:04:24", "remaining_time": "0:00:00"}