ben81828 commited on
Commit
7be8e37
·
verified ·
1 Parent(s): 2c2790a

Training in progress, step 750

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_log.jsonl +11 -0
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2cc88a9133bd30e9f761aeca11737097aa2bc75e291ca7a8f1b1b21cc4ee3a5a
3
  size 29034840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61fe60cd6a5c594c616d66be0bb1d9dea2f9d3063cedfcf69a99a1e90689b1b0
3
  size 29034840
trainer_log.jsonl CHANGED
@@ -156,3 +156,14 @@
156
  {"current_steps": 695, "total_steps": 3400, "loss": 0.5351, "lr": 9.362182973536569e-05, "epoch": 0.17898532062838013, "percentage": 20.44, "elapsed_time": "0:31:00", "remaining_time": "2:00:42", "throughput": 3920.82, "total_tokens": 7295568}
157
  {"current_steps": 700, "total_steps": 3400, "loss": 0.5014, "lr": 9.35024767453647e-05, "epoch": 0.1802729848055627, "percentage": 20.59, "elapsed_time": "0:32:28", "remaining_time": "2:05:16", "throughput": 3770.1, "total_tokens": 7347040}
158
  {"current_steps": 700, "total_steps": 3400, "eval_loss": 0.5440100431442261, "epoch": 0.1802729848055627, "percentage": 20.59, "elapsed_time": "0:33:07", "remaining_time": "2:07:47", "throughput": 3695.91, "total_tokens": 7347040}
 
 
 
 
 
 
 
 
 
 
 
 
156
  {"current_steps": 695, "total_steps": 3400, "loss": 0.5351, "lr": 9.362182973536569e-05, "epoch": 0.17898532062838013, "percentage": 20.44, "elapsed_time": "0:31:00", "remaining_time": "2:00:42", "throughput": 3920.82, "total_tokens": 7295568}
157
  {"current_steps": 700, "total_steps": 3400, "loss": 0.5014, "lr": 9.35024767453647e-05, "epoch": 0.1802729848055627, "percentage": 20.59, "elapsed_time": "0:32:28", "remaining_time": "2:05:16", "throughput": 3770.1, "total_tokens": 7347040}
158
  {"current_steps": 700, "total_steps": 3400, "eval_loss": 0.5440100431442261, "epoch": 0.1802729848055627, "percentage": 20.59, "elapsed_time": "0:33:07", "remaining_time": "2:07:47", "throughput": 3695.91, "total_tokens": 7347040}
159
+ {"current_steps": 705, "total_steps": 3400, "loss": 0.543, "lr": 9.338209491537257e-05, "epoch": 0.1815606489827453, "percentage": 20.74, "elapsed_time": "0:34:43", "remaining_time": "2:12:44", "throughput": 3551.6, "total_tokens": 7399584}
160
+ {"current_steps": 710, "total_steps": 3400, "loss": 0.4995, "lr": 9.326068709243727e-05, "epoch": 0.1828483131599279, "percentage": 20.88, "elapsed_time": "0:36:11", "remaining_time": "2:17:07", "throughput": 3432.24, "total_tokens": 7452928}
161
+ {"current_steps": 715, "total_steps": 3400, "loss": 0.5109, "lr": 9.313825614787177e-05, "epoch": 0.18413597733711048, "percentage": 21.03, "elapsed_time": "0:37:39", "remaining_time": "2:21:26", "throughput": 3321.05, "total_tokens": 7505112}
162
+ {"current_steps": 720, "total_steps": 3400, "loss": 0.4932, "lr": 9.301480497718593e-05, "epoch": 0.18542364151429308, "percentage": 21.18, "elapsed_time": "0:39:07", "remaining_time": "2:25:37", "throughput": 3219.44, "total_tokens": 7557608}
163
+ {"current_steps": 725, "total_steps": 3400, "loss": 0.5573, "lr": 9.289033650001817e-05, "epoch": 0.18671130569147568, "percentage": 21.32, "elapsed_time": "0:40:36", "remaining_time": "2:29:51", "throughput": 3122.82, "total_tokens": 7610048}
164
+ {"current_steps": 730, "total_steps": 3400, "loss": 0.5305, "lr": 9.276485366006634e-05, "epoch": 0.18799896986865824, "percentage": 21.47, "elapsed_time": "0:42:04", "remaining_time": "2:33:54", "throughput": 3034.8, "total_tokens": 7662056}
165
+ {"current_steps": 735, "total_steps": 3400, "loss": 0.5369, "lr": 9.263835942501807e-05, "epoch": 0.18928663404584084, "percentage": 21.62, "elapsed_time": "0:43:34", "remaining_time": "2:37:58", "throughput": 2950.71, "total_tokens": 7713656}
166
+ {"current_steps": 740, "total_steps": 3400, "loss": 0.5397, "lr": 9.251085678648072e-05, "epoch": 0.19057429822302344, "percentage": 21.76, "elapsed_time": "0:45:02", "remaining_time": "2:41:54", "throughput": 2873.57, "total_tokens": 7765992}
167
+ {"current_steps": 745, "total_steps": 3400, "loss": 0.5116, "lr": 9.238234875991046e-05, "epoch": 0.19186196240020603, "percentage": 21.91, "elapsed_time": "0:46:31", "remaining_time": "2:45:49", "throughput": 2800.48, "total_tokens": 7818448}
168
+ {"current_steps": 750, "total_steps": 3400, "loss": 0.541, "lr": 9.225283838454111e-05, "epoch": 0.19314962657738863, "percentage": 22.06, "elapsed_time": "0:47:59", "remaining_time": "2:49:34", "throughput": 2733.14, "total_tokens": 7870520}
169
+ {"current_steps": 750, "total_steps": 3400, "eval_loss": 0.5273815989494324, "epoch": 0.19314962657738863, "percentage": 22.06, "elapsed_time": "0:48:38", "remaining_time": "2:51:53", "throughput": 2696.45, "total_tokens": 7870520}