Training in progress, step 100
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +6 -0
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 83945296
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6da3ab11619d0446f40c3dbcaa0ea8306efeccccd3d875557a720ce0197721ed
|
3 |
size 83945296
|
trainer_log.jsonl
CHANGED
@@ -4,3 +4,9 @@
|
|
4 |
{"current_steps": 40, "total_steps": 450, "loss": 1.736, "accuracy": 0.706250011920929, "learning_rate": 4.444444444444444e-06, "epoch": 0.8888888888888888, "percentage": 8.89, "elapsed_time": "0:01:24", "remaining_time": "0:14:22"}
|
5 |
{"current_steps": 50, "total_steps": 450, "loss": 1.4945, "accuracy": 0.7875000238418579, "learning_rate": 4.998119881260576e-06, "epoch": 1.1111111111111112, "percentage": 11.11, "elapsed_time": "0:01:44", "remaining_time": "0:13:58"}
|
6 |
{"current_steps": 50, "total_steps": 450, "eval_loss": 1.276250958442688, "epoch": 1.1111111111111112, "percentage": 11.11, "elapsed_time": "0:01:48", "remaining_time": "0:14:25"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4 |
{"current_steps": 40, "total_steps": 450, "loss": 1.736, "accuracy": 0.706250011920929, "learning_rate": 4.444444444444444e-06, "epoch": 0.8888888888888888, "percentage": 8.89, "elapsed_time": "0:01:24", "remaining_time": "0:14:22"}
|
5 |
{"current_steps": 50, "total_steps": 450, "loss": 1.4945, "accuracy": 0.7875000238418579, "learning_rate": 4.998119881260576e-06, "epoch": 1.1111111111111112, "percentage": 11.11, "elapsed_time": "0:01:44", "remaining_time": "0:13:58"}
|
6 |
{"current_steps": 50, "total_steps": 450, "eval_loss": 1.276250958442688, "epoch": 1.1111111111111112, "percentage": 11.11, "elapsed_time": "0:01:48", "remaining_time": "0:14:25"}
|
7 |
+
{"current_steps": 60, "total_steps": 450, "loss": 1.1242, "accuracy": 0.831250011920929, "learning_rate": 4.983095894354858e-06, "epoch": 1.3333333333333333, "percentage": 13.33, "elapsed_time": "0:02:10", "remaining_time": "0:14:07"}
|
8 |
+
{"current_steps": 70, "total_steps": 450, "loss": 0.7274, "accuracy": 0.800000011920929, "learning_rate": 4.953138276568462e-06, "epoch": 1.5555555555555556, "percentage": 15.56, "elapsed_time": "0:02:30", "remaining_time": "0:13:38"}
|
9 |
+
{"current_steps": 80, "total_steps": 450, "loss": 0.6374, "accuracy": 0.762499988079071, "learning_rate": 4.908427196539701e-06, "epoch": 1.7777777777777777, "percentage": 17.78, "elapsed_time": "0:02:51", "remaining_time": "0:13:11"}
|
10 |
+
{"current_steps": 90, "total_steps": 450, "loss": 0.3774, "accuracy": 0.8187500238418579, "learning_rate": 4.849231551964771e-06, "epoch": 2.0, "percentage": 20.0, "elapsed_time": "0:03:12", "remaining_time": "0:12:49"}
|
11 |
+
{"current_steps": 100, "total_steps": 450, "loss": 0.2666, "accuracy": 0.8062499761581421, "learning_rate": 4.775907352415367e-06, "epoch": 2.2222222222222223, "percentage": 22.22, "elapsed_time": "0:03:34", "remaining_time": "0:12:29"}
|
12 |
+
{"current_steps": 100, "total_steps": 450, "eval_loss": 0.24907442927360535, "epoch": 2.2222222222222223, "percentage": 22.22, "elapsed_time": "0:03:37", "remaining_time": "0:12:40"}
|