Training in progress, epoch 8
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +31 -3
- pytorch_model.bin +1 -1
- runs/May01_06-16-39_af1ffd0a72ec/events.out.tfevents.1682921804.af1ffd0a72ec.975.12 +2 -2
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 535707205
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e7e2d9069364a0c1e77dc58988ccf5e4e8a4ecdd81bfbc7f7e1ed5e9a7b82b5
|
3 |
size 535707205
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267858605
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c84e4058a3c64eed475647e382baf9bc9aa51800a15b02015929e01dc37add66
|
3 |
size 267858605
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f146ca546ec8fc540669de1c29f4b92aed354ab067b78dc9ec30842fd86abb1b
|
3 |
size 14575
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a5d295224ad85fae86c0e88399ed6faedb60e913ff68e5079746d7ca3718a9d
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": 1.614416241645813,
|
3 |
"best_model_checkpoint": "distilbert_weight_decay_final_metrics/checkpoint-6872",
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -220,11 +220,39 @@
|
|
220 |
"eval_samples_per_second": 436.031,
|
221 |
"eval_steps_per_second": 27.267,
|
222 |
"step": 12026
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
223 |
}
|
224 |
],
|
225 |
"max_steps": 34360,
|
226 |
"num_train_epochs": 20,
|
227 |
-
"total_flos":
|
228 |
"trial_name": null,
|
229 |
"trial_params": null
|
230 |
}
|
|
|
1 |
{
|
2 |
"best_metric": 1.614416241645813,
|
3 |
"best_model_checkpoint": "distilbert_weight_decay_final_metrics/checkpoint-6872",
|
4 |
+
"epoch": 8.0,
|
5 |
+
"global_step": 13744,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
220 |
"eval_samples_per_second": 436.031,
|
221 |
"eval_steps_per_second": 27.267,
|
222 |
"step": 12026
|
223 |
+
},
|
224 |
+
{
|
225 |
+
"epoch": 7.28,
|
226 |
+
"learning_rate": 1.2724097788125728e-05,
|
227 |
+
"loss": 0.0239,
|
228 |
+
"step": 12500
|
229 |
+
},
|
230 |
+
{
|
231 |
+
"epoch": 7.57,
|
232 |
+
"learning_rate": 1.2433061699650757e-05,
|
233 |
+
"loss": 0.0261,
|
234 |
+
"step": 13000
|
235 |
+
},
|
236 |
+
{
|
237 |
+
"epoch": 7.86,
|
238 |
+
"learning_rate": 1.2142025611175788e-05,
|
239 |
+
"loss": 0.0194,
|
240 |
+
"step": 13500
|
241 |
+
},
|
242 |
+
{
|
243 |
+
"epoch": 8.0,
|
244 |
+
"eval_accuracy": 0.7869269949066214,
|
245 |
+
"eval_f1": 0.7901736955407076,
|
246 |
+
"eval_loss": 1.923709750175476,
|
247 |
+
"eval_runtime": 9.3451,
|
248 |
+
"eval_samples_per_second": 378.167,
|
249 |
+
"eval_steps_per_second": 23.649,
|
250 |
+
"step": 13744
|
251 |
}
|
252 |
],
|
253 |
"max_steps": 34360,
|
254 |
"num_train_epochs": 20,
|
255 |
+
"total_flos": 6256940082766560.0,
|
256 |
"trial_name": null,
|
257 |
"trial_params": null
|
258 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267858605
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c84e4058a3c64eed475647e382baf9bc9aa51800a15b02015929e01dc37add66
|
3 |
size 267858605
|
runs/May01_06-16-39_af1ffd0a72ec/events.out.tfevents.1682921804.af1ffd0a72ec.975.12
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed4849df953d74acb8798ce1bc08ddfe231b22fce0bf72779d17c8bfeacc54ec
|
3 |
+
size 11378
|