cruiser commited on
Commit
6e5816c
1 Parent(s): 3876aa4

Training in progress, epoch 4

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0cbebfe87c4150823623cf4db06eebb2d117ca60c69ee0226024bda5e591814b
3
  size 535707205
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e7489ddabd3040de3491c14dae6f71bec7bc3101832294753f9f259d9dd0f5f
3
  size 535707205
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de3bcd2b4640ab63ff2bd32f5d297f744b2ca1336f50fd20445f9cd76739b5b6
3
  size 267858605
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25d29fa03522cd6c5bb404ab85b676cb04123d8c3995e8523340fdd0fa6ea677
3
  size 267858605
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:47fe60f138b6682f4f11f1710b9ddc0fb2882408668973136d874097a9110f35
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:baa3761bd22787daad9913f4844bcbcad10533ae7c4cd9a47b76e5790d0ecb0f
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:418275b5fc548956987d7f03901d0cd4d34ba2005600e9bf3d5900b248c41079
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c768291c0daa4d7057333ea067ae676107b99665e6dadce18b121cba5b1d1527
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 1.7141435146331787,
3
- "best_model_checkpoint": "distilbert_weight_decay_final_metrics/checkpoint-5154",
4
- "epoch": 3.0,
5
- "global_step": 5154,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -96,11 +96,39 @@
96
  "eval_samples_per_second": 436.712,
97
  "eval_steps_per_second": 27.31,
98
  "step": 5154
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
99
  }
100
  ],
101
  "max_steps": 34360,
102
  "num_train_epochs": 20,
103
- "total_flos": 2346352531037460.0,
104
  "trial_name": null,
105
  "trial_params": null
106
  }
 
1
  {
2
+ "best_metric": 1.614416241645813,
3
+ "best_model_checkpoint": "distilbert_weight_decay_final_metrics/checkpoint-6872",
4
+ "epoch": 4.0,
5
+ "global_step": 6872,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
96
  "eval_samples_per_second": 436.712,
97
  "eval_steps_per_second": 27.31,
98
  "step": 5154
99
+ },
100
+ {
101
+ "epoch": 3.2,
102
+ "learning_rate": 1.679860302677532e-05,
103
+ "loss": 0.0331,
104
+ "step": 5500
105
+ },
106
+ {
107
+ "epoch": 3.49,
108
+ "learning_rate": 1.650756693830035e-05,
109
+ "loss": 0.0402,
110
+ "step": 6000
111
+ },
112
+ {
113
+ "epoch": 3.78,
114
+ "learning_rate": 1.621653084982538e-05,
115
+ "loss": 0.0388,
116
+ "step": 6500
117
+ },
118
+ {
119
+ "epoch": 4.0,
120
+ "eval_accuracy": 0.7761743067345784,
121
+ "eval_f1": 0.7801920701860957,
122
+ "eval_loss": 1.614416241645813,
123
+ "eval_runtime": 8.1981,
124
+ "eval_samples_per_second": 431.077,
125
+ "eval_steps_per_second": 26.958,
126
+ "step": 6872
127
  }
128
  ],
129
  "max_steps": 34360,
130
  "num_train_epochs": 20,
131
+ "total_flos": 3128470041383280.0,
132
  "trial_name": null,
133
  "trial_params": null
134
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de3bcd2b4640ab63ff2bd32f5d297f744b2ca1336f50fd20445f9cd76739b5b6
3
  size 267858605
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25d29fa03522cd6c5bb404ab85b676cb04123d8c3995e8523340fdd0fa6ea677
3
  size 267858605
runs/May01_06-16-39_af1ffd0a72ec/events.out.tfevents.1682921804.af1ffd0a72ec.975.12 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d05061aa8da7e519e64457e4d7f45bca8e44c8c433924c43a82469e4753201a1
3
- size 6864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d1156f5f3753a509efcbb35df736db0526eacf984dce6e87909582c454c61ef
3
+ size 7704