dq158 committed on
Commit
fd9a490
1 Parent(s): f28be24

Training in progress, epoch 2, checkpoint

Browse files
last-checkpoint/adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e8387a6b711dbe733802091f3fb62ee7fa86c449abfedb4e65346acd48fe344
3
  size 18980874
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb462ee5d4ed0064da716ca2c5594e3e3e5e70319a6ab418abac9cfb7d0edee2
3
  size 18980874
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21afb3fbcfdf6ae8a3dbdda6079c6633801aedf8ea6d86885a05cb51c34e62b2
3
  size 37990394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a19be04da38748a1cb039e6c0dfe07bb27492e90ebdf0e33f955d798f4daa98f
3
  size 37990394
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97677b34e8dfeaf1cb59c897df795cae8a6cd1ffd721cb6a72c9218e318994ed
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:911b0a95cae6d6f41378e1da173908f3c8007c9ee9c948ae7dbbb7364f4aa68a
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d144a1c2bd6794181df2dc95832a4077b6570b2942de19e66d9c2cae2fcf7f99
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c109f720765794b94b48266e277c7993d9e80f89e80300af67dc66dd1122b7af
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 2.273033857345581,
3
- "best_model_checkpoint": "dq158/pingusPongus/checkpoint-6323",
4
- "epoch": 2.0,
5
  "eval_steps": 500,
6
- "global_step": 6323,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -117,13 +117,68 @@
117
  "eval_steps_per_second": 0.629,
118
  "eval_translation_length": 53403,
119
  "step": 6323
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
120
  }
121
  ],
122
  "logging_steps": 500,
123
  "max_steps": 94830,
124
  "num_train_epochs": 30,
125
  "save_steps": 500,
126
- "total_flos": 4.3332645393373594e+17,
127
  "trial_name": null,
128
  "trial_params": null
129
  }
 
1
  {
2
+ "best_metric": 2.2457683086395264,
3
+ "best_model_checkpoint": "dq158/pingusPongus/checkpoint-9484",
4
+ "epoch": 2.9998418472244186,
5
  "eval_steps": 500,
6
+ "global_step": 9484,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
117
  "eval_steps_per_second": 0.629,
118
  "eval_translation_length": 53403,
119
  "step": 6323
120
+ },
121
+ {
122
+ "epoch": 2.06,
123
+ "learning_rate": 0.00019775599595764338,
124
+ "loss": 2.3691,
125
+ "step": 6500
126
+ },
127
+ {
128
+ "epoch": 2.21,
129
+ "learning_rate": 0.0001973932645621972,
130
+ "loss": 2.3412,
131
+ "step": 7000
132
+ },
133
+ {
134
+ "epoch": 2.37,
135
+ "learning_rate": 0.00019700375482672989,
136
+ "loss": 2.3373,
137
+ "step": 7500
138
+ },
139
+ {
140
+ "epoch": 2.53,
141
+ "learning_rate": 0.00019658757384719084,
142
+ "loss": 2.3416,
143
+ "step": 8000
144
+ },
145
+ {
146
+ "epoch": 2.69,
147
+ "learning_rate": 0.0001961448360528051,
148
+ "loss": 2.3669,
149
+ "step": 8500
150
+ },
151
+ {
152
+ "epoch": 2.85,
153
+ "learning_rate": 0.0001956756631746107,
154
+ "loss": 2.347,
155
+ "step": 9000
156
+ },
157
+ {
158
+ "epoch": 3.0,
159
+ "eval_bleu": 1.0,
160
+ "eval_brevity_penalty": 1.0,
161
+ "eval_length_ratio": 1.0,
162
+ "eval_loss": 2.2457683086395264,
163
+ "eval_precisions": [
164
+ 1.0,
165
+ 1.0,
166
+ 1.0,
167
+ 1.0
168
+ ],
169
+ "eval_reference_length": 53407,
170
+ "eval_runtime": 1141.3701,
171
+ "eval_samples_per_second": 2.463,
172
+ "eval_steps_per_second": 0.616,
173
+ "eval_translation_length": 53407,
174
+ "step": 9484
175
  }
176
  ],
177
  "logging_steps": 500,
178
  "max_steps": 94830,
179
  "num_train_epochs": 30,
180
  "save_steps": 500,
181
+ "total_flos": 6.499896809006039e+17,
182
  "trial_name": null,
183
  "trial_params": null
184
  }