devvanshhh commited on
Commit
bc90b9d
1 Parent(s): 4eff2be

Training in progress, epoch 5, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:abcf9278bf80f871bbda4ffa9be883d3b9d1c52089b9d33c2ca021af12bc00f8
3
  size 615849402
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fbe6d608a942537e6292b2872403242323d8c3cd58fcf734be83e3dc6228f31
3
  size 615849402
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6da080e8fde1ff422407acfc1b0714d8f6aa1266c97fc465e5d731386708176d
3
  size 307910594
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2ef2d22ca2bff3aa3c27e6b5bb5fa7b38bb5a6fe226aa337d275d9e441e1668
3
  size 307910594
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15552249b9c446195b97b2b0abd07e68ddc68dd1792bd9d1e769855d57c06f5e
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6806db7e12e994c3a92c927520fdf44bec2f8e45d8dde397c2681914b7c93270
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8387f825847a9b8a2c8387203584ce1062acc3caff7113d13f9f01240448459b
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e95f78bbbb9b613376b4c17ce129da2369a70a8610283ee10e8332a35cb2fc8
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.007984320633113384,
3
- "best_model_checkpoint": "flan-search-terms/checkpoint-6000",
4
- "epoch": 4.0,
5
  "eval_steps": 500,
6
- "global_step": 6000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -131,13 +131,44 @@
131
  "eval_samples_per_second": 11.748,
132
  "eval_steps_per_second": 1.468,
133
  "step": 6000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
134
  }
135
  ],
136
  "logging_steps": 500,
137
  "max_steps": 7500,
138
  "num_train_epochs": 5,
139
  "save_steps": 500,
140
- "total_flos": 8922744225792000.0,
141
  "trial_name": null,
142
  "trial_params": null
143
  }
 
1
  {
2
+ "best_metric": 0.0076544685289263725,
3
+ "best_model_checkpoint": "flan-search-terms/checkpoint-7500",
4
+ "epoch": 5.0,
5
  "eval_steps": 500,
6
+ "global_step": 7500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
131
  "eval_samples_per_second": 11.748,
132
  "eval_steps_per_second": 1.468,
133
  "step": 6000
134
+ },
135
+ {
136
+ "epoch": 4.33,
137
+ "learning_rate": 6.666666666666667e-06,
138
+ "loss": 0.011,
139
+ "step": 6500
140
+ },
141
+ {
142
+ "epoch": 4.67,
143
+ "learning_rate": 3.3333333333333333e-06,
144
+ "loss": 0.0112,
145
+ "step": 7000
146
+ },
147
+ {
148
+ "epoch": 5.0,
149
+ "learning_rate": 0.0,
150
+ "loss": 0.0105,
151
+ "step": 7500
152
+ },
153
+ {
154
+ "epoch": 5.0,
155
+ "eval_gen_len": 8.819,
156
+ "eval_loss": 0.0076544685289263725,
157
+ "eval_rouge1": 5.2275,
158
+ "eval_rouge2": 4.3657,
159
+ "eval_rougeL": 4.8365,
160
+ "eval_rougeLsum": 4.8414,
161
+ "eval_runtime": 257.9989,
162
+ "eval_samples_per_second": 11.628,
163
+ "eval_steps_per_second": 1.453,
164
+ "step": 7500
165
  }
166
  ],
167
  "logging_steps": 500,
168
  "max_steps": 7500,
169
  "num_train_epochs": 5,
170
  "save_steps": 500,
171
+ "total_flos": 1.115343028224e+16,
172
  "trial_name": null,
173
  "trial_params": null
174
  }