devvanshhh committed on
Commit
bb924ec
·
1 Parent(s): 6eb87b0

Training in progress, epoch 1, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9257626d935eea005747b6117f38e8db18007dbd38f54949943c9dcf0ab36545
3
  size 1256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e75e2c23c99eadad00497a3969a361337133cb50eb29550bcfd57d3c4416b3bf
3
  size 1256
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7a27874f7dc93ced479b2661f0507a486022fb461d136d2fd60f69bdbbfaa50
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3206cfea353705871f16d46e55ccf93893b489d46b83fd7ba2c4d45d71b93a7
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f882d1e558074512a0f5a92bb9dda78e5353ba094d4875de647eb3d96a8f6114
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b9bfd309a58bb117e3966aecfcd713fe78e781c92b596afe99f2ae8dde39b29
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 984,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -16,49 +16,17 @@
16
  "eval_rouge2": 25.6511,
17
  "eval_rougeL": 30.5481,
18
  "eval_rougeLsum": 30.8868,
19
- "eval_runtime": 148.51,
20
- "eval_samples_per_second": 1.959,
21
- "eval_steps_per_second": 0.249,
22
  "step": 328
23
- },
24
- {
25
- "epoch": 1.52,
26
- "learning_rate": 3.125e-05,
27
- "loss": 0.7084,
28
- "step": 500
29
- },
30
- {
31
- "epoch": 2.0,
32
- "eval_gen_len": 10.608247422680412,
33
- "eval_loss": 0.6409556865692139,
34
- "eval_rouge1": 34.106,
35
- "eval_rouge2": 25.6511,
36
- "eval_rougeL": 30.5481,
37
- "eval_rougeLsum": 30.8868,
38
- "eval_runtime": 148.1245,
39
- "eval_samples_per_second": 1.965,
40
- "eval_steps_per_second": 0.25,
41
- "step": 656
42
- },
43
- {
44
- "epoch": 3.0,
45
- "eval_gen_len": 10.608247422680412,
46
- "eval_loss": 0.6409556865692139,
47
- "eval_rouge1": 34.106,
48
- "eval_rouge2": 25.6511,
49
- "eval_rougeL": 30.5481,
50
- "eval_rougeLsum": 30.8868,
51
- "eval_runtime": 142.7393,
52
- "eval_samples_per_second": 2.039,
53
- "eval_steps_per_second": 0.259,
54
- "step": 984
55
  }
56
  ],
57
  "logging_steps": 500,
58
  "max_steps": 2624,
59
  "num_train_epochs": 8,
60
  "save_steps": 500,
61
- "total_flos": 7374426541719552.0,
62
  "trial_name": null,
63
  "trial_params": null
64
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.0,
5
  "eval_steps": 500,
6
+ "global_step": 328,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
16
  "eval_rouge2": 25.6511,
17
  "eval_rougeL": 30.5481,
18
  "eval_rougeLsum": 30.8868,
19
+ "eval_runtime": 145.9508,
20
+ "eval_samples_per_second": 1.994,
21
+ "eval_steps_per_second": 0.254,
22
  "step": 328
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
23
  }
24
  ],
25
  "logging_steps": 500,
26
  "max_steps": 2624,
27
  "num_train_epochs": 8,
28
  "save_steps": 500,
29
+ "total_flos": 2458142180573184.0,
30
  "trial_name": null,
31
  "trial_params": null
32
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9162668598cf13fecc16e9e9d7efcfa7ee698b28ece9be6da0a39db65802afa5
3
- size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57fefa357a66f843a7892370f3ccf4b6c54dcf7fc01e2cacb473bbb4d60ec07a
3
+ size 4792