dq158 committed on
Commit
da117c8
1 Parent(s): a5ff9bb

Training in progress, epoch 0, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "auto_mapping": null,
3
- "base_model_name_or_path": "google/flan-t5-xxl",
4
  "bias": "none",
5
  "fan_in_fan_out": false,
6
  "inference_mode": true,
 
1
  {
2
  "auto_mapping": null,
3
+ "base_model_name_or_path": "google/flan-t5-xl",
4
  "bias": "none",
5
  "fan_in_fan_out": false,
6
  "inference_mode": true,
last-checkpoint/global_step790/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4be5091c1d4d363dd5d9eeb380cc1069ccee2d73d55ba4f8637006d5581477e4
3
+ size 28315088
last-checkpoint/global_step790/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bcca6fce13123f8cd9ec374ddf906c7b7e17d2a43f60cb5a3f97cf206923c37
3
+ size 28315088
last-checkpoint/global_step790/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64621a2d4d13b9e92b17253bfd2c4bfaab36e77444417075b812c0ad48aba63c
3
+ size 2850543502
last-checkpoint/global_step790/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e6f73fe9e7e2619f711c9811c18e0e7ca3757a4f3d858dd85f66e093697a8f9
3
+ size 2850543310
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step1581
 
1
+ global_step790
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f232d8d672d6ff9e3cc5ac4ba64234b9f002d5e144a43ee183dc01871e2f10e5
3
  size 14512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16a7aa1548464e6c880ebd42aba4c07ee57fb38feb25979f4c82c0f0bec9f0e6
3
  size 14512
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e25f573f6bcb03f0bbfe93da192a1ab49ba692dcab33095de44fc91e5e4216a5
3
  size 14512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38d40d71f540bdd7fdb4af7e756f13010eb6a96ab531b88e35903b066788ad63
3
  size 14512
last-checkpoint/trainer_state.json CHANGED
@@ -1,56 +1,44 @@
1
  {
2
- "best_metric": 2.2135026454925537,
3
- "best_model_checkpoint": "dq158/pingusPongus/checkpoint-1581",
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
- "global_step": 1581,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
- {
12
- "epoch": 0.32,
13
- "learning_rate": 0.0008497772211805019,
14
- "loss": 2.4966,
15
- "step": 500
16
- },
17
  {
18
  "epoch": 0.63,
19
- "learning_rate": 0.0009445572420019074,
20
- "loss": 2.3574,
21
- "step": 1000
22
- },
23
- {
24
- "epoch": 0.95,
25
- "learning_rate": 0.0009999999999999998,
26
- "loss": 2.3094,
27
- "step": 1500
28
  },
29
  {
30
  "epoch": 1.0,
31
  "eval_bleu": 1.0,
32
  "eval_brevity_penalty": 1.0,
33
  "eval_length_ratio": 1.0,
34
- "eval_loss": 2.2135026454925537,
35
  "eval_precisions": [
36
  1.0,
37
  1.0,
38
  1.0,
39
  1.0
40
  ],
41
- "eval_reference_length": 53394,
42
- "eval_runtime": 2937.3471,
43
- "eval_samples_per_second": 0.957,
44
- "eval_steps_per_second": 0.12,
45
- "eval_translation_length": 53394,
46
- "step": 1581
47
  }
48
  ],
49
  "logging_steps": 500,
50
- "max_steps": 15810,
51
- "num_train_epochs": 10,
52
  "save_steps": 500,
53
- "total_flos": 771945142419456.0,
54
  "trial_name": null,
55
  "trial_params": null
56
  }
 
1
  {
2
+ "best_metric": 2.392251491546631,
3
+ "best_model_checkpoint": "dq158/pingusPongus/checkpoint-790",
4
+ "epoch": 0.9993674889310563,
5
  "eval_steps": 500,
6
+ "global_step": 790,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
 
 
 
 
 
 
11
  {
12
  "epoch": 0.63,
13
+ "learning_rate": 8.49777221180502e-05,
14
+ "loss": 2.8794,
15
+ "step": 500
 
 
 
 
 
 
16
  },
17
  {
18
  "epoch": 1.0,
19
  "eval_bleu": 1.0,
20
  "eval_brevity_penalty": 1.0,
21
  "eval_length_ratio": 1.0,
22
+ "eval_loss": 2.392251491546631,
23
  "eval_precisions": [
24
  1.0,
25
  1.0,
26
  1.0,
27
  1.0
28
  ],
29
+ "eval_reference_length": 53098,
30
+ "eval_runtime": 1401.0268,
31
+ "eval_samples_per_second": 2.006,
32
+ "eval_steps_per_second": 0.126,
33
+ "eval_translation_length": 53098,
34
+ "step": 790
35
  }
36
  ],
37
  "logging_steps": 500,
38
+ "max_steps": 23700,
39
+ "num_train_epochs": 30,
40
  "save_steps": 500,
41
+ "total_flos": 385850466631680.0,
42
  "trial_name": null,
43
  "trial_params": null
44
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:da68e390908bbf17cdb4f041431915c87c2f3f6b8699cebf8dcb70aae5296d20
3
  size 6648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7619c25d1f961a939120b81d521c14f9d13e3f5fcb5ceba87a0c9e7d8c62891c
3
  size 6648