Femboyuwu2000 commited on
Commit
7ab5bba
1 Parent(s): d658d44

Training in progress, step 380, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:55fbe6b68371476a49a5dcf47cb5f9d87019cedff7dbfeba90f3bd7c5af98334
3
  size 13982248
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53e100046bad02aa8795bb6d5922495b27c88ed4948d14bbd2da713babe5699f
3
  size 13982248
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8dc0adaf7cde965efef091b643e2b3d0711b0799235ea64091a8320ceeb4047b
3
  size 7062522
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c261a4d2f0733eaa1f3af190df879fff54eedd114cfa803ade74c2c83d00ea45
3
  size 7062522
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a768f08cb42c9ce59ce3607be711941a2de1bfe32b4b4e516fea093f13486afb
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0104c2c25b80b05f4aa46359191df58367bf4b542ff4aabbd3f340ab0f62cf58
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cf59311c497c1cc7e6cd717401fb1271b7c3333ced1b25ea886a7983f576a568
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4f8e4820960fcfc3b001f4fae5172b0e153f358171368526c212f8f5dffa68f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.0288,
5
  "eval_steps": 500,
6
- "global_step": 360,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -133,6 +133,13 @@
133
  "learning_rate": 1.8e-05,
134
  "loss": 4.0832,
135
  "step": 360
 
 
 
 
 
 
 
136
  }
137
  ],
138
  "logging_steps": 20,
@@ -140,7 +147,7 @@
140
  "num_input_tokens_seen": 0,
141
  "num_train_epochs": 2,
142
  "save_steps": 20,
143
- "total_flos": 865682421055488.0,
144
  "train_batch_size": 8,
145
  "trial_name": null,
146
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.0304,
5
  "eval_steps": 500,
6
+ "global_step": 380,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
133
  "learning_rate": 1.8e-05,
134
  "loss": 4.0832,
135
  "step": 360
136
+ },
137
+ {
138
+ "epoch": 0.03,
139
+ "grad_norm": 28.68460464477539,
140
+ "learning_rate": 1.9e-05,
141
+ "loss": 3.9827,
142
+ "step": 380
143
  }
144
  ],
145
  "logging_steps": 20,
 
147
  "num_input_tokens_seen": 0,
148
  "num_train_epochs": 2,
149
  "save_steps": 20,
150
+ "total_flos": 911840340049920.0,
151
  "train_batch_size": 8,
152
  "trial_name": null,
153
  "trial_params": null