Femboyuwu2000 committed on
Commit
86f2869
1 Parent(s): 8d52a96

Training in progress, step 20, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -20,9 +20,8 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "dense_h_to_4h",
24
  "word_embeddings",
25
- "query_key_valuelm_head"
26
  ],
27
  "task_type": "CAUSAL_LM",
28
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "word_embeddings",
24
+ "query_key_value"
25
  ],
26
  "task_type": "CAUSAL_LM",
27
  "use_dora": false,
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b6b239758e5710fe78fd10d067ef696b9ecf7a57962dcbfc99ea16b5f0f15474
3
- size 13982248
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:386f7859b4de007c7ae7c61ec6cb00a515d4711ba21b1c67d45d80097a8fa61d
3
+ size 12803224
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:240c436b277f674752c771cab6fecf23fb9c30d6346d1eae1b590cffdd9c7a4a
3
- size 1128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa0685b12efbb09b894e2972c18a08bca793a00db99b574a7e0547cacf1ffdbf
3
+ size 6472698
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:357fbaa636c40c1254d97d309539cc9555b5fab8ffbe087025279d50feec0849
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4435a7825b6133e5243ce242cb736cca7675210c39cbc95a71b79603a1500997
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f582b354f682a1388049ebe7692fec43d44fc4825862e8f8a7d835e907b849a9
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f4b34a50c55a680830f99a77a52585bb05290e33d30ce86746475157ba56d09
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.0002830335536277826,
5
  "eval_steps": 500,
6
  "global_step": 20,
7
  "is_hyper_param_search": false,
@@ -10,9 +10,9 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.0,
13
- "grad_norm": 0.0,
14
  "learning_rate": 0.0,
15
- "loss": 3.5917,
16
  "step": 20
17
  }
18
  ],
@@ -21,8 +21,8 @@
21
  "num_input_tokens_seen": 0,
22
  "num_train_epochs": 1,
23
  "save_steps": 20,
24
- "total_flos": 49799375290368.0,
25
- "train_batch_size": 8,
26
  "trial_name": null,
27
  "trial_params": null
28
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.1130100472399276e-05,
5
  "eval_steps": 500,
6
  "global_step": 20,
7
  "is_hyper_param_search": false,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.0,
13
+ "grad_norm": 55.33664321899414,
14
  "learning_rate": 0.0,
15
+ "loss": 3.9798,
16
  "step": 20
17
  }
18
  ],
 
21
  "num_input_tokens_seen": 0,
22
  "num_train_epochs": 1,
23
  "save_steps": 20,
24
+ "total_flos": 17506699161600.0,
25
+ "train_batch_size": 1,
26
  "trial_name": null,
27
  "trial_params": null
28
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b6c34bfd1caa32715f73ad2763e8f79f467c0f7f673199f1db21d933e08b71a2
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aafe4b5783fda09fa4658a5b32dd84824c708b77a0e76c309db11ad31ee86141
3
  size 4984