Femboyuwu2000 committed on
Commit
abf420e
1 Parent(s): 720031a

Training in progress, step 60, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -20,8 +20,8 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "query_key_valuelm_head",
24
- "word_embeddings"
25
  ],
26
  "task_type": "CAUSAL_LM",
27
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "word_embeddings",
24
+ "query_key_valuelm_head"
25
  ],
26
  "task_type": "CAUSAL_LM",
27
  "use_dora": false,
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de52612f18d94eb85267cdbaa87cfac914b5a3415370220f048ff6627b5dc973
3
  size 8077608
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b5e1d7fec5642c5a7eebc261811b86c8379352efb270f0d53c3bdd0277083ab
3
  size 8077608
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7da0cccb26e635a9bb8fe359b98f58b1fe7d55939c5f6f51514ca872caa19e9
3
  size 4052500
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c295c871992ea2658a9d7ad487d59b40db23c7cfbb6615cf5f83edf6deb52d2c
3
  size 4052500
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:386fcc8cc1089aade9450d86fb239ea3483f455fd2d78d8378645feecfec9d69
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:384b1441690cc32db0a09ece90eb10816e434402fb6deac7559104dc40fcf585
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:960f0c2ec75c7a0d06bf09f5118049f84af6550acbf637b5ec1d7409c50149b7
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b215c0947378bd341b267cea5a7112696ec035345c849e38fb6a3c58f28d2185
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -10,28 +10,28 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.0,
13
- "grad_norm": 87.1609115600586,
14
- "learning_rate": 2.341780598043574e-05,
15
- "loss": 4.6745,
16
  "step": 20
17
  },
18
  {
19
  "epoch": 0.0,
20
- "grad_norm": 226.922119140625,
21
- "learning_rate": 7.97387338950315e-06,
22
- "loss": 4.5875,
23
  "step": 40
24
  },
25
  {
26
  "epoch": 0.0,
27
- "grad_norm": 86.45769500732422,
28
- "learning_rate": 0.0,
29
- "loss": 4.8834,
30
  "step": 60
31
  }
32
  ],
33
  "logging_steps": 20,
34
- "max_steps": 60,
35
  "num_input_tokens_seen": 0,
36
  "num_train_epochs": 1,
37
  "save_steps": 20,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.0,
13
+ "grad_norm": 79.12922668457031,
14
+ "learning_rate": 1e-06,
15
+ "loss": 4.6771,
16
  "step": 20
17
  },
18
  {
19
  "epoch": 0.0,
20
+ "grad_norm": 239.7991943359375,
21
+ "learning_rate": 2e-06,
22
+ "loss": 4.5023,
23
  "step": 40
24
  },
25
  {
26
  "epoch": 0.0,
27
+ "grad_norm": 77.5164794921875,
28
+ "learning_rate": 3e-06,
29
+ "loss": 4.8171,
30
  "step": 60
31
  }
32
  ],
33
  "logging_steps": 20,
34
+ "max_steps": 20000,
35
  "num_input_tokens_seen": 0,
36
  "num_train_epochs": 1,
37
  "save_steps": 20,
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83256b55088d45d0ebeda1319a91e9b247c70b5f4d82cb04a018aa4a684554bc
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32e994f25267341e613f4d352977cc7a2847de358db5ece7a60fcf21be944170
3
  size 4984