EdBerg committed on
Commit
89adcd8
1 Parent(s): 7678da6

Training in progress, step 10

Browse files
adapter_config.json CHANGED
@@ -16,17 +16,17 @@
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
18
  "peft_type": "LORA",
19
- "r": 32,
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "q_proj",
24
  "k_proj",
25
- "o_proj",
26
- "up_proj",
27
  "v_proj",
28
- "gate_proj",
29
- "down_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
18
  "peft_type": "LORA",
19
+ "r": 64,
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "gate_proj",
24
  "q_proj",
25
  "k_proj",
26
+ "down_proj",
 
27
  "v_proj",
28
+ "up_proj",
29
+ "o_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0a9694c2b0a560484b933753b1bd1481003b3091ac64b70ca0de564cfdd7c9a5
3
- size 335604696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d117f94bda35a5fe8ce444cc4a03fe11c786a11280edcc829fa69a8d576ee449
3
+ size 671149168
runs/Aug03_16-26-09_5f34e86bcde7/events.out.tfevents.1722702372.5f34e86bcde7.150.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a6b19c9b66785fb2d268343f95023d42097d0e01715d22f1eb01a7091b1f6e6
3
+ size 6129
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44ca783bcb9ef55948934fe502424c227cb8712ea19569bd734e75ca7282c744
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4ba1769befa4cef566240dc0ebc51bea6057296a99e3dacc163ebe072010d59
3
  size 5432