Model save

Files changed (5) hide show

README.md CHANGED Viewed

@@ -47,7 +47,7 @@ The following hyperparameters were used during training:
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: constant
 - lr_scheduler_warmup_ratio: 0.03
-- num_epochs: 1
 ### Training results

 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: constant
 - lr_scheduler_warmup_ratio: 0.03
+- num_epochs: 3
 ### Training results

adapter_config.json CHANGED Viewed

@@ -20,14 +20,14 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "up_proj",
-    "k_proj",
-    "v_proj",
     "q_proj",
-    "o_proj",
     "lm_head",
-    "down_proj",
-    "gate_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "down_proj",
     "q_proj",
+    "k_proj",
     "lm_head",
+    "up_proj",
+    "gate_proj",
+    "v_proj",
+    "o_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2ddd2d4279ded06df82db35b29b4ff4826e50f2ca85ab6273a08614abdf483b1
 size 608759824

 version https://git-lfs.github.com/spec/v1
+oid sha256:2bb847e0b387b8ac2052c1d3aac738f9b163c62c5e0b7367fc7ca3f27efc9965
 size 608759824

tokenizer.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "version": "1.0",
   "truncation": {
     "direction": "Right",
-    "max_length": 2200,
     "strategy": "LongestFirst",
     "stride": 0
   },

   "version": "1.0",
   "truncation": {
     "direction": "Right",
+    "max_length": 2048,
     "strategy": "LongestFirst",
     "stride": 0
   },

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:233f6807b54425a8b9f162bedd5dec21346d840c7dfb8bd4d1a0df89a9ea73bb
 size 5112

 version https://git-lfs.github.com/spec/v1
+oid sha256:6ba28abc75fdfa5fe3db8ed17f7d1f2b081ba34a74aa663f48e9138c67be2a6a
 size 5112