nblinh committed on
Commit
51b7662
·
verified ·
1 Parent(s): 041a05a

End of training

Browse files
README.md CHANGED
@@ -105,7 +105,7 @@ xformers_attention: true
105
 
106
  This model is a fine-tuned version of [VAGOsolutions/Llama-3.1-SauerkrautLM-8b-Instruct](https://huggingface.co/VAGOsolutions/Llama-3.1-SauerkrautLM-8b-Instruct) on the None dataset.
107
  It achieves the following results on the evaluation set:
108
- - Loss: 0.6540
109
 
110
  ## Model description
111
 
@@ -137,7 +137,7 @@ The following hyperparameters were used during training:
137
 
138
  | Training Loss | Epoch | Step | Validation Loss |
139
  |:-------------:|:------:|:----:|:---------------:|
140
- | 0.4057 | 0.0009 | 10 | 0.6540 |
141
 
142
 
143
  ### Framework versions
 
105
 
106
  This model is a fine-tuned version of [VAGOsolutions/Llama-3.1-SauerkrautLM-8b-Instruct](https://huggingface.co/VAGOsolutions/Llama-3.1-SauerkrautLM-8b-Instruct) on the None dataset.
107
  It achieves the following results on the evaluation set:
108
+ - Loss: 0.6444
109
 
110
  ## Model description
111
 
 
137
 
138
  | Training Loss | Epoch | Step | Validation Loss |
139
  |:-------------:|:------:|:----:|:---------------:|
140
+ | 0.49 | 0.0009 | 10 | 0.6444 |
141
 
142
 
143
  ### Framework versions
adapter_config.json CHANGED
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "q_proj",
24
  "gate_proj",
25
- "k_proj",
26
- "o_proj",
27
  "down_proj",
 
 
 
28
  "v_proj",
29
- "up_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "gate_proj",
 
 
24
  "down_proj",
25
+ "up_proj",
26
+ "o_proj",
27
+ "k_proj",
28
  "v_proj",
29
+ "q_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d4d9f47c72103b77b08b72a2f2245620cd9ab4940370add92323bbcf81d568b
3
  size 167934026
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91449ae67b8632099d2b659d98eda2a02bb34154b01e0f786c080457f65e942a
3
  size 167934026
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bbd064c624155f4cb578cb0a690bba8bdfcccbfedc897f77e08dfbed72993b0c
3
  size 167832240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:667caf91752ffe9db39f5b00742e477b4ce371b95d0e04943747f0695278f49d
3
  size 167832240
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ecf9758ae99633e58b0d4a82d74cbc826c9b0dd8e8befb80c4f276ba231ad3b0
3
  size 6776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3f0f9fa537a4e1865c58c91bdacc639be08d5aede552f6054ce9954bbd6793c
3
  size 6776