kevinautomation/Llama-2-7b-hf_project_ask_reddit

Browse files

Files changed (8)

README.md +28 -29
adapter_config.json +3 -3
adapter_model.safetensors +2 -2
runs/Feb04_01-12-08_6976d1dd0e6d/events.out.tfevents.1707009170.6976d1dd0e6d.804.0 +3 -0
special_tokens_map.json +3 -3
tokenizer.json +3 -3
tokenizer_config.json +3 -4
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -1,5 +1,4 @@
 ---
-license: apache-2.0
 library_name: peft
 tags:
 - trl
@@ -7,7 +6,7 @@ tags:
 - generated_from_trainer
 datasets:
 - generator
-base_model: TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T
 model-index:
 - name: tiny_llama_instruct_generation
   results: []
@@ -18,9 +17,9 @@ should probably proofread and complete it, then remove this comment. -->
 # tiny_llama_instruct_generation
-This model is a fine-tuned version of [TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T](https://huggingface.co/TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T) on the generator dataset.
 It achieves the following results on the evaluation set:
-- Loss: 2.0948
 ## Model description
@@ -52,31 +51,31 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| 2.3941        | 0.01  | 20   | 2.3714          |
-| 2.3059        | 0.01  | 40   | 2.2499          |
-| 2.2079        | 0.02  | 60   | 2.2003          |
-| 2.1916        | 0.02  | 80   | 2.1705          |
-| 2.1766        | 0.03  | 100  | 2.1457          |
-| 2.1583        | 0.03  | 120  | 2.1343          |
-| 2.1204        | 0.04  | 140  | 2.1238          |
-| 2.1493        | 0.04  | 160  | 2.1187          |
-| 2.1408        | 0.05  | 180  | 2.1145          |
-| 2.1331        | 0.06  | 200  | 2.1116          |
-| 2.1736        | 0.06  | 220  | 2.1094          |
-| 2.1299        | 0.07  | 240  | 2.1072          |
-| 2.1389        | 0.07  | 260  | 2.1050          |
-| 2.1164        | 0.08  | 280  | 2.1050          |
-| 2.1115        | 0.08  | 300  | 2.1040          |
-| 2.1139        | 0.09  | 320  | 2.1024          |
-| 2.1158        | 0.1   | 340  | 2.1021          |
-| 2.1342        | 0.1   | 360  | 2.1001          |
-| 2.1006        | 0.11  | 380  | 2.0989          |
-| 2.1287        | 0.11  | 400  | 2.0990          |
-| 2.1287        | 0.12  | 420  | 2.0975          |
-| 2.1573        | 0.12  | 440  | 2.0967          |
-| 2.119         | 0.13  | 460  | 2.0948          |
-| 2.1301        | 0.13  | 480  | 2.0947          |
-| 2.0913        | 0.14  | 500  | 2.0948          |
 ### Framework versions

 ---
 library_name: peft
 tags:
 - trl
 - generated_from_trainer
 datasets:
 - generator
+base_model: NousResearch/Llama-2-7b-hf
 model-index:
 - name: tiny_llama_instruct_generation
   results: []
 # tiny_llama_instruct_generation
+This model is a fine-tuned version of [NousResearch/Llama-2-7b-hf](https://huggingface.co/NousResearch/Llama-2-7b-hf) on the generator dataset.
 It achieves the following results on the evaluation set:
+- Loss: 1.8500
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| 2.0445        | 0.01  | 20   | 2.0291          |
+| 1.9813        | 0.01  | 40   | 1.9775          |
+| 1.9752        | 0.02  | 60   | 1.9477          |
+| 1.953         | 0.02  | 80   | 1.8977          |
+| 1.9054        | 0.03  | 100  | 1.8774          |
+| 1.8665        | 0.03  | 120  | 1.8699          |
+| 1.845         | 0.04  | 140  | 1.8648          |
+| 1.8487        | 0.04  | 160  | 1.8626          |
+| 1.8557        | 0.05  | 180  | 1.8604          |
+| 1.8451        | 0.06  | 200  | 1.8589          |
+| 1.8557        | 0.06  | 220  | 1.8578          |
+| 1.7733        | 0.07  | 240  | 1.8570          |
+| 1.8652        | 0.07  | 260  | 1.8562          |
+| 1.8178        | 0.08  | 280  | 1.8552          |
+| 1.8102        | 0.08  | 300  | 1.8546          |
+| 1.8275        | 0.09  | 320  | 1.8541          |
+| 1.8405        | 0.1   | 340  | 1.8533          |
+| 1.8319        | 0.1   | 360  | 1.8530          |
+| 1.8411        | 0.11  | 380  | 1.8526          |
+| 1.8562        | 0.11  | 400  | 1.8520          |
+| 1.8505        | 0.12  | 420  | 1.8516          |
+| 1.8132        | 0.12  | 440  | 1.8514          |
+| 1.901         | 0.13  | 460  | 1.8509          |
+| 1.8138        | 0.13  | 480  | 1.8506          |
+| 1.8209        | 0.14  | 500  | 1.8500          |
 ### Framework versions

adapter_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
@@ -19,8 +19,8 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "v_proj",
-    "q_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_rslora": false

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": "NousResearch/Llama-2-7b-hf",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "q_proj",
+    "v_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_rslora": false

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3452543d7cb24130d26ed546534699a11ceaf6dfc88e8e5fb48d7dae4a505108
-size 36056608

 version https://git-lfs.github.com/spec/v1
+oid sha256:c122dee7a9ae92cd90008bf108857a8af499ffe96942bfb829c5c233fddf4f7b
+size 134235048

runs/Feb04_01-12-08_6976d1dd0e6d/events.out.tfevents.1707009170.6976d1dd0e6d.804.0 ADDED Viewed

@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d0586d35c962bb2ef1363b03f4a98e819c9f2586d3b1337ab578a22a897a03d8
+size 19761

special_tokens_map.json CHANGED Viewed

@@ -2,14 +2,14 @@
   "bos_token": {
     "content": "<s>",
     "lstrip": false,
-    "normalized": false,
     "rstrip": false,
     "single_word": false
   },
   "eos_token": {
     "content": "</s>",
     "lstrip": false,
-    "normalized": false,
     "rstrip": false,
     "single_word": false
   },
@@ -17,7 +17,7 @@
   "unk_token": {
     "content": "<unk>",
     "lstrip": false,
-    "normalized": false,
     "rstrip": false,
     "single_word": false
   }

   "bos_token": {
     "content": "<s>",
     "lstrip": false,
+    "normalized": true,
     "rstrip": false,
     "single_word": false
   },
   "eos_token": {
     "content": "</s>",
     "lstrip": false,
+    "normalized": true,
     "rstrip": false,
     "single_word": false
   },
   "unk_token": {
     "content": "<unk>",
     "lstrip": false,
+    "normalized": true,
     "rstrip": false,
     "single_word": false
   }

tokenizer.json CHANGED Viewed

@@ -9,7 +9,7 @@
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
-      "normalized": false,
       "special": true
     },
     {
@@ -18,7 +18,7 @@
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
-      "normalized": false,
       "special": true
     },
     {
@@ -27,7 +27,7 @@
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
-      "normalized": false,
       "special": true
     }
   ],

       "single_word": false,
       "lstrip": false,
       "rstrip": false,
+      "normalized": true,
       "special": true
     },
     {
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
+      "normalized": true,
       "special": true
     },
     {
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
+      "normalized": true,
       "special": true
     }
   ],

tokenizer_config.json CHANGED Viewed

@@ -5,7 +5,7 @@
     "0": {
       "content": "<unk>",
       "lstrip": false,
-      "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
@@ -13,7 +13,7 @@
     "1": {
       "content": "<s>",
       "lstrip": false,
-      "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
@@ -21,7 +21,7 @@
     "2": {
       "content": "</s>",
       "lstrip": false,
-      "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
@@ -33,7 +33,6 @@
   "legacy": false,
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "</s>",
-  "padding_side": "right",
   "sp_model_kwargs": {},
   "tokenizer_class": "LlamaTokenizer",
   "unk_token": "<unk>",

     "0": {
       "content": "<unk>",
       "lstrip": false,
+      "normalized": true,
       "rstrip": false,
       "single_word": false,
       "special": true
     "1": {
       "content": "<s>",
       "lstrip": false,
+      "normalized": true,
       "rstrip": false,
       "single_word": false,
       "special": true
     "2": {
       "content": "</s>",
       "lstrip": false,
+      "normalized": true,
       "rstrip": false,
       "single_word": false,
       "special": true
   "legacy": false,
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "</s>",
   "sp_model_kwargs": {},
   "tokenizer_class": "LlamaTokenizer",
   "unk_token": "<unk>",

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:23f0d3c3cd1af20ed00bb7c4d7339e6b0311d0b11de480f9e23c4938db40659a
 size 4728

 version https://git-lfs.github.com/spec/v1
+oid sha256:0713c92267567d8229e9fac0277db9a43929d8b595862660d804c148f41aa96b
 size 4728