nilq
/

mistral-2L-tiny

Text Generation

Generated from Trainer

text-generation-inference

Inference Endpoints

Model card Files Files and versions Community

nilq committed on Mar 2, 2024

Commit

789e36a

·

verified ·

1 Parent(s): bf1abdb

End of training

Files changed (4) hide show

README.md +19 -2
all_results.json +6 -5
eval_results.json +6 -5
trainer_state.json +2 -2

README.md CHANGED Viewed

@@ -1,9 +1,23 @@
 ---
 tags:
 - generated_from_trainer
 model-index:
 - name: mistral-2L-tiny
-  results: []
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -11,7 +25,10 @@ should probably proofread and complete it, then remove this comment. -->
 # mistral-2L-tiny
-This model is a fine-tuned version of [](https://huggingface.co/) on an unknown dataset.
 ## Model description

 ---
 tags:
 - generated_from_trainer
+datasets:
+- roneneldan/TinyStories
+metrics:
+- accuracy
 model-index:
 - name: mistral-2L-tiny
+  results:
+  - task:
+      name: Causal Language Modeling
+      type: text-generation
+    dataset:
+      name: roneneldan/TinyStories
+      type: roneneldan/TinyStories
+    metrics:
+    - name: Accuracy
+      type: accuracy
+      value: 0.6174228881132772
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 # mistral-2L-tiny
+This model is a fine-tuned version of [](https://huggingface.co/) on the roneneldan/TinyStories dataset.
+It achieves the following results on the evaluation set:
+- Loss: 1.4866
+- Accuracy: 0.6174
 ## Model description

all_results.json CHANGED Viewed

@@ -1,9 +1,10 @@
 {
     "epoch": 3.0,
-    "eval_loss": 1.6980599164962769,
-    "eval_runtime": 13.6038,
     "eval_samples": 19348,
-    "eval_samples_per_second": 1422.249,
-    "eval_steps_per_second": 177.818,
-    "perplexity": 5.463337771794384
 }

 {
     "epoch": 3.0,
+    "eval_accuracy": 0.6174228881132772,
+    "eval_loss": 1.4865760803222656,
+    "eval_runtime": 25.5787,
     "eval_samples": 19348,
+    "eval_samples_per_second": 756.411,
+    "eval_steps_per_second": 94.571,
+    "perplexity": 4.421929239222526
 }

eval_results.json CHANGED Viewed

@@ -1,9 +1,10 @@
 {
     "epoch": 3.0,
-    "eval_loss": 1.6980599164962769,
-    "eval_runtime": 13.6038,
     "eval_samples": 19348,
-    "eval_samples_per_second": 1422.249,
-    "eval_steps_per_second": 177.818,
-    "perplexity": 5.463337771794384
 }

 {
     "epoch": 3.0,
+    "eval_accuracy": 0.6174228881132772,
+    "eval_loss": 1.4865760803222656,
+    "eval_runtime": 25.5787,
     "eval_samples": 19348,
+    "eval_samples_per_second": 756.411,
+    "eval_steps_per_second": 94.571,
+    "perplexity": 4.421929239222526
 }

trainer_state.json CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9bfbb8ec65bb19617df170057c0323c4f16fc175ae394e988a2ec268648155f4
-size 14515348

 version https://git-lfs.github.com/spec/v1
+oid sha256:2c1c0cfcc5fd730dd9a9e33e960f8de9d2d43e7ddb436de8a836ce1e9c62e701
+size 14524352