Update README.md
Browse files
README.md
CHANGED
@@ -146,13 +146,13 @@ In this example, the model needs to understand and generate a coherent conversat
|
|
146 |
| Tasks |Version| Filter |n-shot| Metric | |Value | |Stderr|
|
147 |
|-----------------|-------|----------------|-----:|-----------|---|-----:|---|------|
|
148 |
|tinyBenchmarks | N/A| | | | | | | |
|
149 |
-
| - tinyArc | 0|none | 25|acc_norm |↑ |0.
|
150 |
-
| - tinyGSM8k | 0|flexible-extract| 5|exact_match|↑ |0.
|
151 |
-
| | |strict-match | 5|exact_match|↑ |0.
|
152 |
-
| - tinyHellaswag | 0|none | 10|acc_norm |↑ |0.
|
153 |
-
| - tinyMMLU | 0|none | 0|acc_norm |↑ |0.
|
154 |
-
| - tinyTruthfulQA| 0|none | 0|acc |↑ |0.
|
155 |
-
| - tinyWinogrande| 0|none | 5|acc_norm |↑ |0.
|
156 |
|
157 |
### Training Command
|
158 |
|
|
|
146 |
| Tasks |Version| Filter |n-shot| Metric | |Value | |Stderr|
|
147 |
|-----------------|-------|----------------|-----:|-----------|---|-----:|---|------|
|
148 |
|tinyBenchmarks | N/A| | | | | | | |
|
149 |
+
| - tinyArc | 0|none | 25|acc_norm |↑ |0.5821|± | N/A|
|
150 |
+
| - tinyGSM8k | 0|flexible-extract| 5|exact_match|↑ |0.4989|± | N/A|
|
151 |
+
| | |strict-match | 5|exact_match|↑ |0.4867|± | N/A|
|
152 |
+
| - tinyHellaswag | 0|none | 10|acc_norm |↑ |0.8307|± | N/A|
|
153 |
+
| - tinyMMLU | 0|none | 0|acc_norm |↑ |0.6651|± | N/A|
|
154 |
+
| - tinyTruthfulQA| 0|none | 0|acc |↑ |0.4991|± | N/A|
|
155 |
+
| - tinyWinogrande| 0|none | 5|acc_norm |↑ |0.7558|± | N/A|
|
156 |
|
157 |
### Training Command
|
158 |
|