kamilmuratyilmaz committed on
Commit
d236873
1 Parent(s): 489e5c7

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +100 -24
README.md CHANGED
@@ -12,31 +12,107 @@ language:
12
  pipeline_tag: text2text-generation
13
  base_model: mistralai/Mistral-7B-v0.3
14
 
 
15
  model-index:
16
- - name: cymist-2-v03-SFT
17
- results:
18
- - task:
19
- type: text-generation
20
- metrics:
21
- - name: ARC (25-Shot)
22
- type: arc_challenge (25-Shot)
23
- value: 59.12
24
- - name: Hellaswag (10-Shot)
25
- type: Hellaswag (10-Shot)
26
- value: 82.56
27
- - name: TruthfulQA
28
- type: TruthfulQA
29
- value: 52.12
30
- - name: GSM8K (5-Shot)
31
- type: GSM8K (5-Shot)
32
- value: 36.61
33
- - name: Winogrande (5-Shot)
34
- type: Winogrande (5-Shot)
35
- value: 77.43
36
- - name: MMLU (5-Shot)
37
- type: MMLU (5-Shot)
38
- value: 62.65
39
-
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
40
 
41
  ---
42
  # Model Card for Cymist2-v0.3-SFT
 
12
  pipeline_tag: text2text-generation
13
  base_model: mistralai/Mistral-7B-v0.3
14
 
15
+
16
  model-index:
17
+ - name: cymist-2-v03-SFT
18
+ results:
19
+ - task:
20
+ type: text-generation
21
+ name: Text Generation
22
+ dataset:
23
+ name: AI2 Reasoning Challenge (25-Shot)
24
+ type: ai2_arc
25
+ config: ARC-Challenge
26
+ split: test
27
+ args:
28
+ num_few_shot: 25
29
+ metrics:
30
+ - type: acc_norm
31
+ value: 59.12
32
+ name: normalized accuracy
33
+ source:
34
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=cypienai/cymist-2-v03-SFT
35
+ name: Open LLM Leaderboard
36
+ - task:
37
+ type: text-generation
38
+ name: Text Generation
39
+ dataset:
40
+ name: HellaSwag (10-Shot)
41
+ type: hellaswag
42
+ split: validation
43
+ args:
44
+ num_few_shot: 10
45
+ metrics:
46
+ - type: acc_norm
47
+ value: 82.56
48
+ name: normalized accuracy
49
+ source:
50
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=cypienai/cymist-2-v03-SFT
51
+ name: Open LLM Leaderboard
52
+ - task:
53
+ type: text-generation
54
+ name: Text Generation
55
+ dataset:
56
+ name: TruthfulQA (0-shot)
57
+ type: truthful_qa
58
+ config: multiple_choice
59
+ split: validation
60
+ args:
61
+ num_few_shot: 0
62
+ metrics:
63
+ - type: mc2
64
+ value: 52.12
65
+ source:
66
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=cypienai/cymist-2-v03-SFT
67
+ name: Open LLM Leaderboard
68
+ - task:
69
+ type: text-generation
70
+ name: Text Generation
71
+ dataset:
72
+ name: GSM8k (5-shot)
73
+ type: gsm8k
74
+ config: main
75
+ split: test
76
+ args:
77
+ num_few_shot: 5
78
+ metrics:
79
+ - type: acc
80
+ value: 36.61
81
+ name: accuracy
82
+ source:
83
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=cypienai/cymist-2-v03-SFT
84
+ name: Open LLM Leaderboard
85
+ - task:
86
+ type: text-generation
87
+ name: Text Generation
88
+ dataset:
89
+ name: Winogrande (5-shot)
90
+ type: winogrande
91
+ config: winogrande_xl
92
+ split: validation
93
+ args:
94
+ num_few_shot: 5
95
+ metrics:
96
+ - type: acc
97
+ value: 77.43
98
+ name: accuracy
99
+ source:
100
+ url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=cypienai/cymist-2-v03-SFT
101
+ name: Open LLM Leaderboard
102
+ - task:
103
+ type: text-generation
104
+ name: Text Generation
105
+ dataset:
106
+ name: MMLU (5-Shot)
107
+ type: cais/mmlu
108
+ config: all
109
+ split: test
110
+ args:
111
+ num_few_shot: 5
112
+ metrics:
113
+ - type: acc
114
+ value: 62.65
115
+ name: accuracy
116
 
117
  ---
118
  # Model Card for Cymist2-v0.3-SFT