mkurman committed on
Commit
8219d42
1 Parent(s): 01bab5f

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +0 -159
README.md CHANGED
@@ -14,137 +14,6 @@ datasets:
14
  - WizardLMTeam/WizardLM_evol_instruct_V2_196k
15
  - ProlificAI/social-reasoning-rlhf
16
  pipeline_tag: text-generation
17
- model-index:
18
- - name: Llama-3.2-SUN-2.4B-v1.0.0
19
- results:
20
- - task:
21
- type: text-generation
22
- name: Text Generation
23
- dataset:
24
- name: IFEval (0-Shot)
25
- type: HuggingFaceH4/ifeval
26
- args:
27
- num_few_shot: 0
28
- metrics:
29
- - type: inst_level_strict_acc and prompt_level_strict_acc
30
- value: 56.37
31
- name: strict accuracy
32
- - type: inst_level_strict_acc and prompt_level_strict_acc
33
- value: 55.37
34
- name: strict accuracy
35
- - type: inst_level_strict_acc and prompt_level_strict_acc
36
- value: 55.37
37
- name: strict accuracy
38
- source:
39
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=meditsolutions/Llama-3.2-SUN-2.4B-v1.0.0
40
- name: Open LLM Leaderboard
41
- - task:
42
- type: text-generation
43
- name: Text Generation
44
- dataset:
45
- name: BBH (3-Shot)
46
- type: BBH
47
- args:
48
- num_few_shot: 3
49
- metrics:
50
- - type: acc_norm
51
- value: 7.21
52
- name: normalized accuracy
53
- - type: acc_norm
54
- value: 7.17
55
- name: normalized accuracy
56
- - type: acc_norm
57
- value: 7.17
58
- name: normalized accuracy
59
- source:
60
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=meditsolutions/Llama-3.2-SUN-2.4B-v1.0.0
61
- name: Open LLM Leaderboard
62
- - task:
63
- type: text-generation
64
- name: Text Generation
65
- dataset:
66
- name: MATH Lvl 5 (4-Shot)
67
- type: hendrycks/competition_math
68
- args:
69
- num_few_shot: 4
70
- metrics:
71
- - type: exact_match
72
- value: 4.83
73
- name: exact match
74
- - type: exact_match
75
- value: 1.28
76
- name: exact match
77
- - type: exact_match
78
- value: 1.28
79
- name: exact match
80
- source:
81
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=meditsolutions/Llama-3.2-SUN-2.4B-v1.0.0
82
- name: Open LLM Leaderboard
83
- - task:
84
- type: text-generation
85
- name: Text Generation
86
- dataset:
87
- name: GPQA (0-shot)
88
- type: Idavidrein/gpqa
89
- args:
90
- num_few_shot: 0
91
- metrics:
92
- - type: acc_norm
93
- value: 1.01
94
- name: acc_norm
95
- - type: acc_norm
96
- value: 0.45
97
- name: acc_norm
98
- - type: acc_norm
99
- value: 0.45
100
- name: acc_norm
101
- source:
102
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=meditsolutions/Llama-3.2-SUN-2.4B-v1.0.0
103
- name: Open LLM Leaderboard
104
- - task:
105
- type: text-generation
106
- name: Text Generation
107
- dataset:
108
- name: MuSR (0-shot)
109
- type: TAUR-Lab/MuSR
110
- args:
111
- num_few_shot: 0
112
- metrics:
113
- - type: acc_norm
114
- value: 3.02
115
- name: acc_norm
116
- - type: acc_norm
117
- value: 0.13
118
- name: acc_norm
119
- - type: acc_norm
120
- value: 0.13
121
- name: acc_norm
122
- source:
123
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=meditsolutions/Llama-3.2-SUN-2.4B-v1.0.0
124
- name: Open LLM Leaderboard
125
- - task:
126
- type: text-generation
127
- name: Text Generation
128
- dataset:
129
- name: MMLU-PRO (5-shot)
130
- type: TIGER-Lab/MMLU-Pro
131
- config: main
132
- split: test
133
- args:
134
- num_few_shot: 5
135
- metrics:
136
- - type: acc
137
- value: 6.03
138
- name: accuracy
139
- - type: acc
140
- value: 7.17
141
- name: accuracy
142
- - type: acc
143
- value: 7.17
144
- name: accuracy
145
- source:
146
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=meditsolutions/Llama-3.2-SUN-2.4B-v1.0.0
147
- name: Open LLM Leaderboard
148
  ---
149
 
150
  # MedIT SUN 2.5B
@@ -183,31 +52,3 @@ As the model is still in training, performance and capabilities may vary. Users
183
 
184
  **Disclaimer and Safety Considerations**
185
  The Model is designed to be used as a smart assistant but not as a knowledge source within your applications, systems, or environments. It is not intended to provide 100% accurate answers, especially in scenarios where high precision and accuracy are
186
-
187
- # [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard)
188
- Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/details_meditsolutions__Llama-3.2-SUN-2.5B-chat)
189
-
190
- | Metric |Value|
191
- |-------------------|----:|
192
- |Avg. |11.93|
193
- |IFEval (0-Shot) |55.37|
194
- |BBH (3-Shot) | 7.17|
195
- |MATH Lvl 5 (4-Shot)| 1.28|
196
- |GPQA (0-shot) | 0.45|
197
- |MuSR (0-shot) | 0.13|
198
- |MMLU-PRO (5-shot) | 7.17|
199
-
200
-
201
- # [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard)
202
- Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/details_meditsolutions__Llama-3.2-SUN-2.5B-chat)
203
-
204
- | Metric |Value|
205
- |-------------------|----:|
206
- |Avg. |11.93|
207
- |IFEval (0-Shot) |55.37|
208
- |BBH (3-Shot) | 7.17|
209
- |MATH Lvl 5 (4-Shot)| 1.28|
210
- |GPQA (0-shot) | 0.45|
211
- |MuSR (0-shot) | 0.13|
212
- |MMLU-PRO (5-shot) | 7.17|
213
-
 
14
  - WizardLMTeam/WizardLM_evol_instruct_V2_196k
15
  - ProlificAI/social-reasoning-rlhf
16
  pipeline_tag: text-generation
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
17
  ---
18
 
19
  # MedIT SUN 2.5B
 
52
 
53
  **Disclaimer and Safety Considerations**
54
  The Model is designed to be used as a smart assistant but not as a knowledge source within your applications, systems, or environments. It is not intended to provide 100% accurate answers, especially in scenarios where high precision and accuracy are