OrlandoHugBot committed on
Commit
62794d3
·
verified ·
1 Parent(s): 22aa9bd

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +5 -24
README.md CHANGED
@@ -103,8 +103,8 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
103
  <tr>
104
  <th>Model</th>
105
  <th align="center"><strong>Supports Vision</strong></th>
106
- <th align="center" colspan="8"><strong>Text Reasoning (%)</strong></th>
107
- <th align="center" colspan="5"><strong>Multimodal Reasoning (%)</strong></th>
108
  </tr>
109
  <tr>
110
  <th></th>
@@ -114,8 +114,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
114
  <th align="center">liveBench</th>
115
  <th align="center">IFEVAL</th>
116
  <th align="center">BFCL</th>
117
- <th align="center">MATH‑500</th>
118
- <th align="center">AIME 2024</th>
119
  <th align="center">GPQA</th>
120
  <th align="center">MMMU(val)</th>
121
  <th align="center">MathVista(mini)</th>
@@ -133,8 +131,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
133
  <td align="center">73.2</td>
134
  <td align="center">82.9</td>
135
  <td align="center">66.3</td>
136
- <td align="center">94.0</td>
137
- <td align="center">72.0</td>
138
  <td align="center">61.6</td>
139
  <td align="center">73.6</td>
140
  <td align="center">74.0</td>
@@ -151,8 +147,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
151
  <td align="center">72.5</td>
152
  <td align="center">53.5</td>
153
  <td align="center">–</td>
154
- <td align="center">–</td>
155
- <td align="center">–</td>
156
  <td align="center">68.0</td>
157
  <td align="center">67.0</td>
158
  <td align="center">–</td>
@@ -167,8 +161,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
167
  <td align="center">71.6</td>
168
  <td align="center">83.3</td>
169
  <td align="center">60.3</td>
170
- <td align="center">97.3</td>
171
- <td align="center">79.8</td>
172
  <td align="center">71.5</td>
173
  <td align="center">–</td>
174
  <td align="center">–</td>
@@ -190,8 +182,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
190
  <td align="center">–</td>
191
  <td align="center">–</td>
192
  <td align="center">–</td>
193
- <td align="center">–</td>
194
- <td align="center">–</td>
195
  </tr>
196
  <tr>
197
  <td>GPT‑o4‑mini</td>
@@ -201,8 +191,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
201
  <td align="center">78.1</td>
202
  <td align="center">–</td>
203
  <td align="center">–</td>
204
- <td align="center">74.6</td>
205
- <td align="center">9.3</td>
206
  <td align="center">49.9</td>
207
  <td align="center">81.6</td>
208
  <td align="center">84.3</td>
@@ -211,15 +199,13 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
211
  <td align="center">–</td>
212
  </tr>
213
  <tr>
214
- <td>Claude 3.5 Sonnet</td>
215
  <td align="center">✅</td>
216
  <td align="center">–</td>
217
  <td align="center">–</td>
218
  <td align="center">–</td>
219
  <td align="center">–</td>
220
  <td align="center">–</td>
221
- <td align="center">78.3</td>
222
- <td align="center">16.0</td>
223
  <td align="center">65.0</td>
224
  <td align="center">66.4</td>
225
  <td align="center">65.3</td>
@@ -228,15 +214,13 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
228
  <td align="center">–</td>
229
  </tr>
230
  <tr>
231
- <td>Kimi k1.5 long-cot</td>
232
  <td align="center">✅</td>
233
  <td align="center">–</td>
234
  <td align="center">–</td>
235
  <td align="center">–</td>
236
  <td align="center">–</td>
237
  <td align="center">–</td>
238
- <td align="center">96.2</td>
239
- <td align="center">77.5</td>
240
  <td align="center">–</td>
241
  <td align="center">70.0</td>
242
  <td align="center">74.9</td>
@@ -253,8 +237,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
253
  <td align="center">–</td>
254
  <td align="center">–</td>
255
  <td align="center">–</td>
256
- <td align="center">–</td>
257
- <td align="center">–</td>
258
  <td align="center">70.2</td>
259
  <td align="center">74.8</td>
260
  <td align="center">–</td>
@@ -270,8 +252,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
270
  <td align="center">–</td>
271
  <td align="center">–</td>
272
  <td align="center">–</td>
273
- <td align="center">–</td>
274
- <td align="center">–</td>
275
  <td align="center">70.1</td>
276
  <td align="center">72.3</td>
277
  <td align="center">–</td>
@@ -285,6 +265,7 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
285
 
286
 
287
 
 
288
  ---
289
 
290
 
 
103
  <tr>
104
  <th>Model</th>
105
  <th align="center"><strong>Supports Vision</strong></th>
106
+ <th align="center" colspan="6"><strong>Text Reasoning (%)</strong></th>
107
+ <th align="center" colspan="5"><strong>Multimodal Reasoning (%)</strong></th>
108
  </tr>
109
  <tr>
110
  <th></th>
 
114
  <th align="center">liveBench</th>
115
  <th align="center">IFEVAL</th>
116
  <th align="center">BFCL</th>
 
 
117
  <th align="center">GPQA</th>
118
  <th align="center">MMMU(val)</th>
119
  <th align="center">MathVista(mini)</th>
 
131
  <td align="center">73.2</td>
132
  <td align="center">82.9</td>
133
  <td align="center">66.3</td>
 
 
134
  <td align="center">61.6</td>
135
  <td align="center">73.6</td>
136
  <td align="center">74.0</td>
 
147
  <td align="center">72.5</td>
148
  <td align="center">53.5</td>
149
  <td align="center">–</td>
 
 
150
  <td align="center">68.0</td>
151
  <td align="center">67.0</td>
152
  <td align="center">–</td>
 
161
  <td align="center">71.6</td>
162
  <td align="center">83.3</td>
163
  <td align="center">60.3</td>
 
 
164
  <td align="center">71.5</td>
165
  <td align="center">–</td>
166
  <td align="center">–</td>
 
182
  <td align="center">–</td>
183
  <td align="center">–</td>
184
  <td align="center">–</td>
 
 
185
  </tr>
186
  <tr>
187
  <td>GPT‑o4‑mini</td>
 
191
  <td align="center">78.1</td>
192
  <td align="center">–</td>
193
  <td align="center">–</td>
 
 
194
  <td align="center">49.9</td>
195
  <td align="center">81.6</td>
196
  <td align="center">84.3</td>
 
199
  <td align="center">–</td>
200
  </tr>
201
  <tr>
202
+ <td>Claude 3.5 Sonnet</td>
203
  <td align="center">✅</td>
204
  <td align="center">–</td>
205
  <td align="center">–</td>
206
  <td align="center">–</td>
207
  <td align="center">–</td>
208
  <td align="center">–</td>
 
 
209
  <td align="center">65.0</td>
210
  <td align="center">66.4</td>
211
  <td align="center">65.3</td>
 
214
  <td align="center">–</td>
215
  </tr>
216
  <tr>
217
+ <td>Kimi k1.5 long-cot</td>
218
  <td align="center">✅</td>
219
  <td align="center">–</td>
220
  <td align="center">–</td>
221
  <td align="center">–</td>
222
  <td align="center">–</td>
223
  <td align="center">–</td>
 
 
224
  <td align="center">–</td>
225
  <td align="center">70.0</td>
226
  <td align="center">74.9</td>
 
237
  <td align="center">–</td>
238
  <td align="center">–</td>
239
  <td align="center">–</td>
 
 
240
  <td align="center">70.2</td>
241
  <td align="center">74.8</td>
242
  <td align="center">–</td>
 
252
  <td align="center">–</td>
253
  <td align="center">–</td>
254
  <td align="center">–</td>
 
 
255
  <td align="center">70.1</td>
256
  <td align="center">72.3</td>
257
  <td align="center">–</td>
 
265
 
266
 
267
 
268
+
269
  ---
270
 
271