Update README.md
Browse files
README.md
CHANGED
@@ -103,8 +103,8 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
|
|
103 |
<tr>
|
104 |
<th>Model</th>
|
105 |
<th align="center"><strong>Supports Vision</strong></th>
|
106 |
-
<th align="center" colspan="
|
107 |
-
<th align="center" colspan="5"><strong>Multimodal
|
108 |
</tr>
|
109 |
<tr>
|
110 |
<th></th>
|
@@ -114,8 +114,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
|
|
114 |
<th align="center">liveBench</th>
|
115 |
<th align="center">IFEVAL</th>
|
116 |
<th align="center">BFCL</th>
|
117 |
-
<th align="center">MATH-500</th>
|
118 |
-
<th align="center">AIME 2024</th>
|
119 |
<th align="center">GPQA</th>
|
120 |
<th align="center">MMMU(val)</th>
|
121 |
<th align="center">MathVista(mini)</th>
|
@@ -133,8 +131,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
|
|
133 |
<td align="center">73.2</td>
|
134 |
<td align="center">82.9</td>
|
135 |
<td align="center">66.3</td>
|
136 |
-
<td align="center">94.0</td>
|
137 |
-
<td align="center">72.0</td>
|
138 |
<td align="center">61.6</td>
|
139 |
<td align="center">73.6</td>
|
140 |
<td align="center">74.0</td>
|
@@ -151,8 +147,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
|
|
151 |
<td align="center">72.5</td>
|
152 |
<td align="center">53.5</td>
|
153 |
<td align="center">—</td>
|
154 |
-
<td align="center">—</td>
|
155 |
-
<td align="center">—</td>
|
156 |
<td align="center">68.0</td>
|
157 |
<td align="center">67.0</td>
|
158 |
<td align="center">—</td>
|
@@ -167,8 +161,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
|
|
167 |
<td align="center">71.6</td>
|
168 |
<td align="center">83.3</td>
|
169 |
<td align="center">60.3</td>
|
170 |
-
<td align="center">97.3</td>
|
171 |
-
<td align="center">79.8</td>
|
172 |
<td align="center">71.5</td>
|
173 |
<td align="center">—</td>
|
174 |
<td align="center">—</td>
|
@@ -190,8 +182,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
|
|
190 |
<td align="center">—</td>
|
191 |
<td align="center">—</td>
|
192 |
<td align="center">—</td>
|
193 |
-
<td align="center">—</td>
|
194 |
-
<td align="center">—</td>
|
195 |
</tr>
|
196 |
<tr>
|
197 |
<td>GPT-o4-mini</td>
|
@@ -201,8 +191,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
|
|
201 |
<td align="center">78.1</td>
|
202 |
<td align="center">—</td>
|
203 |
<td align="center">—</td>
|
204 |
-
<td align="center">74.6</td>
|
205 |
-
<td align="center">9.3</td>
|
206 |
<td align="center">49.9</td>
|
207 |
<td align="center">81.6</td>
|
208 |
<td align="center">84.3</td>
|
@@ -211,15 +199,13 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
|
|
211 |
<td align="center">—</td>
|
212 |
</tr>
|
213 |
<tr>
|
214 |
-
<td>Claude
|
215 |
<td align="center">✅</td>
|
216 |
<td align="center">—</td>
|
217 |
<td align="center">—</td>
|
218 |
<td align="center">—</td>
|
219 |
<td align="center">—</td>
|
220 |
<td align="center">—</td>
|
221 |
-
<td align="center">78.3</td>
|
222 |
-
<td align="center">16.0</td>
|
223 |
<td align="center">65.0</td>
|
224 |
<td align="center">66.4</td>
|
225 |
<td align="center">65.3</td>
|
@@ -228,15 +214,13 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
|
|
228 |
<td align="center">—</td>
|
229 |
</tr>
|
230 |
<tr>
|
231 |
-
<td>Kimi
|
232 |
<td align="center">✅</td>
|
233 |
<td align="center">—</td>
|
234 |
<td align="center">—</td>
|
235 |
<td align="center">—</td>
|
236 |
<td align="center">—</td>
|
237 |
<td align="center">—</td>
|
238 |
-
<td align="center">96.2</td>
|
239 |
-
<td align="center">77.5</td>
|
240 |
<td align="center">—</td>
|
241 |
<td align="center">70.0</td>
|
242 |
<td align="center">74.9</td>
|
@@ -253,8 +237,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
|
|
253 |
<td align="center">—</td>
|
254 |
<td align="center">—</td>
|
255 |
<td align="center">—</td>
|
256 |
-
<td align="center">—</td>
|
257 |
-
<td align="center">—</td>
|
258 |
<td align="center">70.2</td>
|
259 |
<td align="center">74.8</td>
|
260 |
<td align="center">—</td>
|
@@ -270,8 +252,6 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
|
|
270 |
<td align="center">—</td>
|
271 |
<td align="center">—</td>
|
272 |
<td align="center">—</td>
|
273 |
-
<td align="center">—</td>
|
274 |
-
<td align="center">—</td>
|
275 |
<td align="center">70.1</td>
|
276 |
<td align="center">72.3</td>
|
277 |
<td align="center">—</td>
|
@@ -285,6 +265,7 @@ Skywork-R1V2-38B is a **state-of-the-art open-source multimodal reasoning model*
|
|
285 |
|
286 |
|
287 |
|
|
|
288 |
---
|
289 |
|
290 |
|
|
|
103 |
<tr>
|
104 |
<th>Model</th>
|
105 |
<th align="center"><strong>Supports Vision</strong></th>
|
106 |
+
<th align="center" colspan="6"><strong>Text Reasoning (%)</strong></th>
|
107 |
+
<th align="center" colspan="5"><strong>Multimodal Reasoning (%)</strong></th>
|
108 |
</tr>
|
109 |
<tr>
|
110 |
<th></th>
|
|
|
114 |
<th align="center">liveBench</th>
|
115 |
<th align="center">IFEVAL</th>
|
116 |
<th align="center">BFCL</th>
|
|
|
|
|
117 |
<th align="center">GPQA</th>
|
118 |
<th align="center">MMMU(val)</th>
|
119 |
<th align="center">MathVista(mini)</th>
|
|
|
131 |
<td align="center">73.2</td>
|
132 |
<td align="center">82.9</td>
|
133 |
<td align="center">66.3</td>
|
|
|
|
|
134 |
<td align="center">61.6</td>
|
135 |
<td align="center">73.6</td>
|
136 |
<td align="center">74.0</td>
|
|
|
147 |
<td align="center">72.5</td>
|
148 |
<td align="center">53.5</td>
|
149 |
<td align="center">—</td>
|
|
|
|
|
150 |
<td align="center">68.0</td>
|
151 |
<td align="center">67.0</td>
|
152 |
<td align="center">—</td>
|
|
|
161 |
<td align="center">71.6</td>
|
162 |
<td align="center">83.3</td>
|
163 |
<td align="center">60.3</td>
|
|
|
|
|
164 |
<td align="center">71.5</td>
|
165 |
<td align="center">—</td>
|
166 |
<td align="center">—</td>
|
|
|
182 |
<td align="center">—</td>
|
183 |
<td align="center">—</td>
|
184 |
<td align="center">—</td>
|
|
|
|
|
185 |
</tr>
|
186 |
<tr>
|
187 |
<td>GPT-o4-mini</td>
|
|
|
191 |
<td align="center">78.1</td>
|
192 |
<td align="center">—</td>
|
193 |
<td align="center">—</td>
|
|
|
|
|
194 |
<td align="center">49.9</td>
|
195 |
<td align="center">81.6</td>
|
196 |
<td align="center">84.3</td>
|
|
|
199 |
<td align="center">—</td>
|
200 |
</tr>
|
201 |
<tr>
|
202 |
+
<td>Claude 3.5 Sonnet</td>
|
203 |
<td align="center">✅</td>
|
204 |
<td align="center">—</td>
|
205 |
<td align="center">—</td>
|
206 |
<td align="center">—</td>
|
207 |
<td align="center">—</td>
|
208 |
<td align="center">—</td>
|
|
|
|
|
209 |
<td align="center">65.0</td>
|
210 |
<td align="center">66.4</td>
|
211 |
<td align="center">65.3</td>
|
|
|
214 |
<td align="center">—</td>
|
215 |
</tr>
|
216 |
<tr>
|
217 |
+
<td>Kimi k1.5 long-cot</td>
|
218 |
<td align="center">✅</td>
|
219 |
<td align="center">—</td>
|
220 |
<td align="center">—</td>
|
221 |
<td align="center">—</td>
|
222 |
<td align="center">—</td>
|
223 |
<td align="center">—</td>
|
|
|
|
|
224 |
<td align="center">—</td>
|
225 |
<td align="center">70.0</td>
|
226 |
<td align="center">74.9</td>
|
|
|
237 |
<td align="center">—</td>
|
238 |
<td align="center">—</td>
|
239 |
<td align="center">—</td>
|
|
|
|
|
240 |
<td align="center">70.2</td>
|
241 |
<td align="center">74.8</td>
|
242 |
<td align="center">—</td>
|
|
|
252 |
<td align="center">—</td>
|
253 |
<td align="center">—</td>
|
254 |
<td align="center">—</td>
|
|
|
|
|
255 |
<td align="center">70.1</td>
|
256 |
<td align="center">72.3</td>
|
257 |
<td align="center">—</td>
|
|
|
265 |
|
266 |
|
267 |
|
268 |
+
|
269 |
---
|
270 |
|
271 |
|