kz-transformers committed on
Commit
bdcd265
·
verified ·
1 Parent(s): 266420a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +106 -2
app.py CHANGED
@@ -225,9 +225,113 @@ def aggregate_leaderboard_data():
225
  "kk_biology_unt_mc": 0.22330729166666666,
226
  "kk_human_society_rights_unt_mc": 0.242152466367713,
227
  },
228
- # ...(rest of your baseline entries)...
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
229
  ]
230
-
231
  files_list = glob.glob("./m_data/model_data/external/*.json")
232
  logging.info(f'FILES LIST: {files_list}')
233
 
 
225
  "kk_biology_unt_mc": 0.22330729166666666,
226
  "kk_human_society_rights_unt_mc": 0.242152466367713,
227
  },
228
+ {
229
+ "model_dtype": "torch.float16",
230
+ "model": "gpt-4o-mini",
231
+ "ppl": 0,
232
+ "mmlu_translated_kk": 0.5623775310254735,
233
+ "kk_constitution_mc": 0.79,
234
+ "kk_dastur_mc": 0.755,
235
+ "kazakh_and_literature_unt_mc": 0.4953071672354949,
236
+ "kk_geography_unt_mc": 0.5675203725261933,
237
+ "kk_world_history_unt_mc": 0.6091205211726385,
238
+ "kk_history_of_kazakhstan_unt_mc": 0.47883435582822087,
239
+ "kk_english_unt_mc": 0.6763768775603095,
240
+ "kk_biology_unt_mc": 0.607421875,
241
+ "kk_human_society_rights_unt_mc": 0.7309417040358744,
242
+ },
243
+ {
244
+ "model_dtype": "api",
245
+ "model": "gpt-4o",
246
+ "ppl": 0,
247
+ "mmlu_translated_kk": 0.7419986936642717,
248
+ "kk_constitution_mc": 0.841,
249
+ "kk_dastur_mc": 0.798,
250
+ "kazakh_and_literature_unt_mc": 0.6785409556313993,
251
+ "kk_geography_unt_mc": 0.629802095459837,
252
+ "kk_world_history_unt_mc": 0.6783387622149837,
253
+ "kk_history_of_kazakhstan_unt_mc": 0.6785276073619632,
254
+ "kk_english_unt_mc": 0.7410104688211198,
255
+ "kk_biology_unt_mc": 0.6979166666666666,
256
+ "kk_human_society_rights_unt_mc": 0.7937219730941704,
257
+ },
258
+ {
259
+ "model_dtype": "torch.float16",
260
+ "model": "nova-pro-v1",
261
+ "ppl": 0,
262
+ "mmlu_translated_kk": 0.6792945787067276,
263
+ "kk_constitution_mc": 0.7753623188405797,
264
+ "kk_dastur_mc": 0.718407960199005,
265
+ "kazakh_and_literature_unt_mc": 0.4656569965870307,
266
+ "kk_geography_unt_mc": 0.5541327124563445,
267
+ "kk_world_history_unt_mc": 0.6425081433224755,
268
+ "kk_history_of_kazakhstan_unt_mc": 0.5,
269
+ "kk_english_unt_mc": 0.6845698680018206,
270
+ "kk_biology_unt_mc": 0.6197916666666666,
271
+ "kk_human_society_rights_unt_mc": 0.7713004484304933,
272
+ },
273
+ {
274
+ "model_dtype": "torch.float16",
275
+ "model": "gemini-1.5-pro",
276
+ "ppl": 0,
277
+ "mmlu_translated_kk": 0.7380796864794252,
278
+ "kk_constitution_mc": 0.8164251207729468,
279
+ "kk_dastur_mc": 0.7383084577114428,
280
+ "kazakh_and_literature_unt_mc": 0.5565273037542662,
281
+ "kk_geography_unt_mc": 0.6065192083818394,
282
+ "kk_world_history_unt_mc": 0.6669381107491856,
283
+ "kk_history_of_kazakhstan_unt_mc": 0.5791411042944785,
284
+ "kk_english_unt_mc": 0.7114246700045517,
285
+ "kk_biology_unt_mc": 0.6673177083333334,
286
+ "kk_human_society_rights_unt_mc": 0.7623318385650224,
287
+ },
288
+ {
289
+ "model_dtype": "torch.float16",
290
+ "model": "gemini-1.5-flash",
291
+ "ppl": 0,
292
+ "mmlu_translated_kk": 0.6335728282168517,
293
+ "kk_constitution_mc": 0.748792270531401,
294
+ "kk_dastur_mc": 0.7054726368159204,
295
+ "kazakh_and_literature_unt_mc": 0.4761092150170648,
296
+ "kk_geography_unt_mc": 0.5640279394644936,
297
+ "kk_world_history_unt_mc": 0.5838762214983714,
298
+ "kk_history_of_kazakhstan_unt_mc": 0.43374233128834355,
299
+ "kk_english_unt_mc": 0.6681838871187984,
300
+ "kk_biology_unt_mc": 0.6217447916666666,
301
+ "kk_human_society_rights_unt_mc": 0.7040358744394619,
302
+ },
303
+ {
304
+ "model_dtype": "torch.float16",
305
+ "model": "claude-3-5-sonnet",
306
+ "ppl": 0,
307
+ "mmlu_translated_kk": 0.7335075114304376,
308
+ "kk_constitution_mc": 0.8623188405797102,
309
+ "kk_dastur_mc": 0.7950248756218905,
310
+ "kazakh_and_literature_unt_mc": 0.6548634812286689,
311
+ "kk_geography_unt_mc": 0.6431897555296857,
312
+ "kk_world_history_unt_mc": 0.6669381107491856,
313
+ "kk_history_of_kazakhstan_unt_mc": 0.6251533742331289,
314
+ "kk_english_unt_mc": 0.7291761492944925,
315
+ "kk_biology_unt_mc": 0.6686197916666666,
316
+ "kk_human_society_rights_unt_mc": 0.8026905829596412,
317
+ },
318
+ {
319
+ "model_dtype": "torch.float16",
320
+ "model": "yandex-gpt",
321
+ "ppl": 0,
322
+ "mmlu_translated_kk": 0.39777922926192033,
323
+ "kk_constitution_mc": 0.7028985507246377,
324
+ "kk_dastur_mc": 0.6159203980099502,
325
+ "kazakh_and_literature_unt_mc": 0.3914249146757679,
326
+ "kk_geography_unt_mc": 0.4912689173457509,
327
+ "kk_world_history_unt_mc": 0.5244299674267101,
328
+ "kk_history_of_kazakhstan_unt_mc": 0.4030674846625767,
329
+ "kk_english_unt_mc": 0.5844333181611289,
330
+ "kk_biology_unt_mc": 0.4368489583333333,
331
+ "kk_human_society_rights_unt_mc": 0.6995515695067265,
332
+ },
333
  ]
334
+
335
  files_list = glob.glob("./m_data/model_data/external/*.json")
336
  logging.info(f'FILES LIST: {files_list}')
337