Spaces:

UltraRonin
/

LR2Bench

Running

App Files Community

UltraRonin committed on Mar 11

Commit

0d4e8d1

1 Parent(s): fced179

add

Browse files

Files changed (13) hide show

results/DeepSeek-R1.json +3 -1
results/Llama-3.1-70B-Instruct.json +3 -1
results/Llama-3.1-8B-Instruct.json +3 -1
results/Llama-3.3-70B-Instruct.json +3 -1
results/Mistral-7B-Instruct-v0.3.json +3 -1
results/Mistral-Large-Instruct-2411.json +3 -1
results/Mistral-Small-Instruct-2409.json +3 -1
results/QwQ-32B-Preview.json +3 -1
results/Qwen2.5-32B-Instruct.json +3 -1
results/Qwen2.5-72B-Instruct.json +3 -1
results/Qwen2.5-7B-Instruct.json +3 -1
src/display/formatting.py +2 -3
src/leaderboard/read_evals.py +12 -7

results/DeepSeek-R1.json CHANGED Viewed

@@ -1,6 +1,8 @@
 {
     "config": {
-        "model_name": "deepseek-ai/DeepSeek-R1"
     },
     "results": {
         "Overall": {

 {
     "config": {
+        "model_name": "deepseek-ai/DeepSeek-R1",
+        "link": "https://huggingface.co/deepseek-ai/DeepSeek-R1",
+        "Params": "671B"
     },
     "results": {
         "Overall": {

results/Llama-3.1-70B-Instruct.json CHANGED Viewed

@@ -1,6 +1,8 @@
 {
     "config": {
-        "model_name": "meta-llama/Meta-Llama-3.1-70B-Instruct"
     },
     "results": {
         "Overall": {

 {
     "config": {
+        "model_name": "meta-llama/Llama-3.1-70B-Instruct",
+        "link": "https://huggingface.co/meta-llama/Llama-3.1-70B-Instruct",
+        "Params": "70B"
     },
     "results": {
         "Overall": {

results/Llama-3.1-8B-Instruct.json CHANGED Viewed

@@ -1,6 +1,8 @@
 {
     "config": {
-        "model_name": "meta-llama/Meta-Llama-3.1-8B-Instruct"
     },
     "results": {
         "Overall": {

 {
     "config": {
+        "model_name": "meta-llama/Llama-3.1-8B-Instruct",
+        "link": "https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct",
+        "Params": "8B"
     },
     "results": {
         "Overall": {

results/Llama-3.3-70B-Instruct.json CHANGED Viewed

@@ -1,6 +1,8 @@
 {
     "config": {
-        "model_name": "meta-llama/Llama-3.3-70B-Instruct"
     },
     "results": {
         "Overall": {

 {
     "config": {
+        "model_name": "meta-llama/Llama-3.3-70B-Instruct",
+        "link": "https://huggingface.co/meta-llama/Llama-3.3-70B-Instruct",
+        "Params": "70B"
     },
     "results": {
         "Overall": {

results/Mistral-7B-Instruct-v0.3.json CHANGED Viewed

@@ -1,6 +1,8 @@
 {
     "config": {
-        "model_name": "mistralai/Mistral-7B-Instruct-v0.3"
     },
     "results": {
         "Overall": {

 {
     "config": {
+        "model_name": "mistralai/Mistral-7B-Instruct-v0.3",
+        "link": "https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.3",
+        "Params": "7B"
     },
     "results": {
         "Overall": {

results/Mistral-Large-Instruct-2411.json CHANGED Viewed

@@ -1,6 +1,8 @@
 {
     "config": {
-        "model_name": "mistralai/Mistral-Large-Instruct-2411"
     },
     "results": {
         "Overall": {

 {
     "config": {
+        "model_name": "mistralai/Mistral-Large-Instruct-2411",
+        "link": "https://huggingface.co/mistralai/Mistral-Large-Instruct-2411",
+        "Params": "123B"
     },
     "results": {
         "Overall": {

results/Mistral-Small-Instruct-2409.json CHANGED Viewed

@@ -1,6 +1,8 @@
 {
     "config": {
-        "model_name": "mistralai/Mistral-Small-Instruct-2409"
     },
     "results": {
         "Overall": {

 {
     "config": {
+        "model_name": "mistralai/Mistral-Small-Instruct-2409",
+        "link": "https://huggingface.co/mistralai/Mistral-Small-Instruct-2409",
+        "Params": "22B"
     },
     "results": {
         "Overall": {

results/QwQ-32B-Preview.json CHANGED Viewed

@@ -1,6 +1,8 @@
 {
     "config": {
-        "model_name": "Qwen/QwQ-32B-Preview"
     },
     "results": {
         "Overall": {

 {
     "config": {
+        "model_name": "Qwen/QwQ-32B-Preview",
+        "link": "https://huggingface.co/Qwen/QwQ-32B-Preview",
+        "Params": "32B"
     },
     "results": {
         "Overall": {

results/Qwen2.5-32B-Instruct.json CHANGED Viewed

@@ -1,6 +1,8 @@
 {
     "config": {
-        "model_name": "Qwen/Qwen2.5-32B-Instruct"
     },
     "results": {
         "Overall": {

 {
     "config": {
+        "model_name": "Qwen/Qwen2.5-32B-Instruct",
+        "link": "https://huggingface.co/Qwen/Qwen2.5-32B-Instruct",
+        "Params": "32B"
     },
     "results": {
         "Overall": {

results/Qwen2.5-72B-Instruct.json CHANGED Viewed

@@ -1,6 +1,8 @@
 {
     "config": {
-        "model_name": "Qwen/Qwen2.5-72B-Instruct"
     },
     "results": {
         "Overall": {

 {
     "config": {
+        "model_name": "Qwen/Qwen2.5-72B-Instruct",
+        "link": "https://huggingface.co/Qwen/Qwen2.5-72B-Instruct",
+        "Params": "72B"
     },
     "results": {
         "Overall": {

results/Qwen2.5-7B-Instruct.json CHANGED Viewed

@@ -1,6 +1,8 @@
 {
     "config": {
-        "model_name": "Qwen/Qwen2.5-7B-Instruct"
     },
     "results": {
         "Overall": {

 {
     "config": {
+        "model_name": "Qwen/Qwen2.5-7B-Instruct",
+        "link": "https://huggingface.co/Qwen/Qwen2.5-7B-Instruct",
+        "Params": "7B"
     },
     "results": {
         "Overall": {

src/display/formatting.py CHANGED Viewed

@@ -2,9 +2,8 @@ def model_hyperlink(link, model_name):
     return f'<a target="_blank" href="{link}" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">{model_name}</a>'
-def make_clickable_model(model_name, still_on_hub=False):
-    if still_on_hub:
-        link = f"https://huggingface.co/{model_name}"
         return model_hyperlink(link, model_name)
     else:
         return f'<span>{model_name}</span>'

     return f'<a target="_blank" href="{link}" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">{model_name}</a>'
+def make_clickable_model(model_name, link=''):
+    if link:
         return model_hyperlink(link, model_name)
     else:
         return f'<span>{model_name}</span>'

src/leaderboard/read_evals.py CHANGED Viewed

@@ -28,9 +28,10 @@ class EvalResult:
     # architecture: str = "Unknown"
     # license: str = "?"
     # likes: int = 0
-    num_params: int = 0
     # date: str = "" # submission date of request file
-    still_on_hub: bool = False
     @classmethod
     def init_from_json_file(self, json_filepath):
@@ -46,6 +47,8 @@ class EvalResult:
         # Get model and org
         org_and_model = config.get("model_name", config.get("model_args", None))
         org_and_model = org_and_model.split("/", 1)
         if len(org_and_model) == 1:
             org = None
@@ -59,9 +62,9 @@ class EvalResult:
             result_key = f"{org}_{model}"
         full_model = "/".join(org_and_model)
-        still_on_hub, _, model_config = is_model_on_hub(
-            full_model, config.get("model_sha", "main"), trust_remote_code=True, test_tokenizer=False
-        )
         # architecture = "?"
         # if model_config is not None:
         #     architectures = getattr(model_config, "architectures", None)
@@ -87,9 +90,11 @@ class EvalResult:
             org=org,
             model=model,
             results=results,
             # precision=precision,
             # revision= config.get("model_sha", ""),
-            still_on_hub=still_on_hub,
             # architecture=architecture
         )
@@ -121,7 +126,7 @@ class EvalResult:
             # AutoEvalColumn.model_type_symbol.name: self.model_type.value.symbol,
             # AutoEvalColumn.weight_type.name: self.weight_type.value.name,
             # AutoEvalColumn.architecture.name: self.architecture,
-            AutoEvalColumn.model.name: make_clickable_model(self.full_model, self.still_on_hub),
             # AutoEvalColumn.revision.name: self.revision,
             AutoEvalColumn.average.name: average,
             # AutoEvalColumn.license.name: self.license,

     # architecture: str = "Unknown"
     # license: str = "?"
     # likes: int = 0
+    num_params: str = '-'
     # date: str = "" # submission date of request file
+    # still_on_hub: bool = False
+    link: str = ''
     @classmethod
     def init_from_json_file(self, json_filepath):
         # Get model and org
         org_and_model = config.get("model_name", config.get("model_args", None))
         org_and_model = org_and_model.split("/", 1)
+        link = config.get("link", '')
+        params = config.get("params", '-')
         if len(org_and_model) == 1:
             org = None
             result_key = f"{org}_{model}"
         full_model = "/".join(org_and_model)
+        # still_on_hub, _, model_config = is_model_on_hub(
+        #     full_model, config.get("model_sha", "main"), trust_remote_code=True, test_tokenizer=False
+        # )
         # architecture = "?"
         # if model_config is not None:
         #     architectures = getattr(model_config, "architectures", None)
             org=org,
             model=model,
             results=results,
+            link=link,
+            num_params=params,
             # precision=precision,
             # revision= config.get("model_sha", ""),
+            # still_on_hub=still_on_hub,
             # architecture=architecture
         )
             # AutoEvalColumn.model_type_symbol.name: self.model_type.value.symbol,
             # AutoEvalColumn.weight_type.name: self.weight_type.value.name,
             # AutoEvalColumn.architecture.name: self.architecture,
+            AutoEvalColumn.model.name: make_clickable_model(self.full_model, self.link),
             # AutoEvalColumn.revision.name: self.revision,
             AutoEvalColumn.average.name: average,
             # AutoEvalColumn.license.name: self.license,