Commit 09af587 · 1 Parent(s): 3d56068
davanstrien (HF Staff) committed

add metadata scoring explanation tab

Files changed (1)
  1. app.py +44 -18
app.py CHANGED
@@ -1,5 +1,6 @@
 import asyncio
 import copy
+import json
 import os
 from dataclasses import asdict, dataclass
 from datetime import datetime, timedelta
@@ -12,14 +13,13 @@ import httpx
 import orjson
 from cachetools import TTLCache, cached
 from cashews import NOT_NONE, cache
+from dotenv import load_dotenv
 from httpx import AsyncClient, Client
 from huggingface_hub import hf_hub_url, logging
 from huggingface_hub.utils import disable_progress_bars
 from rich import print
 from tqdm.auto import tqdm
 
-from dotenv import load_dotenv
-
 load_dotenv()  # take environment variables from .env.
 
 CACHE_EXPIRY_TIME = timedelta(hours=3)
@@ -233,6 +233,10 @@ ALL_PIPELINES = {
     "zero-shot-image-classification",
 }
 
+formatted_scores = "\n"
+for k, v in COMMON_SCORES.items():
+    formatted_scores += f"{k}:{v}" + "\n"
+
 
 @lru_cache()
 def generate_task_scores_dict():
@@ -575,20 +579,42 @@ with gr.Blocks() as demo:
         [query, min_metadata_score, mim_model_card_length],
         [filter_results, results_markdown],
     )
-    # with gr.Tab("Scoring metadata quality"):
-    #     with gr.Row():
-    #         gr.Markdown(
-    #             f"""
-    # # Metadata quality scoring
-    # ```
-    # {COMMON_SCORES}
-    # ```
-
-    # For example, `TASK_TYPES_WITH_LANGUAGES` defines all the tasks for which it
-    # is expected to have language metadata associated with the model.
-    # ```
-    # {TASK_TYPES_WITH_LANGUAGES}
-    # ```
-    # """
-    # )
+    with gr.Tab("Scoring metadata quality (details)"):
+        with gr.Row():
+            gr.Markdown(
+                """# How is metadata quality scored?
+The current approach to metadata scoring is based on checking whether a particular piece of metadata is present or not, i.e. is a dataset specified in the model's metadata or not?
+For each metadata field a score between 1 and 3 is given if that field is present. These scores are based on the relative importance of the metadata field.
+We do this on a task-specific basis for models where a `pipeline_tag` exists.
+For each task the scores achieved are compared to the maximum possible score for that task."""
+            )
+        with gr.Row():
+            gr.Markdown(
+                """
+### Common scores
+We start with some 'common scores'. These common scores are for fields which should be present for any model, i.e. they are not specific to a particular task."""
+            )
+        with gr.Accordion(label="Common scores dictionary"):
+            gr.JSON(json.dumps(COMMON_SCORES))
+        with gr.Row():
+            gr.Markdown(
+                """# Task-specific scoring
+We also define task-specific scores for the following model task types. This allows our scoring to reflect the fact that different tasks have different metadata requirements. For example, the following set includes all tasks for which a language should be specified."""
+            )
+        with gr.Row():
+            markdown_formatted_languages = "".join(
+                "-" + " " + task + "\n" for task in TASK_TYPES_WITH_LANGUAGES
+            )
+            gr.Markdown(markdown_formatted_languages)
+        with gr.Row():
+            gr.Markdown(
+                """#### Text classification example
+Below you can see the example scoring dictionary for text-classification models."""
+            )
+        with gr.Accordion(label="Text classification dictionary"):
+            text_class_scores_example = SCORES["text-classification"]
+            gr.Json(json.dumps(text_class_scores_example))
+        with gr.Accordion(label="Full overview of all scores", open=False):
+            gr.Json(json.dumps(SCORES))
+
 demo.launch()
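
As background for the explanation added in the new tab, the sketch below shows how a presence-based metadata score of this kind can be computed. It is not the implementation in app.py: the field names, the example weights, and the score_metadata helper are hypothetical stand-ins for the real COMMON_SCORES and task-specific SCORES dictionaries, which are defined elsewhere in the file and only rendered by this commit.

# Illustrative sketch only -- not the code from app.py.
# Assumed shape: a dict mapping metadata field name -> importance weight (1-3),
# mirroring the COMMON_SCORES / task-specific SCORES dictionaries described in the tab.
EXAMPLE_COMMON_SCORES = {"license": 3, "datasets": 2, "model-index": 1}  # hypothetical weights
EXAMPLE_TASK_SCORES = {
    # hypothetical: text-classification additionally expects language metadata
    "text-classification": {**EXAMPLE_COMMON_SCORES, "language": 2},
}


def score_metadata(card_data: dict, pipeline_tag: str) -> float:
    """Return the fraction of the maximum possible score achieved for this task."""
    weights = EXAMPLE_TASK_SCORES.get(pipeline_tag, EXAMPLE_COMMON_SCORES)
    max_score = sum(weights.values())
    # A field contributes its full weight when it is present (and non-empty).
    achieved = sum(w for field, w in weights.items() if card_data.get(field))
    return achieved / max_score


print(score_metadata({"license": "apache-2.0", "language": "en"}, "text-classification"))
# -> 0.625 with the hypothetical weights above (5 points out of a possible 8)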