test2

Sleeping

Jimin Huang committed on Jan 28

Commit

507c509

2 Parent(s): 6875c1b 077602c

Merge branch 'main' of hf.co:spaces/TheFinAI/open_greek_finance_llm_leaderboard into main

Files changed (4) hide show

backend/app/services/leaderboard.py CHANGED Viewed

@@ -116,6 +116,11 @@ class LeaderboardService:
                     "value": data.get("QA Raw", 0),
                     "normalized_score": data.get("QA", 0)
                 },
             }
             features = {

                     "value": data.get("QA Raw", 0),
                     "normalized_score": data.get("QA", 0)
                 },
+                "fns": {
+                    "name": "FNS",
+                    "value": data.get("FNS Raw", 0),
+                    "normalized_score": data.get("FNS", 0)
+                },
             }
             features = {

frontend/src/pages/LeaderboardPage/components/Leaderboard/constants/defaults.js CHANGED Viewed

@@ -137,6 +137,12 @@ const COLUMNS = {
       defaultVisible: true,
       label: "QA",
     },
   },
   MODEL_INFO: {
     "metadata.co2_cost": {

       defaultVisible: true,
       label: "QA",
     },
+    "evaluations.fns.normalized_score": {
+      group: "evaluation",
+      size: COLUMN_SIZES.BENCHMARK,
+      defaultVisible: true,
+      label: "FNS",
+    },
   },
   MODEL_INFO: {
     "metadata.co2_cost": {

frontend/src/pages/LeaderboardPage/components/Leaderboard/constants/tooltips.js CHANGED Viewed

@@ -48,7 +48,7 @@ export const COLUMN_TOOLTIPS = {
       subItems: ["Language Understanding", "Classification"],
     },
     {
-      label: "Scoring: Micro F1",
       description: "Was the correct choice selected among the options.",
     },
   ]),
@@ -61,11 +61,24 @@ export const COLUMN_TOOLTIPS = {
       subItems: ["Language Understanding", "Classification"],
     },
     {
-      label: "Scoring: Micro F1",
       description: "Was the correct choice selected among the options.",
     },
   ]),
   ARCHITECTURE: createTooltipContent("Model Architecture Information:", [
     {
       label: "Definition",

       subItems: ["Language Understanding", "Classification"],
     },
     {
+      label: "Scoring: ACC Norm",
       description: "Was the correct choice selected among the options.",
     },
   ]),
       subItems: ["Language Understanding", "Classification"],
     },
     {
+      label: "Scoring: ACC Norm",
       description: "Was the correct choice selected among the options.",
     },
   ]),
+  FNS: createTooltipContent("Multilingual Financial NLP (FNS):", [
+    {
+      label: "Purpose",
+      description:
+        "Tests model's ability to summarize real-world financial annual reports",
+      subItems: ["Language Understanding", "Summarization"],
+    },
+    {
+      label: "Scoring: Rouge1",
+      description: "Was the overlap of unigrams (each word) between the predicted and reference summaries.",
+    },
+  ]),
   ARCHITECTURE: createTooltipContent("Model Architecture Information:", [
     {
       label: "Definition",

frontend/src/pages/LeaderboardPage/components/Leaderboard/utils/columnUtils.js CHANGED Viewed

@@ -768,6 +768,15 @@ export const createColumns = (
         "evaluations.qa.normalized_score"
       ],
     },
   ];
   const optionalColumns = [

         "evaluations.qa.normalized_score"
       ],
     },
+    {
+      accessorKey: "evaluations.fns.normalized_score",
+      header: createHeaderCell("FNS", COLUMN_TOOLTIPS.FNS),
+      cell: ({ row, getValue }) =>
+        createScoreCell(getValue, row, "evaluations.fns.normalized_score"),
+      size: TABLE_DEFAULTS.COLUMNS.COLUMN_SIZES[
+        "evaluations.fns.normalized_score"
+      ],
+    },
   ];
   const optionalColumns = [