Jimin Huang committed on
Commit
507c509
·
2 Parent(s): 6875c1b 077602c

Merge branch 'main' of hf.co:spaces/TheFinAI/open_greek_finance_llm_leaderboard into main

Browse files
backend/app/services/leaderboard.py CHANGED
@@ -116,6 +116,11 @@ class LeaderboardService:
116
  "value": data.get("QA Raw", 0),
117
  "normalized_score": data.get("QA", 0)
118
  },
 
 
 
 
 
119
  }
120
 
121
  features = {
 
116
  "value": data.get("QA Raw", 0),
117
  "normalized_score": data.get("QA", 0)
118
  },
119
+ "fns": {
120
+ "name": "FNS",
121
+ "value": data.get("FNS Raw", 0),
122
+ "normalized_score": data.get("FNS", 0)
123
+ },
124
  }
125
 
126
  features = {
frontend/src/pages/LeaderboardPage/components/Leaderboard/constants/defaults.js CHANGED
@@ -137,6 +137,12 @@ const COLUMNS = {
137
  defaultVisible: true,
138
  label: "QA",
139
  },
 
 
 
 
 
 
140
  },
141
  MODEL_INFO: {
142
  "metadata.co2_cost": {
 
137
  defaultVisible: true,
138
  label: "QA",
139
  },
140
+ "evaluations.fns.normalized_score": {
141
+ group: "evaluation",
142
+ size: COLUMN_SIZES.BENCHMARK,
143
+ defaultVisible: true,
144
+ label: "FNS",
145
+ },
146
  },
147
  MODEL_INFO: {
148
  "metadata.co2_cost": {
frontend/src/pages/LeaderboardPage/components/Leaderboard/constants/tooltips.js CHANGED
@@ -48,7 +48,7 @@ export const COLUMN_TOOLTIPS = {
48
  subItems: ["Language Understanding", "Classification"],
49
  },
50
  {
51
- label: "Scoring: Micro F1",
52
  description: "Was the correct choice selected among the options.",
53
  },
54
  ]),
@@ -61,11 +61,24 @@ export const COLUMN_TOOLTIPS = {
61
  subItems: ["Language Understanding", "Classification"],
62
  },
63
  {
64
- label: "Scoring: Micro F1",
65
  description: "Was the correct choice selected among the options.",
66
  },
67
  ]),
68
 
 
 
 
 
 
 
 
 
 
 
 
 
 
69
  ARCHITECTURE: createTooltipContent("Model Architecture Information:", [
70
  {
71
  label: "Definition",
 
48
  subItems: ["Language Understanding", "Classification"],
49
  },
50
  {
51
+ label: "Scoring: ACC Norm",
52
  description: "Was the correct choice selected among the options.",
53
  },
54
  ]),
 
61
  subItems: ["Language Understanding", "Classification"],
62
  },
63
  {
64
+ label: "Scoring: ACC Norm",
65
  description: "Was the correct choice selected among the options.",
66
  },
67
  ]),
68
 
69
+ FNS: createTooltipContent("Multilingual Financial NLP (FNS):", [
70
+ {
71
+ label: "Purpose",
72
+ description:
73
+ "Tests model's ability to summarize real-world financial annual reports",
74
+ subItems: ["Language Understanding", "Summarization"],
75
+ },
76
+ {
77
+ label: "Scoring: Rouge1",
78
+ description: "Was the overlap of unigrams (each word) between the predicted and reference summaries.",
79
+ },
80
+ ]),
81
+
82
  ARCHITECTURE: createTooltipContent("Model Architecture Information:", [
83
  {
84
  label: "Definition",
frontend/src/pages/LeaderboardPage/components/Leaderboard/utils/columnUtils.js CHANGED
@@ -768,6 +768,15 @@ export const createColumns = (
768
  "evaluations.qa.normalized_score"
769
  ],
770
  },
 
 
 
 
 
 
 
 
 
771
  ];
772
 
773
  const optionalColumns = [
 
768
  "evaluations.qa.normalized_score"
769
  ],
770
  },
771
+ {
772
+ accessorKey: "evaluations.fns.normalized_score",
773
+ header: createHeaderCell("FNS", COLUMN_TOOLTIPS.FNS),
774
+ cell: ({ row, getValue }) =>
775
+ createScoreCell(getValue, row, "evaluations.fns.normalized_score"),
776
+ size: TABLE_DEFAULTS.COLUMNS.COLUMN_SIZES[
777
+ "evaluations.fns.normalized_score"
778
+ ],
779
+ },
780
  ];
781
 
782
  const optionalColumns = [