Spaces:

whitecircle-ai
/

circle-guard-bench

Running

apsys committed on Apr 25

Commit

5125f34

1 Parent(s): a17bcda

categories rename

Files changed (2) hide show

app.py CHANGED Viewed

@@ -585,16 +585,24 @@ demo = gr.Blocks(css=custom_css, theme=custom_theme)
 # Mapping from original category names to display names
 CATEGORY_DISPLAY_MAP = {
-    "Criminal, Violent, and Terrorist Activity": "Crime & Violence",
-    "Manipulation, Deception, and Misinformation": "Misinformation",
-    "Creative Content Involving Illicit Themes": "Illicit Creative",
-    "Sexual Content and Violence": "Sexual Content",
-    "Political Corruption and Legal Evasion": "Corruption & Legal Evasion",
-    "Labor Exploitation and Human Trafficking": "Labor Exploitation",
-    "Environmental and Industrial Harm": "Environmental & Industrial Harm",
-    "Animal Cruelty and Exploitation": "Animal Harm",
-    "Self–Harm and Suicidal Ideation": "Self-Harm",
-    "Safe Prompts": "Safe Prompts"
 }
 # Create reverse mapping for lookups
 CATEGORY_REVERSE_MAP = {v: k for k, v in CATEGORY_DISPLAY_MAP.items()}

 # Mapping from original category names to display names
 CATEGORY_DISPLAY_MAP = {
+    'Political Corruption and Legal Evasion': 'Corruption & Legal Evasion',
+    'Financial Fraud and Unethical Business': 'Financial Fraud',
+    'AI Manipulation and Jailbreaking': 'AI Jailbreaking',
+    'Child Exploitation and Abuse': 'Child Exploitation',
+    'Hate Speech, Extremism, and Discrimination': 'Hate Speech',
+    'Labor Exploitation and Human Trafficking': 'Labor Exploitation',
+    'Manipulation, Deception, and Misinformation': 'Misinformation',
+    'Environmental and Industrial Harm': 'Environmental Harm',
+    'Academic Dishonesty and Cheating': 'Academic Dishonesty',
+    'Self–Harm and Suicidal Ideation': 'Self-Harm',
+    'Animal Cruelty and Exploitation': 'Animal Harm',
+    'Criminal, Violent, and Terrorist Activity': 'Crime & Violence',
+    'Drug– and Substance–Related Activities': 'Drug Use',
+    'Sexual Content and Violence': 'Sexual Content',
+    'Weapon, Explosives, and Hazardous Materials': 'Weapons & Hazmat',
+    'Safe Prompts': 'Safe Prompts',
+    'Cybercrime, Hacking, and Digital Exploits': 'Cybercrime',
+    'Creative Content Involving Illicit Themes': 'Illicit Creative'
 }
 # Create reverse mapping for lookups
 CATEGORY_REVERSE_MAP = {v: k for k, v in CATEGORY_DISPLAY_MAP.items()}

src/display/utils.py CHANGED Viewed

@@ -368,16 +368,24 @@ NEVER_HIDDEN_COLS = [getattr(GUARDBENCH_COLUMN, f.name).name for f in fields(GUA
 # Categories in GuardBench
 CATEGORIES = [
-    "Criminal, Violent, and Terrorist Activity",
-    "Manipulation, Deception, and Misinformation",
-    "Creative Content Involving Illicit Themes",
-    "Sexual Content and Violence",
-    "Political Corruption and Legal Evasion",
-    "Labor Exploitation and Human Trafficking",
-    "Environmental and Industrial Harm",
-    "Animal Cruelty and Exploitation",
-    "Self–Harm and Suicidal Ideation",
-    "Safe Prompts"
 ]
 # Test types in GuardBench

 # Categories in GuardBench
 CATEGORIES = [
+    'Political Corruption and Legal Evasion',
+    'Financial Fraud and Unethical Business',
+    'AI Manipulation and Jailbreaking',
+    'Child Exploitation and Abuse',
+    'Hate Speech, Extremism, and Discrimination',
+    'Labor Exploitation and Human Trafficking',
+    'Manipulation, Deception, and Misinformation',
+    'Environmental and Industrial Harm',
+    'Academic Dishonesty and Cheating',
+    'Self–Harm and Suicidal Ideation',
+    'Animal Cruelty and Exploitation',
+    'Criminal, Violent, and Terrorist Activity',
+    'Drug– and Substance–Related Activities',
+    'Sexual Content and Violence',
+    'Weapon, Explosives, and Hazardous Materials',
+    'Safe Prompts',
+    'Cybercrime, Hacking, and Digital Exploits',
+    'Creative Content Involving Illicit Themes'
 ]
 # Test types in GuardBench