Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -289,6 +289,11 @@ def bloombergViz(val):
|
|
289 |
numUnFilled = numblocks - numFilled
|
290 |
return numFilled * filled + numUnFilled * unfilled
|
291 |
|
|
|
|
|
|
|
|
|
|
|
292 |
def startBiasTest(test_sentences_df, gr1, gr2, att1, att2, model_name, progress=gr.Progress()):
|
293 |
global G_NUM_SENTENCES
|
294 |
|
@@ -340,6 +345,10 @@ def startBiasTest(test_sentences_df, gr1, gr2, att1, att2, model_name, progress=
|
|
340 |
|
341 |
model_bias_HTML = bloombergViz(bias_stats_dict['model_bias'])
|
342 |
|
|
|
|
|
|
|
|
|
343 |
# bias score
|
344 |
#test_pairs_df['bias_score'] = 0
|
345 |
test_pairs_df.loc[test_pairs_df['stereotyped'] == 1, 'bias_score'] = test_pairs_df['top_logit']-test_pairs_df['bottom_logit']
|
@@ -376,7 +385,7 @@ def startBiasTest(test_sentences_df, gr1, gr2, att1, att2, model_name, progress=
|
|
376 |
gr.update(visible=tabs[1]), # content tab/column 2
|
377 |
gr.update(visible=tabs[2]), # content tab/column 3
|
378 |
gr.update(value=model_bias_HTML), # per model bias score
|
379 |
-
|
380 |
gr.update(value=score_templates_df, visible=True), # Pairs with scores
|
381 |
gr.update(value=interpret_msg, visible=True), # Interpretation message
|
382 |
gr.update(value=', '.join(g1)), # gr1_fixed
|
@@ -557,11 +566,12 @@ with gr.Blocks(theme=soft, title="Social Bias Testing in Language Models",
|
|
557 |
# elem_id="res_label",
|
558 |
# show_label=False)
|
559 |
lbl_attrib_bias = gr.Markdown("**Bias in the Context of Attributes** - % stereotyped choices (↑ more bias)")
|
560 |
-
attribute_bias_labels = gr.Label(num_top_classes=8, label="Per attribute: % stereotyped choices (↑ more bias)",
|
561 |
-
|
562 |
-
|
563 |
-
|
564 |
-
|
|
|
565 |
with gr.Column(scale=1):
|
566 |
interpretation_msg = gr.HTML(value="Interpretation: Stereotype Score metric details in <a href='https://arxiv.org/abs/2004.09456'>Nadeem'20<a>", visible=False)
|
567 |
save_msg = gr.HTML(value="<span style=\"color:black\">Bias test result saved! </span>",
|
@@ -597,7 +607,7 @@ with gr.Blocks(theme=soft, title="Social Bias Testing in Language Models",
|
|
597 |
# Test bias
|
598 |
bias_btn.click(fn=startBiasTest,
|
599 |
inputs=[test_sentences,group1,group2,att1,att2,tested_model_name],
|
600 |
-
outputs=[bar_progress, s1_btn, s2_btn, s3_btn, tab1, tab2, tab3, model_bias_html,
|
601 |
group1_fixed2, group2_fixed2, att1_fixed2, att2_fixed2]
|
602 |
)
|
603 |
|
|
|
289 |
numUnFilled = numblocks - numFilled
|
290 |
return numFilled * filled + numUnFilled * unfilled
|
291 |
|
292 |
+
def att_bloombergViz(att, val):
    """Render one attribute's bias score as a labeled Bloomberg-style bar.

    Wraps the bar produced by bloombergViz(val) in a <div> headed by the
    attribute name and the score shown as a whole-number percentage.
    """
    bar = bloombergViz(val)
    return f"<div>{att}: {round(val*100)}%<br>{bar}</div>"
|
296 |
+
|
297 |
def startBiasTest(test_sentences_df, gr1, gr2, att1, att2, model_name, progress=gr.Progress()):
|
298 |
global G_NUM_SENTENCES
|
299 |
|
|
|
345 |
|
346 |
model_bias_HTML = bloombergViz(bias_stats_dict['model_bias'])
|
347 |
|
348 |
+
# Build the per-attribute bias visualization HTML.
per_attrib_bias_HTML = ""
# NOTE(review): assumes bias_stats_dict['per_attribute'] yields
# (attribute, score) pairs — e.g. a list of 2-tuples. If it is a plain
# dict, iterate .items() instead; confirm where bias_stats_dict is built.
for att, score in bias_stats_dict['per_attribute']:
    # Fix: the original accumulated into `per_attrib_bias`, which is never
    # initialized (NameError) — the initialized/consumed variable is
    # `per_attrib_bias_HTML` (later passed to gr.update(value=...)).
    per_attrib_bias_HTML += att_bloombergViz(att, score)
|
351 |
+
|
352 |
# bias score
|
353 |
#test_pairs_df['bias_score'] = 0
|
354 |
test_pairs_df.loc[test_pairs_df['stereotyped'] == 1, 'bias_score'] = test_pairs_df['top_logit']-test_pairs_df['bottom_logit']
|
|
|
385 |
gr.update(visible=tabs[1]), # content tab/column 2
|
386 |
gr.update(visible=tabs[2]), # content tab/column 3
|
387 |
gr.update(value=model_bias_HTML), # per model bias score
|
388 |
+
gr.update(value=per_attrib_bias_HTML), # per attribute bias score
|
389 |
gr.update(value=score_templates_df, visible=True), # Pairs with scores
|
390 |
gr.update(value=interpret_msg, visible=True), # Interpretation message
|
391 |
gr.update(value=', '.join(g1)), # gr1_fixed
|
|
|
566 |
# elem_id="res_label",
|
567 |
# show_label=False)
|
568 |
lbl_attrib_bias = gr.Markdown("**Bias in the Context of Attributes** - % stereotyped choices (↑ more bias)")
|
569 |
+
# attribute_bias_labels = gr.Label(num_top_classes=8, label="Per attribute: % stereotyped choices (↑ more bias)",
|
570 |
+
# elem_id="per_attrib_label_elem",
|
571 |
+
# container=True,
|
572 |
+
# min_width=900,
|
573 |
+
# show_label=False)
|
574 |
+
attribute_bias_html = gr.HTML()
|
575 |
with gr.Column(scale=1):
|
576 |
interpretation_msg = gr.HTML(value="Interpretation: Stereotype Score metric details in <a href='https://arxiv.org/abs/2004.09456'>Nadeem'20<a>", visible=False)
|
577 |
save_msg = gr.HTML(value="<span style=\"color:black\">Bias test result saved! </span>",
|
|
|
607 |
# Test bias
|
608 |
bias_btn.click(fn=startBiasTest,
|
609 |
inputs=[test_sentences,group1,group2,att1,att2,tested_model_name],
|
610 |
+
outputs=[bar_progress, s1_btn, s2_btn, s3_btn, tab1, tab2, tab3, model_bias_html, attribute_bias_html, test_pairs, interpretation_msg,
|
611 |
group1_fixed2, group2_fixed2, att1_fixed2, att2_fixed2]
|
612 |
)
|
613 |
|