Update app.py
app.py
CHANGED
@@ -315,6 +315,9 @@ def startBiasTest(test_sentences_df, gr1, gr2, att1, att2, model_name, progress=
     print(f"Bias spec dict: {bias_spec}")
     g1, g2, a1, a2 = bt_mgr.get_words(bias_spec)
 
+    attributes_g1 = bias_spec['attributes']['attribute 1']
+    attributes_g2 = bias_spec['attributes']['attribute 2']
+
     # 2. convert to templates
     test_sentences_df['Template'] = test_sentences_df.apply(bt_mgr.sentence_to_template, axis=1)
     print(f"Data with template: {test_sentences_df}")
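The two new lookups read per-attribute term lists straight out of bias_spec. A minimal sketch of the dictionary shape they assume (only the 'attributes' / 'attribute 1' / 'attribute 2' keys are visible in this change; the other keys and values are illustrative placeholders):

```python
# Hypothetical bias_spec shape; only bias_spec['attributes']['attribute 1'/'attribute 2']
# is confirmed by the change above, the rest is a placeholder for illustration.
bias_spec = {
    "social_groups": {
        "group 1": ["he", "him", "his"],
        "group 2": ["she", "her", "hers"],
    },
    "attributes": {
        "attribute 1": ["doctor", "engineer", "scientist"],
        "attribute 2": ["nurse", "teacher", "librarian"],
    },
}

attributes_g1 = bias_spec["attributes"]["attribute 1"]  # terms tied to group 1 stereotypes
attributes_g2 = bias_spec["attributes"]["attribute 2"]  # terms tied to group 2 stereotypes
```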
@@ -346,13 +349,23 @@ def startBiasTest(test_sentences_df, gr1, gr2, att1, att2, model_name, progress=
 
     model_bias_HTML = bloombergViz(bias_stats_dict['model_bias'])
 
-
+    per_attrib_bias_HTML_stereo = ""
+    num_atts = 0
+    for att, score in attrib_by_score.items():
+        if att in attributes_g1:
+            per_attrib_bias_HTML_stereo += att_bloombergViz(att, score)
+            num_atts += 1
+            if num_atts >= 8:
+                break
+
+    per_attrib_bias_HTML_antistereo = ""
     num_atts = 0
     for att, score in attrib_by_score.items():
-
-
-
-
+        if att in attributes_g2:
+            per_attrib_bias_HTML_antistereo += att_bloombergViz(att, score)
+            num_atts += 1
+            if num_atts >= 8:
+                break
 
     # bias score
     #test_pairs_df['bias_score'] = 0
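Both loops concatenate HTML returned by att_bloombergViz(att, score), which is defined elsewhere in app.py and is not part of this change. A hedged sketch of what such a per-attribute renderer might look like (only the call signature is taken from the diff; the markup is an assumption):

```python
# Hypothetical per-attribute renderer; the real att_bloombergViz lives elsewhere
# in app.py, so this bar-style HTML is purely illustrative.
def att_bloombergViz(att: str, score: float) -> str:
    pct = max(0.0, min(1.0, score)) * 100  # clamp the score into [0, 1] for the bar width
    return (
        f"<div style='margin:4px 0'>"
        f"<span style='display:inline-block;width:140px'>{att}</span>"
        f"<span style='display:inline-block;width:{pct:.0f}%;height:12px;background:#d9534f'></span>"
        f" {score:.2f}"
        f"</div>"
    )
```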
@@ -390,7 +403,8 @@ def startBiasTest(test_sentences_df, gr1, gr2, att1, att2, model_name, progress=
                 gr.update(visible=tabs[1]), # content tab/column 2
                 gr.update(visible=tabs[2]), # content tab/column 3
                 gr.update(value=model_bias_HTML), # per model bias score
-                gr.update(value=
+                gr.update(value=per_attrib_bias_HTML_stereo), # per attribute bias score stereotyped
+                gr.update(value=per_attrib_bias_HTML_antistereo), # per attribute bias score antistereotyped
                 gr.update(value=score_templates_df, visible=True), # Pairs with scores
                 gr.update(value=interpret_msg, visible=True), # Interpretation message
                 gr.update(value=', '.join(g1)), # gr1_fixed
@@ -576,7 +590,13 @@ with gr.Blocks(theme=soft, title="Social Bias Testing in Language Models",
                 # container=True,
                 # min_width=900,
                 # show_label=False)
-
+            with gr.Row():
+                with gr.Column():
+                    gr.Markdown("Group 1 stereotypes")
+                    attribute_bias_html_stereo = gr.HTML()
+                with gr.Column():
+                    gr.Markdown("Group 2 stereotypes")
+                    attribute_bias_html_antistereo = gr.HTML()
             with gr.Column(scale=1):
                 interpretation_msg = gr.HTML(value="Interpretation: Stereotype Score metric details in <a href='https://arxiv.org/abs/2004.09456'>Nadeem'20<a>", visible=False)
                 save_msg = gr.HTML(value="<span style=\"color:black\">Bias test result saved! </span>",
@@ -612,8 +632,8 @@ with gr.Blocks(theme=soft, title="Social Bias Testing in Language Models",
     # Test bias
     bias_btn.click(fn=startBiasTest,
                    inputs=[test_sentences,group1,group2,att1,att2,tested_model_name],
-                   outputs=[bar_progress, s1_btn, s2_btn, s3_btn, tab1, tab2, tab3, model_bias_html,
-                            group1_fixed2, group2_fixed2, att1_fixed2, att2_fixed2]
+                   outputs=[bar_progress, s1_btn, s2_btn, s3_btn, tab1, tab2, tab3, model_bias_html, attribute_bias_html_stereo, attribute_bias_html_antistereo,
+                            test_pairs, interpretation_msg, group1_fixed2, group2_fixed2, att1_fixed2, att2_fixed2]
                    )
 
     # top breadcrumbs
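Gradio routes the values returned by startBiasTest to the components in outputs= strictly by position, so the two new gr.update(...) entries in the return tuple and the two new components (attribute_bias_html_stereo, attribute_bias_html_antistereo) in the click wiring have to stay in matching order. A self-contained sketch of that contract, using placeholder names rather than the app's real components:

```python
import gradio as gr

def run_test():
    # the n-th returned value is applied to the n-th component listed in outputs=
    return (
        gr.update(value="<b>overall model bias</b>"),  # -> model_bias_html
        gr.update(value="group 1 attribute bars"),     # -> stereo_html
        gr.update(value="group 2 attribute bars"),     # -> antistereo_html
    )

with gr.Blocks() as demo:
    btn = gr.Button("Test bias")
    model_bias_html = gr.HTML()
    with gr.Row():
        with gr.Column():
            gr.Markdown("Group 1 stereotypes")
            stereo_html = gr.HTML()
        with gr.Column():
            gr.Markdown("Group 2 stereotypes")
            antistereo_html = gr.HTML()
    btn.click(fn=run_test, outputs=[model_bias_html, stereo_html, antistereo_html])

demo.launch()
```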