bias-test-gpt-breadcrumbs

Sleeping

App Files Files Community

rjiang12 committed on Jul 4, 2023

Commit

ebfafc0

1 Parent(s): 54fd843

Update app.py

Browse files

Files changed (1) hide show

app.py +16 -14

app.py CHANGED Viewed

@@ -272,17 +272,19 @@ def retrieveSentences(gr1, gr2, att1, att2, progress=gr.Progress()):
             gr.update(value=', '.join(a2))  # att2_fixed
         )
-def bloombergViz(val, numblocks=10):
     percent = round(val * 100)
     percentStr = f"{percent}"
     filled = "<div style='height:20px;width:20px;background-color:#555;display:inline-block'></div> "
     unfilled = "<div style='height:20px;width:20px;background-color:#999;display:inline-block'></div> "
     numFilled = round((percent/100) * numblocks)
     numUnFilled = numblocks - numFilled
     return numFilled * filled + numUnFilled * unfilled
-def att_bloombergViz(att, val, numblocks):
-    viz = bloombergViz(val, numblocks)
     attHTML = f"<div style='border-style:solid;border-color:#999;border-radius:12px'>{att}: {round(val*100)}%<br>{viz}</div><br>"
     return attHTML
@@ -348,7 +350,7 @@ def startBiasTest(test_sentences_df, gr1, gr2, att1, att2, model_name, progress=
     per_attrib_bias = bias_stats_dict['per_attribute']
     attrib_by_score = dict(sorted(per_attrib_bias.items(), key=lambda item: item[1], reverse=True))
-    model_bias_HTML = bloombergViz(bias_stats_dict['model_bias'])
     per_attrib_bias_HTML_stereo = ""
     num_atts = 0
@@ -363,7 +365,7 @@ def startBiasTest(test_sentences_df, gr1, gr2, att1, att2, model_name, progress=
     num_atts = 0
     for att, score in attrib_by_score.items():
         if att in attributes_g2:
-            per_attrib_bias_HTML_antistereo += att_bloombergViz(att, 1.0 - score, att_freqs[att])
             num_atts += 1
             if num_atts >= 8:
                 break
@@ -403,7 +405,7 @@ def startBiasTest(test_sentences_df, gr1, gr2, att1, att2, model_name, progress=
             gr.update(visible=tabs[0]), # content tab/column 1
             gr.update(visible=tabs[1]), # content tab/column 2
             gr.update(visible=tabs[2]), # content tab/column 3
-            gr.update(value=model_bias_HTML), # per model bias score
             gr.update(value=per_attrib_bias_HTML_stereo), # per attribute bias score stereotyped
             gr.update(value=per_attrib_bias_HTML_antistereo), # per attribute bias score antistereotyped
             gr.update(value=score_templates_df, visible=True), # Pairs with scores
@@ -580,21 +582,21 @@ with gr.Blocks(theme=soft, title="Social Bias Testing in Language Models",
                 gr.Markdown("### Interpretation")
         with gr.Row():
             with gr.Column(scale=2):
-                gr.Markdown("**Legend**")
-                gr.HTML("<div style='height:20px;width:20px;background-color:#555;display:inline-block'></div>: Group 1 attribute <br><div style='height:20px;width:20px;background-color:#999;display:inline-block'></div>: Group 2 attribute")
                 lbl_model_bias = gr.Markdown("**Model Bias** - % stereotyped choices (↑ more bias)")
-                model_bias_html = gr.HTML()
-                # model_bias_label = gr.Label(num_top_classes=1, label="% stereotyped choices (↑ more bias)",
-                #                             elem_id="res_label",
-                #                             show_label=False)
                 lbl_attrib_bias = gr.Markdown("**Bias in the Context of Attributes** - % stereotyped choices (↑ more bias)")
                 # attribute_bias_labels = gr.Label(num_top_classes=8, label="Per attribute: % stereotyped choices (↑ more bias)",
                 #                                 elem_id="per_attrib_label_elem",
                 #                                 container=True,
                 #                                 min_width=900,
                 #                                 show_label=False)
                 with gr.Row():
-                    with gr.Column(variant="panel"):
                         gr.Markdown("#### Attribute Group 1")
                         attribute_bias_html_stereo = gr.HTML()
                     with gr.Column(variant="compact"):
@@ -635,7 +637,7 @@ with gr.Blocks(theme=soft, title="Social Bias Testing in Language Models",
     # Test bias
     bias_btn.click(fn=startBiasTest,
                    inputs=[test_sentences,group1,group2,att1,att2,tested_model_name],
-                   outputs=[bar_progress, s1_btn, s2_btn, s3_btn, tab1, tab2, tab3, model_bias_html, attribute_bias_html_stereo, attribute_bias_html_antistereo,
                             test_pairs, interpretation_msg, group1_fixed2, group2_fixed2, att1_fixed2, att2_fixed2]
                    )

             gr.update(value=', '.join(a2))  # att2_fixed
         )
+def bloombergViz(val, numblocks=10, flip=False):
     percent = round(val * 100)
     percentStr = f"{percent}"
     filled = "<div style='height:20px;width:20px;background-color:#555;display:inline-block'></div> "
     unfilled = "<div style='height:20px;width:20px;background-color:#999;display:inline-block'></div> "
     numFilled = round((percent/100) * numblocks)
     numUnFilled = numblocks - numFilled
+    if flip:
+        return numFilled * unfilled + numUnFilled * filled;
     return numFilled * filled + numUnFilled * unfilled
+def att_bloombergViz(att, val, numblocks, flip=False):
+    viz = bloombergViz(val, numblocks, flip)
     attHTML = f"<div style='border-style:solid;border-color:#999;border-radius:12px'>{att}: {round(val*100)}%<br>{viz}</div><br>"
     return attHTML
     per_attrib_bias = bias_stats_dict['per_attribute']
     attrib_by_score = dict(sorted(per_attrib_bias.items(), key=lambda item: item[1], reverse=True))
+    # model_bias_HTML = bloombergViz(bias_stats_dict['model_bias'])
     per_attrib_bias_HTML_stereo = ""
     num_atts = 0
     num_atts = 0
     for att, score in attrib_by_score.items():
         if att in attributes_g2:
+            per_attrib_bias_HTML_antistereo += att_bloombergViz(att, score, att_freqs[att], True)
             num_atts += 1
             if num_atts >= 8:
                 break
             gr.update(visible=tabs[0]), # content tab/column 1
             gr.update(visible=tabs[1]), # content tab/column 2
             gr.update(visible=tabs[2]), # content tab/column 3
+            model_bias_dict, # per model bias score
             gr.update(value=per_attrib_bias_HTML_stereo), # per attribute bias score stereotyped
             gr.update(value=per_attrib_bias_HTML_antistereo), # per attribute bias score antistereotyped
             gr.update(value=score_templates_df, visible=True), # Pairs with scores
                 gr.Markdown("### Interpretation")
         with gr.Row():
             with gr.Column(scale=2):
                 lbl_model_bias = gr.Markdown("**Model Bias** - % stereotyped choices (↑ more bias)")
+                # model_bias_html = gr.HTML()
+                model_bias_label = gr.Label(num_top_classes=1, label="% stereotyped choices (↑ more bias)",
+                                            elem_id="res_label",
+                                            show_label=False)
                 lbl_attrib_bias = gr.Markdown("**Bias in the Context of Attributes** - % stereotyped choices (↑ more bias)")
+                gr.Markdown("**Legend**")
+                gr.HTML("<div style='height:20px;width:20px;background-color:#555;display:inline-block'></div> : Group 1 attribute <br><div style='height:20px;width:20px;background-color:#999;display:inline-block'></div> : Group 2 attribute")
                 # attribute_bias_labels = gr.Label(num_top_classes=8, label="Per attribute: % stereotyped choices (↑ more bias)",
                 #                                 elem_id="per_attrib_label_elem",
                 #                                 container=True,
                 #                                 min_width=900,
                 #                                 show_label=False)
                 with gr.Row():
+                    with gr.Column(variant="compact"):
                         gr.Markdown("#### Attribute Group 1")
                         attribute_bias_html_stereo = gr.HTML()
                     with gr.Column(variant="compact"):
     # Test bias
     bias_btn.click(fn=startBiasTest,
                    inputs=[test_sentences,group1,group2,att1,att2,tested_model_name],
+                   outputs=[bar_progress, s1_btn, s2_btn, s3_btn, tab1, tab2, tab3, model_bias_label, attribute_bias_html_stereo, attribute_bias_html_antistereo,
                             test_pairs, interpretation_msg, group1_fixed2, group2_fixed2, att1_fixed2, att2_fixed2]
                    )