emilylearning committed
Commit 12781b6
Parent: c494a1d

fix add-own-model bug (less nice, but it's late); updated markdown

Files changed (1):
  1. app.py (+26, -30)
app.py CHANGED
@@ -1,4 +1,3 @@
-# Model card: https://huggingface.co/emilylearning/selection-induced-collider-bias
 # %%
 import gradio as gr
 import matplotlib.pyplot as plt
@@ -8,18 +7,9 @@ import random
 from matplotlib.ticker import MaxNLocator
 from transformers import pipeline

+MODEL_NAMES = ["bert-base-uncased", "roberta-base", "bert-large-uncased", "roberta-large"]
 OWN_MODEL_NAME = 'add-a-model'

-MODEL_NAME_DICT = {
-    "roberta-large": "RoBERTa-large",
-    "bert-large-uncased": "BERT-large",
-    "roberta-base": "RoBERTa-base",
-    "bert-base-uncased": "BERT-base",
-    "olm/olm-roberta-base-oct-2022": "OLM_RoBERTa-base",
-    OWN_MODEL_NAME: "Your model's"
-}
-MODEL_NAMES = list(MODEL_NAME_DICT.keys())
-
 DECIMAL_PLACES = 1
 EPS = 1e-5 # to avoid /0 errors

@@ -145,12 +135,15 @@ GENDERED_LIST = [

 # %%
 # Fire up the models
-models = {m : pipeline("fill-mask", model=m) for m in MODEL_NAMES if m != OWN_MODEL_NAME}
+models = dict()
+
+for bert_like in MODEL_NAMES:
+    models[bert_like] = pipeline("fill-mask", model=bert_like)

 # %%


-def get_gendered_tokens():
+def get_gendered_token_ids():
     male_gendered_tokens = [list[0] for list in GENDERED_LIST]
     female_gendered_tokens = [list[1] for list in GENDERED_LIST]

@@ -177,7 +170,7 @@ def get_avg_prob_from_pipeline_outputs(mask_filled_text, gendered_token, num_preds):
 # %%


-def get_figure(df, gender, n_fit=1):
+def get_figure(df, gender, n_fit=1, model_name=None):
     df = df.set_index('x-axis')
     cols = df.columns
     xs = list(range(len(df)))
@@ -205,7 +198,7 @@ def get_figure(df, gender, n_fit=1):
     ax.axis('tight')
     ax.set_xlabel("Value injected into input text")
     ax.set_title(
-        f"Probability of predicting {gender} pronouns.")
+        f"Probability of predicting {gender} pronouns on {model_name}.")
     ax.set_ylabel(f"Softmax prob for pronouns")
     ax.xaxis.set_major_locator(MaxNLocator(6))
     ax.tick_params(axis='x', labelrotation=5)
@@ -227,6 +220,7 @@ def predict_gender_pronouns(
     """
     if model_name not in MODEL_NAMES:
         model = pipeline("fill-mask", model=own_model_name)
+        model_name = OWN_MODEL_NAME
     else:
         model = models[model_name]

@@ -234,7 +228,7 @@ def predict_gender_pronouns(

     indie_vars_list = indie_vars.split(',')

-    male_gendered_tokens, female_gendered_tokens = get_gendered_tokens()
+    male_gendered_tokens, female_gendered_tokens = get_gendered_token_ids()

     text_segments, num_preds = prepare_text_for_masking(
         input_text, mask_token, male_gendered_tokens + female_gendered_tokens, split_key)
@@ -276,9 +270,9 @@ def predict_gender_pronouns(
     results_df['female_pronouns'] = female_pronoun_preds
     results_df['male_pronouns'] = male_pronoun_preds
     female_fig = get_figure(results_df.drop(
-        'male_pronouns', axis=1), 'female', n_fit,)
+        'male_pronouns', axis=1), 'female', n_fit, model_name)
     male_fig = get_figure(results_df.drop(
-        'female_pronouns', axis=1), 'male', n_fit,)
+        'female_pronouns', axis=1), 'male', n_fit, model_name)
     display_text = f"{random.choice(indie_vars_list)}".join(text_segments)

     return (
@@ -293,18 +287,17 @@ def predict_gender_pronouns(
 title = "Causing Gender Pronouns"
 description = """
 ## Intro
-
 """


 date_example = [
-    MODEL_NAMES[4],
+    MODEL_NAMES[1],
     '',
     ', '.join(DATES),
     'DATE',
     "False",
     1,
-    'In DATE, she became an adult.'
+    'She was a teenager in DATE.'
 ]


@@ -315,7 +308,7 @@ place_example = [
     'PLACE',
     "False",
     1,
-    'She became a teen in PLACE.'
+    'She became an adult in PLACE.'
 ]


@@ -362,7 +355,9 @@ with demo:
     gr.Markdown("# Spurious Correlation Evaluation for Pre-trained LLMs")
     gr.Markdown("Find spurious correlations between seemingly independent variables (for example between `gender` and `time`) in almost any BERT-like LLM on Hugging Face, below.")

-    gr.Markdown("See why this happens in ['Selection Induced Collider Bias: A Gender Pronoun Uncertainty Case Study'](https://arxiv.org/abs/2210.00131).")
+    # gr.Markdown("Note: If there is an issue with the rendering of the results taking longer than expected (more than 10s of seconds), there may be an unexpected issue effecting the hosting. If so, please see this [backup colab notebook](https://colab.research.google.com/drive/1A3a9cy9fERaxkuoX8YNTFhLlhRt_cxMm?usp=sharing).")
+
+
     gr.Markdown("## Instructions for this Demo")
     gr.Markdown("1) Click on one of the examples below (where we sweep through a spectrum of `places`, `dates` and `subreddits`) to pre-populate the input fields.")
     gr.Markdown("2) Check out the pre-populated fields as you scroll down to the ['Hit Submit...'] button!")
@@ -401,7 +396,8 @@ with demo:

     with gr.Row():
         model_name = gr.Radio(
-            MODEL_NAMES,
+            MODEL_NAMES + [OWN_MODEL_NAME],
+            type="value",
             label="B) BERT-like model.",
         )
         own_model_name = gr.Textbox(
@@ -417,6 +413,7 @@ with demo:
         to_normalize = gr.Dropdown(
             ["False", "True"],
             label="D) Normalize model's predictions to only the gendered ones?",
+            type="index",
         )
         place_holder = gr.Textbox(
             label="E) Special token place-holder",
@@ -424,6 +421,7 @@ with demo:
         n_fit = gr.Dropdown(
             list(range(1, 5)),
             label="F) Degree of polynomial fit",
+            type="value",
         )

     gr.Markdown(
@@ -436,15 +434,16 @@ with demo:
     )

     gr.Markdown("## Outputs!")
+    #gr.Markdown("Scroll down and 'Hit Submit'!")
     with gr.Row():
         btn = gr.Button("Hit submit to generate predictions!")

     with gr.Row():
         sample_text = gr.Textbox(
-            label="Output text: Sample of text fed to model")
+            type="auto", label="Output text: Sample of text fed to model")
     with gr.Row():
-        female_fig = gr.Plot()
-        male_fig = gr.Plot()
+        female_fig = gr.Plot(type="auto")
+        male_fig = gr.Plot(type="auto")
     with gr.Row():
         df = gr.Dataframe(
             show_label=True,
@@ -471,6 +470,3 @@ with demo:


 demo.launch(debug=True)
-
-
-# %%
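
For quick reference, a minimal sketch of the add-own-model fallback this commit fixes: the preset MODEL_NAMES pipelines stay pre-loaded, and any other name typed into the 'add-a-model' textbox is loaded on demand as its own fill-mask pipeline. The get_model helper and the "distilbert-base-uncased" id below are illustrative assumptions, not part of app.py.

from transformers import pipeline

MODEL_NAMES = ["bert-base-uncased", "roberta-base", "bert-large-uncased", "roberta-large"]
OWN_MODEL_NAME = 'add-a-model'

# Preset models are loaded once at startup, as in app.py.
models = {name: pipeline("fill-mask", model=name) for name in MODEL_NAMES}

def get_model(model_name, own_model_name):
    # Hypothetical helper mirroring the fixed branch in predict_gender_pronouns:
    # fall back to whatever Hub id the user typed, e.g. "distilbert-base-uncased".
    if model_name not in MODEL_NAMES:
        model = pipeline("fill-mask", model=own_model_name)
        model_name = OWN_MODEL_NAME  # downstream plot titles then use the placeholder name
    else:
        model = models[model_name]
    return model, model_name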