Spaces:

emilylearning
/

llm_uncertainty

Running

App Files Files Community

Emily McMilin committed on Sep 7, 2022

Commit

d4b589f

1 Parent(s): 55392f1

fix bug causing add-own-model to fail

Browse files

Files changed (1) hide show

app.py +16 -18

app.py CHANGED Viewed

@@ -1,5 +1,4 @@
 # %%
-# from http.client import TEMPORARY_REDIRECT
 import gradio as gr
 import matplotlib.pyplot as plt
 import numpy as np
@@ -9,18 +8,19 @@ from matplotlib.ticker import MaxNLocator
 from transformers import pipeline
 from winogender_sentences import get_sentences
 MODEL_NAME_DICT = {
     "roberta-large": "RoBERTa-large",
     "bert-large-uncased": "BERT-large",
     "roberta-base": "RoBERTa-base",
     "bert-base-uncased": "BERT-base",
 }
 MODEL_NAMES = list(MODEL_NAME_DICT.keys())
-OWN_MODEL_NAME = 'add-a-model'
-PICK_YOUR_OWN_LABEL = 'pick-your-own'
 DECIMAL_PLACES = 1
 EPS = 1e-5  # to avoid /0 errors
 NUM_PTS_TO_AVERAGE = 2
@@ -33,7 +33,6 @@ NUM_PTS = 30
 DATES = np.linspace(START_YEAR, STOP_YEAR, NUM_PTS).astype(int).tolist()
 DATES = [f'{d}' for d in DATES]
 GENDERED_LIST = [
     ['he', 'she'],
     ['him', 'her'],
@@ -52,10 +51,7 @@ GENDERED_LIST = [
 # %%
 # Fire up the models
-models = dict()
-for bert_like in MODEL_NAMES:
-    models[bert_like] = pipeline("fill-mask", model=bert_like)
 # %%
 # Get the winogender sentences
@@ -64,7 +60,6 @@ occs = sorted(list({sentence_id.split('_')[0]
                     for sentence_id in winogender_sentences}))
 # %%
 def get_gendered_token_ids():
     male_gendered_tokens = [list[0] for list in GENDERED_LIST]
     female_gendered_tokens = [list[1] for list in GENDERED_LIST]
@@ -112,8 +107,7 @@ def get_figure(df, model_name, occ):
     ax.axis('tight')
     ax.set_xlabel("Sentence number")
     ax.set_ylabel("Uncertainty metric")
-    ax.set_title(
-        f"{MODEL_NAME_DICT[model_name]} gender pronoun uncertainty in '{occ}' sentences")
     return fig
@@ -137,7 +131,7 @@ def predict_gender_pronouns(
     if model_name is None or model_name == '':
         model_name = MODEL_NAMES[0]
         model = models[model_name]
-    elif model_name not in MODEL_NAMES:
         model = pipeline("fill-mask", model=own_model_name)
     else:
         model = models[model_name]
@@ -200,11 +194,12 @@ def predict_gender_pronouns(
     uncertain_df = uncertain_df.reset_index().rename(
         columns={'index': 'Sentence number'})
     return (
         uncertain_df,
         get_figure(uncertain_df, model_name, occ),
     )
-# %%
 demo = gr.Blocks()
@@ -227,13 +222,13 @@ with demo:
     with gr.Row():
         model_name = gr.Radio(
-            MODEL_NAMES + [OWN_MODEL_NAME],
             type="value",
-            label="Pick a preloaded BERT-like model for uncertainty evaluation (note: BERT-base performance least consistant)...",
         )
         own_model_name = gr.Textbox(
             label=f"...Or, if you selected an '{OWN_MODEL_NAME}' model, put any Hugging Face pipeline model name \
-            (that supports the [fill-mask task](https://huggingface.co/models?pipeline_tag=fill-mask)) here.",
         )
     with gr.Row():
@@ -269,12 +264,15 @@ with demo:
         female_fig = gr.Plot(type="auto")
     with gr.Row():
         female_df = gr.Dataframe()
     uncertain_btn.click(
         fn=predict_gender_pronouns,
         inputs=[model_name, own_model_name, input_texts, occ_box],
         # inputs=date_example,
-        outputs=[female_df, female_fig]
     )
 demo.launch(debug=True)

 # %%
 import gradio as gr
 import matplotlib.pyplot as plt
 import numpy as np
 from transformers import pipeline
 from winogender_sentences import get_sentences
+OWN_MODEL_NAME = 'add-a-model'
+PICK_YOUR_OWN_LABEL = 'pick-your-own'
 MODEL_NAME_DICT = {
     "roberta-large": "RoBERTa-large",
     "bert-large-uncased": "BERT-large",
     "roberta-base": "RoBERTa-base",
     "bert-base-uncased": "BERT-base",
+    OWN_MODEL_NAME: "Your model's"
 }
 MODEL_NAMES = list(MODEL_NAME_DICT.keys())
 DECIMAL_PLACES = 1
 EPS = 1e-5  # to avoid /0 errors
 NUM_PTS_TO_AVERAGE = 2
 DATES = np.linspace(START_YEAR, STOP_YEAR, NUM_PTS).astype(int).tolist()
 DATES = [f'{d}' for d in DATES]
 GENDERED_LIST = [
     ['he', 'she'],
     ['him', 'her'],
 # %%
 # Fire up the models
+models = {m : pipeline("fill-mask", model=m) for m in MODEL_NAMES if m != OWN_MODEL_NAME}
 # %%
 # Get the winogender sentences
                     for sentence_id in winogender_sentences}))
 # %%
 def get_gendered_token_ids():
     male_gendered_tokens = [list[0] for list in GENDERED_LIST]
     female_gendered_tokens = [list[1] for list in GENDERED_LIST]
     ax.axis('tight')
     ax.set_xlabel("Sentence number")
     ax.set_ylabel("Uncertainty metric")
+    ax.set_title(f"{MODEL_NAME_DICT[model_name]} gender pronoun uncertainty in '{occ}' sentences")
     return fig
     if model_name is None or model_name == '':
         model_name = MODEL_NAMES[0]
         model = models[model_name]
+    elif model_name == OWN_MODEL_NAME:
         model = pipeline("fill-mask", model=own_model_name)
     else:
         model = models[model_name]
     uncertain_df = uncertain_df.reset_index().rename(
         columns={'index': 'Sentence number'})
     return (
+        target_text,
         uncertain_df,
         get_figure(uncertain_df, model_name, occ),
     )
 demo = gr.Blocks()
     with gr.Row():
         model_name = gr.Radio(
+            MODEL_NAMES,
             type="value",
+            label="Pick a preloaded BERT-like model for uncertainty evaluation (note: BERT-base performance least consistent)...",
         )
         own_model_name = gr.Textbox(
             label=f"...Or, if you selected an '{OWN_MODEL_NAME}' model, put any Hugging Face pipeline model name \
+            (that supports the `fill-mask` task (see list at https://huggingface.co/models?pipeline_tag=fill-mask).",
         )
     with gr.Row():
         female_fig = gr.Plot(type="auto")
     with gr.Row():
         female_df = gr.Dataframe()
+    with gr.Row():
+        display_text = gr.Textbox(
+            type="auto", label="Sample of text fed to model")
     uncertain_btn.click(
         fn=predict_gender_pronouns,
         inputs=[model_name, own_model_name, input_texts, occ_box],
         # inputs=date_example,
+        outputs=[display_text, female_df, female_fig]
     )
 demo.launch(debug=True)