Spaces:

jedick
/

AI4citations

Running on Zero

App Files Files Community

jedick committed on May 31

Commit

7879fc7

1 Parent(s): 0eb9d15

Remove barplot

Browse files

Files changed (1) hide show

app.py +64 -142

app.py CHANGED Viewed

@@ -50,28 +50,6 @@ if gr.NO_RELOAD:
         )
-def prediction_to_df(prediction=None):
-    """
-    Convert prediction text to DataFrame for barplot
-    """
-    if prediction is None or prediction == "":
-        # Show an empty plot for app initialization or auto-reload
-        prediction = {"SUPPORT": 0, "NEI": 0, "REFUTE": 0}
-    elif "Model" in prediction:
-        # Show full-height bars when the model is changed
-        prediction = {"SUPPORT": 1, "NEI": 1, "REFUTE": 1}
-    else:
-        # Convert predictions text to dictionary
-        prediction = eval(prediction)
-        # Use custom order for labels (pipe() returns labels in descending order of softmax score)
-        labels = ["SUPPORT", "NEI", "REFUTE"]
-        prediction = {k: prediction[k] for k in labels}
-    # Convert dictionary to DataFrame with one column (Probability)
-    df = pd.DataFrame.from_dict(prediction, orient="index", columns=["Probability"])
-    # Move the index to the Class column
-    return df.reset_index(names="Class")
 # Setup theme without background image
 my_theme = gr.Theme.from_hub("NoCrypt/miku")
 my_theme.set(body_background_fill="#FFFFFF", body_background_fill_dark="#000000")
@@ -127,22 +105,44 @@ with gr.Blocks(theme=my_theme, head=font_awesome_html) as demo:
                         completion_tokens = gr.Number(
                             label="Completion tokens", visible=False
                         )
         with gr.Column(scale=2):
-            # Keep the prediction textbox hidden
-            with gr.Accordion(visible=False):
-                prediction = gr.Textbox(label="Prediction")
-            barplot = gr.BarPlot(
-                prediction_to_df,
-                x="Class",
-                y="Probability",
-                color="Class",
-                color_map={"SUPPORT": "green", "NEI": "#888888", "REFUTE": "#FF8888"},
-                inputs=prediction,
-                y_lim=([0, 1]),
-                visible=False,
-            )
-            label = gr.Label(label="Prediction")
             with gr.Accordion("Feedback"):
                 gr.Markdown(
                     "*Provide the correct label to help improve this app*<br>**NOTE:** The claim and evidence will also be saved"
@@ -189,71 +189,19 @@ with gr.Blocks(theme=my_theme, head=font_awesome_html) as demo:
                         "label"
                     ].tolist(),
                 )
-    with gr.Row():
-        with gr.Column(scale=3):
-            with gr.Row():
-                with gr.Column(scale=1):
-                    gr.Markdown(
-                        """
-                    ### Usage:
-                    - Input a **Claim**, then:
-                        - Upload a PDF and click **Get Evidence** OR
-                        - Input **Evidence** statements yourself
-                    """
-                    )
-                with gr.Column(scale=2):
-                    gr.Markdown(
-                        """
-                    ### To make the prediction:
-                    - Hit 'Enter' in the **Claim** text box OR
-                    - Hit 'Shift-Enter' in the **Evidence** text box
-                    _The prediction is also made after clicking **Get Evidence**_
-                    """
-                    )
-        with gr.Column(scale=2):
-            with gr.Accordion("Settings", open=False):
-                # Create dropdown menu to select the model
-                model = gr.Dropdown(
-                    choices=[
-                        # TODO: For bert-base-uncased, how can we set num_labels = 2 in HF pipeline?
-                        # (num_labels is available in AutoModelForSequenceClassification.from_pretrained)
-                        # "bert-base-uncased",
-                        "MoritzLaurer/DeBERTa-v3-base-mnli-fever-anli",
-                        "jedick/DeBERTa-v3-base-mnli-fever-anli-scifact-citint",
-                    ],
-                    value=MODEL_NAME,
-                    label="Model",
-                )
-                radio = gr.Radio(
-                    ["label", "barplot"], value="label", label="Prediction"
-                )
-            with gr.Accordion("Sources", open=False):
-                gr.Markdown(
-                    """
-                #### *Capstone project*
-                - <i class="fa-brands fa-github"></i> [jedick/MLE-capstone-project](https://github.com/jedick/MLE-capstone-project) (project repo)
-                - <i class="fa-brands fa-github"></i> [jedick/AI4citations](https://github.com/jedick/AI4citations) (app repo)
-                #### *Text Classification*
-                - <img src="https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.svg" style="height: 1.2em; display: inline-block;"> [jedick/DeBERTa-v3-base-mnli-fever-anli-scifact-citint](https://huggingface.co/jedick/DeBERTa-v3-base-mnli-fever-anli-scifact-citint) (fine-tuned)
-                - <img src="https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.svg" style="height: 1.2em; display: inline-block;"> [MoritzLaurer/DeBERTa-v3-base-mnli-fever-anli](https://huggingface.co/MoritzLaurer/DeBERTa-v3-base-mnli-fever-anli) (base)
-                #### *Evidence Retrieval*
-                - <i class="fa-brands fa-github"></i> [xhluca/bm25s](https://github.com/xhluca/bm25s) (BM25S)
-                - <img src="https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.svg" style="height: 1.2em; display: inline-block;"> [deepset/deberta-v3-large-squad2](https://huggingface.co/deepset/deberta-v3-large-squad2) (DeBERTa)
-                - <img src="https://upload.wikimedia.org/wikipedia/commons/4/4d/OpenAI_Logo.svg" style="height: 1.2em; display: inline-block;"> [gpt-4o-mini-2024-07-18](https://platform.openai.com/docs/pricing) (GPT)
-                #### *Datasets for fine-tuning*
-                - <i class="fa-brands fa-github"></i> [allenai/SciFact](https://github.com/allenai/scifact) (SciFact)
-                - <i class="fa-brands fa-github"></i> [ScienceNLP-Lab/Citation-Integrity](https://github.com/ScienceNLP-Lab/Citation-Integrity) (CitInt)
-                #### *Other sources*
-                - <img src="https://plos.org/wp-content/uploads/2020/01/logo-color-blue.svg" style="height: 1.4em; display: inline-block;"> [Medicine](https://doi.org/10.1371/journal.pmed.0030197), <i class="fa-brands fa-wikipedia-w"></i> [CRISPR](https://en.wikipedia.org/wiki/CRISPR) (evidence retrieval examples)
-                - <img src="https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.svg" style="height: 1.2em; display: inline-block;"> [nyu-mll/multi_nli](https://huggingface.co/datasets/nyu-mll/multi_nli/viewer/default/train?row=37&views%5B%5D=train) (MNLI example)
-                - <img src="https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.svg" style="height: 1.2em; display: inline-block;"> [NoCrypt/miku](https://huggingface.co/spaces/NoCrypt/miku) (theme)
-                """
-                )
     # Functions
@@ -284,8 +232,7 @@ with gr.Blocks(theme=my_theme, head=font_awesome_html) as demo:
             ("REFUTE" if k in ["REFUTE", "contradiction"] else k): v
             for k, v in prediction.items()
         }
-        # Return two instances of the prediction to send to different Gradio components
-        return prediction, prediction
     def select_model(model_name):
         """
@@ -298,15 +245,6 @@ with gr.Blocks(theme=my_theme, head=font_awesome_html) as demo:
             model=MODEL_NAME,
         )
-    def change_visualization(choice):
-        if choice == "barplot":
-            barplot = gr.update(visible=True)
-            label = gr.update(visible=False)
-        elif choice == "label":
-            barplot = gr.update(visible=False)
-            label = gr.update(visible=True)
-        return barplot, label
     # From gradio/client/python/gradio_client/utils.py
     def is_http_url_like(possible_url) -> bool:
         """
@@ -354,13 +292,13 @@ with gr.Blocks(theme=my_theme, head=font_awesome_html) as demo:
             return f"Unknown retrieval method: {method}"
     def append_feedback(
-        claim: str, evidence: str, model: str, label: str, user_label: str
     ) -> None:
         """
         Append input/outputs and user feedback to a JSON Lines file.
         """
         # Get the first label (prediction with highest probability)
-        prediction = next(iter(label))
         with USER_FEEDBACK_PATH.open("a") as f:
             f.write(
                 json.dumps(
@@ -368,7 +306,7 @@ with gr.Blocks(theme=my_theme, head=font_awesome_html) as demo:
                         "claim": claim,
                         "evidence": evidence,
                         "model": model,
-                        "prediction": prediction,
                         "user_label": user_label,
                         "datetime": datetime.now().isoformat(),
                     }
@@ -435,7 +373,7 @@ with gr.Blocks(theme=my_theme, head=font_awesome_html) as demo:
         triggers=[claim.submit, evidence.submit],
         fn=query_model,
         inputs=[claim, evidence],
-        outputs=[prediction, label],
     )
     # Get evidence from PDF and run the model
@@ -447,7 +385,7 @@ with gr.Blocks(theme=my_theme, head=font_awesome_html) as demo:
     ).then(
         fn=query_model,
         inputs=[claim, evidence],
-        outputs=[prediction, label],
         api_name=False,
     )
@@ -461,7 +399,7 @@ with gr.Blocks(theme=my_theme, head=font_awesome_html) as demo:
     ).then(
         fn=query_model,
         inputs=[claim, evidence],
-        outputs=[prediction, label],
         api_name=False,
     )
@@ -475,7 +413,7 @@ with gr.Blocks(theme=my_theme, head=font_awesome_html) as demo:
     ).then(
         fn=query_model,
         inputs=[claim, evidence],
-        outputs=[prediction, label],
         api_name=False,
     )
@@ -489,7 +427,7 @@ with gr.Blocks(theme=my_theme, head=font_awesome_html) as demo:
     ).then(
         fn=query_model,
         inputs=[claim, evidence],
-        outputs=[prediction, label],
         api_name=False,
     )
@@ -508,53 +446,37 @@ with gr.Blocks(theme=my_theme, head=font_awesome_html) as demo:
     ).then(
         fn=query_model,
         inputs=[claim, evidence],
-        outputs=[prediction, label],
-        api_name=False,
-    )
-    # Change visualization
-    radio.change(
-        fn=change_visualization,
-        inputs=radio,
-        outputs=[barplot, label],
-        api_name=False,
-    )
-    # Clear the previous predictions when the model is changed
-    gr.on(
-        triggers=[model.select],
-        fn=lambda: "Model changed! Waiting for updated predictions...",
-        outputs=[prediction],
         api_name=False,
     )
-    # Change the model the update the predictions
     model.change(
         fn=select_model,
         inputs=model,
     ).then(
         fn=query_model,
         inputs=[claim, evidence],
-        outputs=[prediction, label],
         api_name=False,
     )
     # Log user feedback when button is clicked
     flag_support.click(
         fn=save_feedback_support,
-        inputs=[claim, evidence, model, label],
         outputs=None,
         api_name=False,
     )
     flag_nei.click(
         fn=save_feedback_nei,
-        inputs=[claim, evidence, model, label],
         outputs=None,
         api_name=False,
     )
     flag_refute.click(
         fn=save_feedback_refute,
-        inputs=[claim, evidence, model, label],
         outputs=None,
         api_name=False,
     )

         )
 # Setup theme without background image
 my_theme = gr.Theme.from_hub("NoCrypt/miku")
 my_theme.set(body_background_fill="#FFFFFF", body_background_fill_dark="#000000")
                         completion_tokens = gr.Number(
                             label="Completion tokens", visible=False
                         )
+                    gr.Markdown(
+                        """
+                    ### App Usage:
+                    - Input a **Claim**, then:
+                        - Upload a PDF and click **Get Evidence** OR
+                        - Input **Evidence** statements yourself
+                    - Make the **Prediction**:
+                        - Hit 'Enter' in the **Claim** text box OR
+                        - Hit 'Shift-Enter' in the **Evidence** text box OR
+                        - Click **Get Evidence**
+                    """
+                    )
+            with gr.Accordion("Sources", open=False):
+                gr.Markdown(
+                    """
+                #### *Capstone project*
+                - <i class="fa-brands fa-github"></i> [jedick/MLE-capstone-project](https://github.com/jedick/MLE-capstone-project) (project repo)
+                - <i class="fa-brands fa-github"></i> [jedick/AI4citations](https://github.com/jedick/AI4citations) (app repo)
+                #### *Text Classification*
+                - <img src="https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.svg" style="height: 1.2em; display: inline-block;"> [jedick/DeBERTa-v3-base-mnli-fever-anli-scifact-citint](https://huggingface.co/jedick/DeBERTa-v3-base-mnli-fever-anli-scifact-citint) (fine-tuned)
+                - <img src="https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.svg" style="height: 1.2em; display: inline-block;"> [MoritzLaurer/DeBERTa-v3-base-mnli-fever-anli](https://huggingface.co/MoritzLaurer/DeBERTa-v3-base-mnli-fever-anli) (base)
+                #### *Evidence Retrieval*
+                - <i class="fa-brands fa-github"></i> [xhluca/bm25s](https://github.com/xhluca/bm25s) (BM25S)
+                - <img src="https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.svg" style="height: 1.2em; display: inline-block;"> [deepset/deberta-v3-large-squad2](https://huggingface.co/deepset/deberta-v3-large-squad2) (DeBERTa)
+                - <img src="https://upload.wikimedia.org/wikipedia/commons/4/4d/OpenAI_Logo.svg" style="height: 1.2em; display: inline-block;"> [gpt-4o-mini-2024-07-18](https://platform.openai.com/docs/pricing) (GPT)
+                #### *Datasets for fine-tuning*
+                - <i class="fa-brands fa-github"></i> [allenai/SciFact](https://github.com/allenai/scifact) (SciFact)
+                - <i class="fa-brands fa-github"></i> [ScienceNLP-Lab/Citation-Integrity](https://github.com/ScienceNLP-Lab/Citation-Integrity) (CitInt)
+                #### *Other sources*
+                - <img src="https://plos.org/wp-content/uploads/2020/01/logo-color-blue.svg" style="height: 1.4em; display: inline-block;"> [Medicine](https://doi.org/10.1371/journal.pmed.0030197), <i class="fa-brands fa-wikipedia-w"></i> [CRISPR](https://en.wikipedia.org/wiki/CRISPR) (evidence retrieval examples)
+                - <img src="https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.svg" style="height: 1.2em; display: inline-block;"> [nyu-mll/multi_nli](https://huggingface.co/datasets/nyu-mll/multi_nli/viewer/default/train?row=37&views%5B%5D=train) (MNLI example)
+                - <img src="https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.svg" style="height: 1.2em; display: inline-block;"> [NoCrypt/miku](https://huggingface.co/spaces/NoCrypt/miku) (theme)
+                """
+                )
         with gr.Column(scale=2):
+            prediction = gr.Label(label="Prediction")
             with gr.Accordion("Feedback"):
                 gr.Markdown(
                     "*Provide the correct label to help improve this app*<br>**NOTE:** The claim and evidence will also be saved"
                         "label"
                     ].tolist(),
                 )
+            # Create dropdown menu to select the model
+            model = gr.Dropdown(
+                choices=[
+                    # TODO: For bert-base-uncased, how can we set num_labels = 2 in HF pipeline?
+                    # (num_labels is available in AutoModelForSequenceClassification.from_pretrained)
+                    # "bert-base-uncased",
+                    "MoritzLaurer/DeBERTa-v3-base-mnli-fever-anli",
+                    "jedick/DeBERTa-v3-base-mnli-fever-anli-scifact-citint",
+                ],
+                value=MODEL_NAME,
+                label="Model",
+                info="Text classification model used for claim verification",
+            )
     # Functions
             ("REFUTE" if k in ["REFUTE", "contradiction"] else k): v
             for k, v in prediction.items()
         }
+        return prediction
     def select_model(model_name):
         """
             model=MODEL_NAME,
         )
     # From gradio/client/python/gradio_client/utils.py
     def is_http_url_like(possible_url) -> bool:
         """
             return f"Unknown retrieval method: {method}"
     def append_feedback(
+        claim: str, evidence: str, model: str, prediction: str, user_label: str
     ) -> None:
         """
         Append input/outputs and user feedback to a JSON Lines file.
         """
         # Get the first label (prediction with highest probability)
+        _prediction = next(iter(prediction))
         with USER_FEEDBACK_PATH.open("a") as f:
             f.write(
                 json.dumps(
                         "claim": claim,
                         "evidence": evidence,
                         "model": model,
+                        "prediction": _prediction,
                         "user_label": user_label,
                         "datetime": datetime.now().isoformat(),
                     }
         triggers=[claim.submit, evidence.submit],
         fn=query_model,
         inputs=[claim, evidence],
+        outputs=prediction,
     )
     # Get evidence from PDF and run the model
     ).then(
         fn=query_model,
         inputs=[claim, evidence],
+        outputs=prediction,
         api_name=False,
     )
     ).then(
         fn=query_model,
         inputs=[claim, evidence],
+        outputs=prediction,
         api_name=False,
     )
     ).then(
         fn=query_model,
         inputs=[claim, evidence],
+        outputs=prediction,
         api_name=False,
     )
     ).then(
         fn=query_model,
         inputs=[claim, evidence],
+        outputs=prediction,
         api_name=False,
     )
     ).then(
         fn=query_model,
         inputs=[claim, evidence],
+        outputs=prediction,
         api_name=False,
     )
+    # Change the model then update the predictions
     model.change(
         fn=select_model,
         inputs=model,
     ).then(
         fn=query_model,
         inputs=[claim, evidence],
+        outputs=prediction,
         api_name=False,
     )
     # Log user feedback when button is clicked
     flag_support.click(
         fn=save_feedback_support,
+        inputs=[claim, evidence, model, prediction],
         outputs=None,
         api_name=False,
     )
     flag_nei.click(
         fn=save_feedback_nei,
+        inputs=[claim, evidence, model, prediction],
         outputs=None,
         api_name=False,
     )
     flag_refute.click(
         fn=save_feedback_refute,
+        inputs=[claim, evidence, model, prediction],
         outputs=None,
         api_name=False,
     )