Spaces:

Navyabhat
/

Capstone_Project

Sleeping

App Files Files Community

Navyabhat committed on Jan 28, 2024

Commit

65f2058

verified ·

1 Parent(s): 61da4c8

Update app.py

Browse files

Files changed (1) hide show

app.py +135 -8

app.py CHANGED Viewed

@@ -1,3 +1,111 @@
 import gradio as gr
 from PIL import Image
 from inference.main import MultiModalPhi2
@@ -96,20 +204,39 @@ with gr.Blocks() as demo:
         txt = gr.Textbox(
             scale=4,
             show_label=False,
-            placeholder="Enter text and press enter, or upload an image",
             container=False,
         )
-        btn = gr.UploadButton("📁", file_types=["image", "video", "audio"])
-    txt_msg = txt.submit(add_content, [chatbot, txt, None, None], [chatbot, txt, None, None], queue=False).then(
-        run, [chatbot, txt, None, None], [chatbot, txt, None, None], api_name="bot_response"
     )
-    txt_msg.then(lambda: gr.Textbox(interactive=True), None, [txt], queue=False)
-    file_msg = btn.upload(add_content, [chatbot, None, None, btn], [chatbot, None, None, None], queue=False).then(
-        run, [chatbot, None, None, btn], [chatbot, None, None, None]
     )
     # chatbot.like(print_like_dislike, None, None)
-demo.queue()
 demo.launch()

+import gradio as gr
+from PIL import Image
+from inference.main import MultiModalPhi2
+# Module-level list; nothing in the visible code reads or writes it.
+messages = []
+# Single model wrapper built once at import time and shared by every call to
+# run(). It is configured to execute on the CPU.
+# NOTE(review): temperature / max_new_tokens are presumably generation
+# settings forwarded to the underlying model - confirm in inference.main.
+multimodal_phi2 = MultiModalPhi2(
+    modelname_or_path="Navyabhat/Llava-Phi2",
+    temperature=0.2,
+    max_new_tokens=1024,
+    device="cpu",
+)
+def add_content(chatbot, input_data, input_type) -> gr.Chatbot:
+    textflag, imageflag, audioflag = False, False, False
+    if input_type == "text":
+        chatbot.append((text, None))
+        textflag = True
+    if input_type == "image":
+        chatbot.append(((image,), None))
+        imageflag = True
+    if input_type == "audio":
+        chatbot.append(((audio_mic,), None))
+        audioflag = True
+    # else:
+    #     if audio_upload is not None:
+    #         chatbot.append(((audio_upload,), None))
+    #         audioflag = True
+    if not any([textflag, imageflag, audioflag]):
+        # Raise an error if neither text nor file is provided
+        raise gr.Error("Enter a valid text, image or audio")
+    return chatbot
+def clear_data():
+    return {prompt: None, image: None, audio_upload: None, audio_mic: None, chatbot: []}
+def run(history, text, image, audio_upload, audio_mic):
+    if text in [None, ""]:
+        text = None
+    if audio_upload is not None:
+        audio = audio_upload
+    elif audio_mic is not None:
+        audio = audio_mic
+    else:
+        audio = None
+    print("text", text)
+    print("image", image)
+    print("audio", audio)
+    if image is not None:
+        image = Image.open(image)
+    outputs = multimodal_phi2(text, audio, image)
+    # outputs = ""
+    history.append((None, outputs.title()))
+    return history, None, None, None, None
+# UI layout and event wiring: a chat window, a row holding the text box and an
+# upload button, and handlers meant to push user input into the chat and then
+# ask the model for a reply.
+with gr.Blocks() as demo:
+    # NOTE(review): `os` is used for the avatar path below, but no `import os`
+    # appears among the visible imports - confirm it is imported.
+    chatbot = gr.Chatbot(
+        [],
+        elem_id="chatbot",
+        bubble_full_width=False,
+        avatar_images=(None, (os.path.join(os.path.dirname(__file__), "avatar.png"))),
+    )
+    with gr.Row():
+        txt = gr.Textbox(
+            scale=4,
+            show_label=False,
+            placeholder="Enter text and press enter",
+            container=False,
+        )
+        img_audio = gr.UploadButton("📁", file_types=["image", "audio"], label="Upload Image or Audio")
+    # NOTE(review): add_content takes three parameters (chatbot, input_data,
+    # input_type) but only two inputs are supplied here, and the outputs list
+    # contains the string "text" rather than a component. `bot` is not defined
+    # in the visible code (the visible model handler is `run`) - confirm.
+    txt_msg = txt.submit(add_content, [chatbot, txt], [chatbot, txt, "text"], queue=False).then(
+        bot, chatbot, chatbot, api_name="bot_response"
+    )
+    # NOTE(review): `add_input` is not defined in the visible code (the visible
+    # handler is `add_content`), and "image" in outputs is a string, not a
+    # component - confirm the intended handler and outputs.
+    img_audio_msg = img_audio.upload(add_input, [chatbot, img_audio], [chatbot, "image"], queue=False).then(
+        bot, chatbot, chatbot
+    )
+    # chatbot.like(print_like_dislike, None, None)
+    # NOTE(review): `submit`, `prompt`, `image`, `audio_upload` and `audio_mic`
+    # are not created anywhere in this layout, and add_content is given five
+    # inputs although it accepts three - confirm against the full file.
+    # run() is chained with .success, so it is meant to fire only when
+    # add_content did not raise.
+    submit.click(
+        add_content,
+        inputs=[chatbot, prompt, image, audio_upload, audio_mic],
+        outputs=[chatbot],
+    ).success(
+        run,
+        inputs=[chatbot, prompt, image, audio_upload, audio_mic],
+        outputs=[chatbot, prompt, image, audio_upload, audio_mic],
+    )
+    # NOTE(review): `clear` is not created in this layout either. The outputs
+    # listed here are the same components clear_data() uses as dict keys.
+    clear.click(
+        clear_data,
+        outputs=[prompt, image, audio_upload, audio_mic, chatbot],
+    )
+demo.launch()
 import gradio as gr
 from PIL import Image
 from inference.main import MultiModalPhi2
         txt = gr.Textbox(
             scale=4,
             show_label=False,
+            placeholder="Enter text and press enter",
             container=False,
         )
+        img_audio = gr.UploadButton("📁", file_types=["image", "audio"], label="Upload Image or Audio")
+    with gr.Row():
+                    # Adding a Button
+                    submit = gr.Button()
+                    clear = gr.Button(value="Clear")
+    txt_msg = txt.submit(add_input, [chatbot, txt], [chatbot, txt, "text"], queue=False).then(
+        bot, chatbot, chatbot, api_name="bot_response"
     )
+    img_audio_msg = img_audio.upload(add_input, [chatbot, img_audio], [chatbot, "image"], queue=False).then(
+        bot, chatbot, chatbot
+    )
+    # submit.click(
+    #     add_content,
+    #     inputs=[chatbot, txt, image, audio_upload, audio_mic],
+    #     outputs=[chatbot],
+    # ).success(
+    #     run,
+    #     inputs=[chatbot, txt, image, audio_upload, audio_mic],
+    #     outputs=[chatbot, txt, image, audio_upload, audio_mic],
+    # )
+    clear.click(
+        clear_data,
+        outputs=[prompt, image, audio_upload, audio_mic, chatbot],
     )
     # chatbot.like(print_like_dislike, None, None)
+# demo.queue()
 demo.launch()