Spaces:

adil9858
/

LLAMA_4_Vision

Runtime error

App Files Files Community

adil9858 committed on Apr 7

Commit

9f9b1da

verified ·

1 Parent(s): f7f8133

Create app.py

Browse files

Files changed (1) hide show

app.py +53 -0

app.py ADDED Viewed

	@@ -0,0 +1,53 @@

+import gradio as gr
+from groq import Groq
+import base64
+from PIL import Image
+import io
+# Encode image to base64
+def encode_image_to_base64(image):
+    buffered = io.BytesIO()
+    image.save(buffered, format="JPEG")
+    return base64.b64encode(buffered.getvalue()).decode("utf-8")
+# Prediction function with API key input
+def predict(api_key, image, user_prompt):
+    if not api_key:
+        return "❌ Please provide your Groq API key."
+    try:
+        client = Groq(api_key=api_key)
+        base64_image = encode_image_to_base64(image)
+        response = client.chat.completions.create(
+            model="meta-llama/llama-4-scout-17b-16e-instruct",
+            messages=[
+                {
+                    "role": "user",
+                    "content": [
+                        {"type": "text", "text": user_prompt},
+                        {"type": "image_url", "image_url": {"url": f"data:image/jpeg;base64,{base64_image}"}}
+                    ]
+                }
+            ],
+            max_tokens=1024,
+        )
+        return response.choices[0].message.content
+    except Exception as e:
+        return f"⚠️ Error: {str(e)}"
+# Gradio UI
+demo = gr.Interface(
+    fn=predict,
+    inputs=[
+        gr.Textbox(label="Groq API Key", placeholder="Enter your API key...", type="password"),
+        gr.Image(type="pil", label="Upload Image"),
+        gr.Textbox(label="Enter Prompt", lines=10, placeholder="Paste your prompt here...")
+    ],
+    outputs=gr.Markdown(label="Output"),
+    title="Custom Visual Prompt with Groq",
+    description="Upload an image, enter your Groq API key, and provide a prompt to analyze the image using LLaMA 4 Scout.",
+)
+demo.launch()