Spaces:

Ronith55
/

OCR_deepseek-vl2

Running

Ronith55 committed on Feb 25

Commit

edb8721

verified ·

1 Parent(s): 2798fcf

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,8 +1,9 @@
 import torch
-from transformers import pipeline, AutoModel, AutoProcessor
 from PIL import Image
-# ✅ Use pipeline for image-text-to-text
 pipe = pipeline("image-text-to-text", model="deepseek-ai/deepseek-vl2-small", trust_remote_code=True)
 # ✅ Load model directly (alternative approach)
@@ -10,13 +11,20 @@ model = AutoModel.from_pretrained("deepseek-ai/deepseek-vl2-small", trust_remote
 # ✅ Function to process image and text
 def predict(image_path, text_prompt):
-    image = Image.open("C:\Users\70088531\Downloads\sample_img2.JPG").convert("RGB")
     messages = [{"role": "user", "content": text_prompt}]
     result = pipe(image, messages)
     return result
 # ✅ Example usage
 if __name__ == "__main__":
-    test_image = "test.jpg"  # Replace with an actual image file
     prompt = "Describe this image."
-    print("Generated Response:", predict(test_image, prompt))

 import torch
+import os
 from PIL import Image
+from transformers import pipeline, AutoModel
+# ✅ Load the model using pipeline
 pipe = pipeline("image-text-to-text", model="deepseek-ai/deepseek-vl2-small", trust_remote_code=True)
 # ✅ Load model directly (alternative approach)
 # ✅ Function to process image and text
 def predict(image_path, text_prompt):
+    # Ensure correct path format for Windows/Linux
+    image_path = image_path.replace("\\", "/")
+    image = Image.open(image_path).convert("RGB")
     messages = [{"role": "user", "content": text_prompt}]
     result = pipe(image, messages)
     return result
 # ✅ Example usage
 if __name__ == "__main__":
+    # Replace this with the correct image path
+    test_image = "sample_img2.JPG"  # Ensure this image exists in the same folder
     prompt = "Describe this image."
+    # Run prediction
+    output = predict(test_image, prompt)
+    print("Generated Response:", output)