Spaces:

Docfile
/

Mycha

Runtime error

Youssouf Traore committed on Mar 5, 2023

Commit

6353308

1 Parent(s): 14b4a59

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,17 +1,19 @@
 import gradio as gr
 import pytesseract
-from PIL import Image
 import cv2
-def extract_text(image):
-    img_cv = cv2.imread(image)
-    # OpenCV stores images in BGR order by default, while pytesseract assumes RGB,
-    # so convert from BGR to RGB before running OCR:
-    img_rgb = cv2.cvtColor(img_cv, cv2.COLOR_BGR2RGB)
-    print(pytesseract.image_to_string(img_rgb))
-    # Alternative: wrap the raw BGR buffer in a PIL image and OCR it again (results are only printed). NOTE(review): shape[:2] is presumably (rows, cols) while PIL expects (width, height) — confirm.
-    img_rgb = Image.frombytes('RGB', img_cv.shape[:2], img_cv, 'raw', 'BGR', 0, 0)
-    print(pytesseract.image_to_string(img_rgb))
 # Define the Gradio user interface
 inputs = gr.inputs.Image()

 import gradio as gr
 import pytesseract
 import cv2
+from PIL import Image
+def extract_text(image):
+    # Convert the numpy.ndarray into a PIL Image object
+    image = Image.fromarray(image)
+    # Convert the image to grayscale (mode 'L') for better text extraction
+    image = image.convert('L')
+    # Use Pytesseract to extract the text from the image
+    text = pytesseract.image_to_string(image)
+    return text
 # Define the Gradio user interface
 inputs = gr.inputs.Image()