Spaces:

GAS17
/

extract

Sleeping

GAS17 committed on Dec 21, 2024

Commit

6e5a027

verified ·

1 Parent(s): 0b83885

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -18,14 +18,24 @@ def perform_ocr(file):
     # Verificar si el archivo es un PDF
     if file.name.lower().endswith('.pdf'):
         # Convertir PDF a imágenes
-        images = convert_from_bytes(file.read())
         text = ""
         for image in images:
             text += pytesseract.image_to_string(image) + "\n\n"
     else:
         # Procesar como imagen
-        image = Image.open(file)
-        text = pytesseract.image_to_string(image)
     return text

     # Verificar si el archivo es un PDF
     if file.name.lower().endswith('.pdf'):
         # Convertir PDF a imágenes
+        try:
+            images = convert_from_bytes(file.read() if hasattr(file, 'read') else file)
+        except Exception as e:
+            return f"Error al procesar el PDF: {str(e)}"
         text = ""
         for image in images:
             text += pytesseract.image_to_string(image) + "\n\n"
     else:
         # Procesar como imagen
+        try:
+            if hasattr(file, 'read'):
+                image = Image.open(io.BytesIO(file.read()))
+            else:
+                image = Image.open(file)
+            text = pytesseract.image_to_string(image)
+        except Exception as e:
+            return f"Error al procesar la imagen: {str(e)}"
     return text