Spaces:

Hyma7
/

Commercial_court_chatbot

Running

Hyma7 committed 13 days ago

Commit

8d54bf2

•

1 Parent(s): 2fce450

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -3,6 +3,7 @@ from transformers import pipeline
 from PyPDF2 import PdfReader
 import easyocr
 from PIL import Image
 from difflib import SequenceMatcher
 # Initialize the T5-small pipeline for lightweight generative capabilities
@@ -18,9 +19,10 @@ def analyze_pdf(file):
 def analyze_image(file):
     """Extract text from an image file using EasyOCR."""
-    image = Image.open(file)
-    reader = easyocr.Reader(['en'], gpu=False)  # Use GPU=True if resources are available
-    result = reader.readtext(image, detail=0)   # Extract text without bounding box details
     return " ".join(result)  # Combine detected text into a single string
 def classify_and_respond(extracted_text):

 from PyPDF2 import PdfReader
 import easyocr
 from PIL import Image
+import numpy as np
 from difflib import SequenceMatcher
 # Initialize the T5-small pipeline for lightweight generative capabilities
 def analyze_image(file):
     """Extract text from an image file using EasyOCR."""
+    image = Image.open(file)  # Open the uploaded image
+    image_np = np.array(image)  # Convert the PIL image to a NumPy array
+    reader = easyocr.Reader(['en'], gpu=False)  # Initialize EasyOCR reader
+    result = reader.readtext(image_np, detail=0)  # Extract text without bounding box details
     return " ".join(result)  # Combine detected text into a single string
 def classify_and_respond(extracted_text):