PaddleOCR2

Sleeping

App Files Community

deepak191z committed on Nov 3, 2024

Commit

669df7a

•

1 Parent(s): 3a21f1e

Update app.py

Browse files

Files changed (1) hide show

app.py +50 -32

app.py CHANGED Viewed

@@ -1,49 +1,67 @@
 import os
 os.system('pip install paddlepaddle==2.4.2')
-# os.system('pip install paddlepaddle==0.0.0 -f https://www.paddlepaddle.org.cn/whl/linux/cpu-mkl/develop.html')
 os.system('pip install paddleocr')
 from paddleocr import PaddleOCR, draw_ocr
 from PIL import Image
 import gradio as gr
 import torch
 torch.hub.download_url_to_file('https://i.imgur.com/aqMBT0i.jpg', 'example.jpg')
-def inference(img, lang):
-    ocr = PaddleOCR(use_angle_cls=True, lang=lang,use_gpu=False)
-    img_path = img
     result = ocr.ocr(img_path, cls=True)[0]
     boxes = [line[0] for line in result]
     txts = [line[1][0] for line in result]
     scores = [line[1][1] for line in result]
     image = Image.open(img_path).convert('RGB')
-    im_show = draw_ocr(image, boxes, txts=None, scores=None, # https://github.com/PaddlePaddle/PaddleOCR/blob/release/2.7/tools/infer/utility.py#L365
-                       font_path='simfang.ttf')
     im_show = Image.fromarray(im_show)
-    im_show.save('result.jpg')
-    return 'result.jpg', result, '\n'.join(txts)
-    # return 'result.jpg'
-title = 'PaddleOCR'
-description = 'Gradio demo for PaddleOCR. PaddleOCR demo supports Chinese, English, French, German, Korean and Japanese. To use it, simply upload your image and choose a language from the dropdown menu, or click one of the examples to load them. Read more at the links below.'
-article = "<p style='text-align: center'><a href='https://www.paddlepaddle.org.cn/hub/scene/ocr'>Awesome multilingual OCR toolkits based on PaddlePaddle （practical ultra lightweight OCR system, support 80+ languages recognition, provide data annotation and synthesis tools, support training and deployment among server, mobile, embedded and IoT devices）</a> | <a href='https://github.com/PaddlePaddle/PaddleOCR'>Github Repo</a></p>"
-examples = [['example.jpg','en']]
-css = ".output_image, .input_image {height: 40rem !important; width: 100% !important;}"
-app = gr.Interface(
-    inference,
-    [gr.Image(type='filepath', label='Input'),gr.Dropdown(choices=['ch', 'en', 'fr', 'german', 'korean', 'japan', 'ar'], type="value", value='ch', label='language')],
-    # gr.outputs.Image(type='file', label='Output'),
-    outputs=["image", "text", "text"],
-    title=title,
-    description=description,
-    article=article,
-    examples=examples,
-    css=css,
-    # enable_queue=True
-    )
-app.queue(max_size=10)
-app.launch(debug=True)

 import os
+import tempfile
+import shutil
+import logging
 os.system('pip install paddlepaddle==2.4.2')
 os.system('pip install paddleocr')
 from paddleocr import PaddleOCR, draw_ocr
 from PIL import Image
 import gradio as gr
 import torch
+from fastapi import FastAPI, File, UploadFile, Form
+from fastapi.responses import FileResponse
+import uvicorn
+# Configure logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+CUSTOM_PATH = "/ocr"
+app = FastAPI()
+@app.get("/")
+def read_main():
+    return {"message": "This is your main app"}
+io = gr.Interface(lambda x: "Hello, " + x + "!", "textbox", "textbox")
 torch.hub.download_url_to_file('https://i.imgur.com/aqMBT0i.jpg', 'example.jpg')
+@app.post("/ocr/")
+async def ocr_endpoint(img: UploadFile = File(...), lang: str = Form(...)):
+    logger.info("Processing OCR request")
+    # Save the uploaded image to a temporary file
+    with tempfile.NamedTemporaryFile(delete=False, suffix=".jpg") as temp_img:
+        shutil.copyfileobj(img.file, temp_img)
+        img_path = temp_img.name
+    # Perform OCR
+    ocr = PaddleOCR(use_angle_cls=True, lang=lang, use_gpu=False)
     result = ocr.ocr(img_path, cls=True)[0]
     boxes = [line[0] for line in result]
     txts = [line[1][0] for line in result]
     scores = [line[1][1] for line in result]
     image = Image.open(img_path).convert('RGB')
+    im_show = draw_ocr(image, boxes, txts=None, scores=None, font_path='simfang.ttf')
     im_show = Image.fromarray(im_show)
+    result_img_path = 'result.jpg'
+    im_show.save(result_img_path)
+    # Prepare the response
+    response_data = {
+        "result_image": result_img_path,
+        "ocr_result": result,
+        "extracted_text": '\n'.join(txts)
+    }
+    logger.info("OCR request processed successfully")
+    return response_data
+app = gr.mount_gradio_app(app, io, path=CUSTOM_PATH)
+uvicorn.run(app, host="0.0.0.0", port=7860)