Spaces:

CallMeDaniel
/

TaiwanOCR_CertificateofDiagnosis

Running

TaiwanOCR_CertificateofDiagnosis / app.py

Danieldu

update dict

d1182db 11 months ago

1.92 kB

	import os, io
	from paddleocr import PaddleOCR, draw_ocr
	from PIL import Image, ImageDraw
	import gradio as gr


	# Set the Hugging Face Hub access token for this process.
	# NOTE(review): the value is a hard-coded literal and replaces any HF_TOKEN
	# already present in the environment -- confirm this is intended.
	os.environ.update(HF_TOKEN="TWOCR")

	def inference(img_path):
	    """Run OCR on an image file and return the annotated image and its text.

	    Args:
	        img_path: Path of the image file to recognise.

	    Returns:
	        A ``(image, text)`` tuple. ``image`` is the output of ``draw_ocr``
	        (boxes and recognised text rendered on the picture), or the plain
	        RGB image when nothing was detected. ``text`` is the recognised
	        lines joined with newlines, or ``""`` when nothing was detected.
	    """
	    # NOTE(review): the model is rebuilt on every call; caching the instance
	    # would be faster but needs confirmation that sharing it is safe.
	    ocr = PaddleOCR(
	        rec_char_dict_path='zhtw_common_dict.txt',
	        use_gpu=False,
	        rec_image_shape="3, 48, 320",
	    )

	    result = ocr.ocr(img_path)

	    # A page entry may be None when no text is found, so every iteration
	    # below falls back to an empty list instead of raising TypeError.
	    for page in result or []:
	        for line in page or []:
	            print(line)

	    detections = (result[0] if result else None) or []

	    # Close the file handle promptly; convert() returns an independent copy.
	    with Image.open(img_path) as source_image:
	        image = source_image.convert('RGB')

	    if not detections:
	        return image, ""

	    boxes = [line[0] for line in detections]
	    # Keep txts and scores aligned with boxes even when a detection has no
	    # recognition result: empty text and a zero score.
	    txts = [line[1][0] if line[1] else '' for line in detections]
	    scores = [line[1][1] if line[1] else 0.0 for line in detections]
	    im_show_pil = draw_ocr(image, boxes, txts, scores, font_path="./simfang.ttf")

	    return im_show_pil, "\n".join(txts)

	# HTML heading for the page; passed to gr.Interface as `title`.
	title = "<p style='text-align: center'><a href='https://www.twman.org/AI/CV' target='_blank'>繁體中文醫療診斷書和收據OCR：PaddleOCR</a></p>"

	# HTML block of centred reference links; passed to gr.Interface as `description`.
	description = """
	<p style='text-align: center'><a href="https://blog.twman.org/2023/07/wsl.html" target='_blank'>用PaddleOCR的PPOCRLabel來微調醫療診斷書和收據</a></p><br>
	<p style='text-align: center'><a href="https://github.com/Deep-Learning-101" target='_blank'>https://github.com/Deep-Learning-101</a></p><br>
	<p style='text-align: center'><a href="https://github.com/Deep-Learning-101/Computer-Vision-Paper" target='_blank'>https://github.com/Deep-Learning-101/Computer-Vision-Paper</a></p><br>
	"""


	# Custom CSS passed to gr.Interface: fixes the height and width for the
	# .output_image and .input_image selectors.
	css = ".output_image, .input_image {height: 40rem !important; width: 100% !important;}"

	# Input: one uploaded image, handed to `inference` as a file path.
	upload_input = gr.Image(type='filepath', label='圖片上傳')
	# Outputs: the annotated image followed by the recognised text.
	annotated_output = gr.Image(type="pil", label="識別結果")

	demo = gr.Interface(
	    fn=inference,
	    inputs=[upload_input],
	    outputs=[annotated_output, "text"],
	    title=title,
	    description=description,
	    css=css,
	)

	# Start the web app with Gradio's debug mode enabled.
	demo.launch(debug=True)