File size: 816 Bytes
641ff3e
 
44647fa
641ff3e
 
 
 
 
16dc1f9
641ff3e
619a281
efd2dce
44647fa
504104c
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
pdfminer.six==20231228
pdf2image==1.17.0
opencv-python==4.9.0.80
presidio_analyzer==2.2.351
presidio_anonymizer==2.2.351
presidio-image-redactor==0.0.52
pikepdf==8.15.1
pandas==2.2.2
spacy # Version not pinned, as the latest spaCy releases conflict with the latest gradio releases
en_core_web_lg @ https://github.com/explosion/spacy-models/releases/download/en_core_web_lg-3.7.1/en_core_web_lg-3.7.1.tar.gz
gradio # Version not pinned, as the latest gradio releases conflict with the latest spaCy releases
boto3==1.34.103
# The following packages are not currently required by the app; they may be added in future for improved PDF parsing
#unstructured
#unstructured_inference # This is a large package! Only necessary if you want to use the high-res strategy in pdf_partition
#unstructured_pytesseract
#pillow-heif
#python-docx
#python-pptx