Spaces:

arithescientist
/

lincolnlegal

Sleeping

Ari committed on Sep 5

Commit

cffceba

•

1 Parent(s): eaae758

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -2,7 +2,13 @@ import gradio as gr
 from docx import Document  # For .docx handling
 from gtts import gTTS
 import os
-import pdfkit  # For converting text to PDF
 # Function to extract text from a .docx file and convert to PDF
 def docx_to_pdf(docx_file):
@@ -22,9 +28,9 @@ def docx_to_pdf(docx_file):
         </html>
         """
-        # Generate the PDF using pdfkit
         pdf_output_path = "document_output.pdf"
-        pdfkit.from_string(html_content, pdf_output_path)
         # Convert the text to audio using gTTS
         tts = gTTS(text=extracted_text, lang='en', slow=False)

 from docx import Document  # For .docx handling
 from gtts import gTTS
 import os
+import pdfkit
+# Path to the wkhtmltopdf executable (update this path based on the Dockerfile output)
+WKHTMLTOPDF_PATH = "/usr/local/bin/wkhtmltopdf"  # You will get this from the Dockerfile output
+# Configure pdfkit to use the correct wkhtmltopdf path
+config = pdfkit.configuration(wkhtmltopdf=WKHTMLTOPDF_PATH)
 # Function to extract text from a .docx file and convert to PDF
 def docx_to_pdf(docx_file):
         </html>
         """
+        # Generate the PDF using pdfkit with the custom wkhtmltopdf path
         pdf_output_path = "document_output.pdf"
+        pdfkit.from_string(html_content, pdf_output_path, configuration=config)
         # Convert the text to audio using gTTS
         tts = gTTS(text=extracted_text, lang='en', slow=False)