Spaces:

strickvl
/

redaction-detector

Runtime error

App Files Files Community

Alex Strick van Linschoten committed on May 5, 2022

Commit

513a0c5

•

1 Parent(s): 411008f

update tmp_dir

Browse files

Files changed (1) hide show

app.py +28 -7

app.py CHANGED Viewed

@@ -33,6 +33,7 @@ labels = learn.dls.vocab
 def predict(pdf, confidence, generate_file):
     document = fitz.open(pdf.name)
     results = []
     images = []
@@ -47,12 +48,18 @@ def predict(pdf, confidence, generate_file):
         if probs[0] > (confidence / 100):
             redaction_count = len(images)
             image_pixmap.save(
-                os.path.join(tmp_dir, pdf.name, f"page-{page_num}.png")
             )
             images.append(
                 [
                     f"Redacted page #{redaction_count + 1} on page {page_num}",
-                    os.path.join(tmp_dir, pdf.name, f"page-{page_num}.png"),
                 ]
             )
@@ -61,12 +68,18 @@ def predict(pdf, confidence, generate_file):
         for page in range(len(results))
         if results[page]["redacted"] > (confidence / 100)
     ]
-    report = os.path.join(tmp_dir, pdf.name, "redacted_pages.pdf")
     if generate_file:
         pdf = FPDF()
         pdf.set_auto_page_break(0)
         imagelist = sorted(
-            [i for i in os.listdir(tmp_dir, pdf.name) if i.endswith("png")]
         )
         for image in imagelist:
             # with PILImage.open(os.path.join(tmp_dir, image)) as img:
@@ -76,7 +89,9 @@ def predict(pdf, confidence, generate_file):
             #     else:
             #         pdf.add_page("P")
             # pdf.image(os.path.join(tmp_dir, image))
-            with PILImage.open(os.path.join(tmp_dir, pdf.name, image)) as img:
                 size = img.size
                 if size[0] > size[1]:
                     pdf.add_page("L")
@@ -95,9 +110,15 @@ def predict(pdf, confidence, generate_file):
                     label_color="#FF59D6",
                 )
                 pred_dict["img"].save(
-                    os.path.join(tmp_dir, pdf.name, f"pred-{image}")
                 )
-            pdf.image(os.path.join(tmp_dir, pdf.name, f"pred-{image}"))
         pdf.output(report, "F")
     text_output = f"A total of {len(redacted_pages)} pages were redacted. \n\n The redacted page numbers were: {', '.join(redacted_pages)}."

 def predict(pdf, confidence, generate_file):
+    filename_without_extension = pdf.name[:-4]
     document = fitz.open(pdf.name)
     results = []
     images = []
         if probs[0] > (confidence / 100):
             redaction_count = len(images)
             image_pixmap.save(
+                os.path.join(
+                    tmp_dir, filename_without_extension, f"page-{page_num}.png"
+                )
             )
             images.append(
                 [
                     f"Redacted page #{redaction_count + 1} on page {page_num}",
+                    os.path.join(
+                        tmp_dir,
+                        filename_without_extension,
+                        f"page-{page_num}.png",
+                    ),
                 ]
             )
         for page in range(len(results))
         if results[page]["redacted"] > (confidence / 100)
     ]
+    report = os.path.join(
+        tmp_dir, filename_without_extension, "redacted_pages.pdf"
+    )
     if generate_file:
         pdf = FPDF()
         pdf.set_auto_page_break(0)
         imagelist = sorted(
+            [
+                i
+                for i in os.listdir(tmp_dir, filename_without_extension)
+                if i.endswith("png")
+            ]
         )
         for image in imagelist:
             # with PILImage.open(os.path.join(tmp_dir, image)) as img:
             #     else:
             #         pdf.add_page("P")
             # pdf.image(os.path.join(tmp_dir, image))
+            with PILImage.open(
+                os.path.join(tmp_dir, filename_without_extension, image)
+            ) as img:
                 size = img.size
                 if size[0] > size[1]:
                     pdf.add_page("L")
                     label_color="#FF59D6",
                 )
                 pred_dict["img"].save(
+                    os.path.join(
+                        tmp_dir, filename_without_extension, f"pred-{image}"
+                    )
+                )
+            pdf.image(
+                os.path.join(
+                    tmp_dir, filename_without_extension, f"pred-{image}"
                 )
+            )
         pdf.output(report, "F")
     text_output = f"A total of {len(redacted_pages)} pages were redacted. \n\n The redacted page numbers were: {', '.join(redacted_pages)}."