victormiller committed on
Commit
4516bfc
1 Parent(s): 189eeae

Update curated.py

Browse files
Files changed (1) hide show
  1. curated.py +1 -1
curated.py CHANGED
@@ -680,7 +680,7 @@ filtering_process = Div(
680
  P(B("Download and Extraction: "), "Original PDF files download from", A("https://philarchive.org/oai.pl", href="https://philarchive.org/oai.pl"), ". All available PDF's were downloaded. Each PDF was converted to text using java", D_code("-jar ../philpapers_resources/src/pdfbox-app-2.0.21.jar ExtractText {f0} {FOUT.name}", language="java"), ". After converting to text formatting, a language was detected and added using the langdetect (citation needed) library."),
681
  H4("Filtering"),
682
  Ul(
683
- Li(P(B("Hyphenation Removal"), D_code("end-of", language="python"), " becomes ", D_code("end of", language="python"))),
684
  Li(P(B("Newline Filtering"), "")),
685
  Li(P(B("Header/Footer Filtering"), "")),
686
  Li(P(B("Double Whitespace Filtering"), "")),
 
680
  P(B("Download and Extraction: "), "Original PDF files download from", A("https://philarchive.org/oai.pl", href="https://philarchive.org/oai.pl"), ". All available PDF's were downloaded. Each PDF was converted to text using java", D_code("-jar ../philpapers_resources/src/pdfbox-app-2.0.21.jar ExtractText {f0} {FOUT.name}", language="java"), ". After converting to text formatting, a language was detected and added using the langdetect (citation needed) library."),
681
  H4("Filtering"),
682
  Ul(
683
+ Li(P(B("Hyphenation Removal:"), D_code("end-of", style="inline", language="python"), " becomes ", D_code("end of", language="python"))),
684
  Li(P(B("Newline Filtering"), "")),
685
  Li(P(B("Header/Footer Filtering"), "")),
686
  Li(P(B("Double Whitespace Filtering"), "")),