peter2000 committed on
Commit
d08905f
1 Parent(s): acafedc

Update scripts/clean.py

Browse files
Files changed (1) hide show
  1. scripts/clean.py +1 -1
scripts/clean.py CHANGED
@@ -84,7 +84,7 @@ def preprocessing(document):
84
  clean_header_footer=True,
85
  split_by="sentence",
86
  split_length=3,
87
- split_respect_sentence_boundary=True,
88
  split_overlap=1
89
  )
90
  for i in document:
 
84
  clean_header_footer=True,
85
  split_by="sentence",
86
  split_length=3,
87
+ split_respect_sentence_boundary=False,
88
  split_overlap=1
89
  )
90
  for i in document: