from typing import List

import pypdf


def read_pdf(filepath: str) -> List[str]:
    """Extract the text of every page of a PDF file.

    Args:
        filepath: Path of the PDF file to read.

    Returns:
        A list with one entry per page, in page order, holding whatever
        ``page.extract_text()`` produced for that page.

    Raises:
        OSError: If ``filepath`` cannot be opened for reading.
    """
    with open(filepath, 'rb') as f:
        pdf_reader = pypdf.PdfReader(f)
        # Extract inside the ``with`` block so the underlying file handle
        # is still open while the reader walks the pages.
        return [page.extract_text() for page in pdf_reader.pages]


if __name__ == '__main__':
    # Ad-hoc manual check: dump the per-page text of a sample document.
    r = read_pdf('data/109-411-2-PB.pdf')
    print(r)