Spaces:
Running
Running
| from typing import List | |
| import pypdf | |
def read_pdf(filepath: str) -> List[str]:
    """Extract the text of every page in a PDF file.

    Args:
        filepath: Path of the PDF file to open.

    Returns:
        One entry per page, in page order, each being the result of
        calling ``extract_text()`` on that page.
    """
    # The reader is given the open binary stream, so extraction happens
    # inside the ``with`` block while the file is still open.
    with open(filepath, 'rb') as pdf_file:
        reader = pypdf.PdfReader(pdf_file)
        return [page.extract_text() for page in reader.pages]
if __name__ == '__main__':
    # Ad-hoc run: extract the page texts of a sample document and print them.
    page_texts = read_pdf('data/109-411-2-PB.pdf')
    print(page_texts)