Spaces:
Sleeping
Sleeping
Omar ID EL MOUMEN
committed on
Commit
·
48f6066
1
Parent(s):
848b14f
Little fix
Browse files
app.py
CHANGED
|
@@ -118,7 +118,7 @@ async def extract_pdf(pdf: PDF):
|
|
| 118 |
pdf_req = requests.get(pdf.url)
|
| 119 |
if pdf_req.status_code == 200:
|
| 120 |
pdf_data = BytesIO(pdf_req.content)
|
| 121 |
-
doc = fitz.open(stream=pdf_data, filetype="pdf")[:pdf.page_num]
|
| 122 |
pdf_text = " ".join([page.get_text("text") for page in doc])
|
| 123 |
pdf_metadata = doc.metadata
|
| 124 |
print(pdf_metadata)
|
|
|
|
| 118 |
pdf_req = requests.get(pdf.url)
|
| 119 |
if pdf_req.status_code == 200:
|
| 120 |
pdf_data = BytesIO(pdf_req.content)
|
| 121 |
+
doc = fitz.open(stream=pdf_data, filetype="pdf") if pdf.page_num == -1 else fitz.open(stream=pdf_data, filetype="pdf")[:pdf.page_num]
|
| 122 |
pdf_text = " ".join([page.get_text("text") for page in doc])
|
| 123 |
pdf_metadata = doc.metadata
|
| 124 |
print(pdf_metadata)
|