Spaces:
Sleeping
Sleeping
Commit
·
5a2a128
1
Parent(s):
2ec33d1
adding online PDF loader
Browse files
app.py
CHANGED
|
@@ -55,7 +55,6 @@ def document_loader(file_data,api_key,doc_type='pdf',llm='Huggingface'):
|
|
| 55 |
document = process_csv_document(document_file_name=file_data)
|
| 56 |
elif doc_type == 'word':
|
| 57 |
document = process_word_document(document_file_name=file_data)
|
| 58 |
-
print(document)
|
| 59 |
if document:
|
| 60 |
texts = process_documents(documents=document)
|
| 61 |
vector_db = FAISS.from_documents(documents=texts, embedding= embedding_model)
|
|
@@ -90,10 +89,9 @@ def process_word_document(document_file_name):
|
|
| 90 |
return document
|
| 91 |
|
| 92 |
|
| 93 |
-
def process_pdf_document(
|
| 94 |
-
print("Document File Name :",
|
| 95 |
-
|
| 96 |
-
loader = OnlinePDFLoader(os.stat(str(document_file_name)))
|
| 97 |
document = loader.load()[0]
|
| 98 |
return document
|
| 99 |
|
|
|
|
| 55 |
document = process_csv_document(document_file_name=file_data)
|
| 56 |
elif doc_type == 'word':
|
| 57 |
document = process_word_document(document_file_name=file_data)
|
|
|
|
| 58 |
if document:
|
| 59 |
texts = process_documents(documents=document)
|
| 60 |
vector_db = FAISS.from_documents(documents=texts, embedding= embedding_model)
|
|
|
|
| 89 |
return document
|
| 90 |
|
| 91 |
|
| 92 |
+
def process_pdf_document(document_file):
|
| 93 |
+
print("Document File Name :",document_file.name)
|
| 94 |
+
loader = OnlinePDFLoader(document_file.name)
|
|
|
|
| 95 |
document = loader.load()[0]
|
| 96 |
return document
|
| 97 |
|