First commit
Files changed:
- app.py +34 -0
- requirements.txt +4 -0
- worker.py +93 -0
app.py ADDED
@@ -0,0 +1,34 @@
+import gradio as gr
+import worker
+import requests
+from pathlib import Path
+import torchvision
+torchvision.disable_beta_transforms_warning()
+
+# Download the CAMELS documentation PDF and save it locally
+url = 'https://camels.readthedocs.io/_/downloads/en/latest/pdf/'
+r = requests.get(url, stream=True)
+document_path = Path('metadata.pdf')
+document_path.write_bytes(r.content)
+
+worker.process_document(document_path)
+
+def handle_prompt(message, history):
+    bot_response = worker.process_prompt(message)
+    return bot_response
+
+greetingsmessage = "Hi, I'm the CAMELS DocBot. I'm here to assist you with any question related to the CAMELS simulations documentation."
+example_questions = [
+    "How can I read a halo file?",
+    "Which simulation suites are included in CAMELS?",
+    "Which are the largest volumes in CAMELS simulations?",
+    "How can I get the power spectrum of a simulation?"
+]
+# chatbot = gr.Chatbot(value=[{"role": "assistant", "content": greetingsmessage}])
+# chatbot = gr.Chatbot(value=[[None, greetingsmessage]])
+# chatbot = gr.Chatbot(value=gr.ChatMessage(role="assistant", content="How can I help you?"))
+# chatbot = gr.Chatbot(placeholder=greetingsmessage)
+
+demo = gr.ChatInterface(handle_prompt, type="messages", title="CAMELS DocBot", examples=example_questions, theme=gr.themes.Soft(), description=greetingsmessage)  # , chatbot=chatbot)
+
+demo.launch()
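The four commented-out chatbot lines above are attempts to show the greeting before the first user message. A minimal sketch of the placeholder route, assuming a recent Gradio release in which gr.Chatbot accepts a placeholder argument and gr.ChatInterface accepts a pre-built chatbot (not tested against this Space):

    # Sketch: show the greeting as a placeholder until the first message arrives
    chatbot = gr.Chatbot(placeholder=greetingsmessage, type="messages")
    demo = gr.ChatInterface(handle_prompt, type="messages", chatbot=chatbot,
                            title="CAMELS DocBot", examples=example_questions,
                            theme=gr.themes.Soft())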
requirements.txt ADDED
@@ -0,0 +1,4 @@
+langchain
+langchain-community
+langchain-huggingface
+chromadb
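Note that app.py and worker.py also import gradio, requests, torch, and torchvision, and their loaders pull in pypdf (for PyPDFLoader) and the sentence-transformers / InstructorEmbedding packages (for HuggingFaceInstructEmbeddings). If the Space image does not already provide those packages, a fuller requirements list might look like the sketch below; the extra package names come from the imports, not from this commit:

    gradio
    requests
    torch
    torchvision
    pypdf
    sentence-transformers
    InstructorEmbedding
    langchain
    langchain-community
    langchain-huggingface
    chromadb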
worker.py ADDED
@@ -0,0 +1,93 @@
+import os
+import torch
+from langchain.chains import RetrievalQA
+from langchain_community.embeddings import HuggingFaceInstructEmbeddings
+from langchain_community.document_loaders import PyPDFLoader
+from langchain.text_splitter import RecursiveCharacterTextSplitter
+from langchain_community.vectorstores import Chroma
+from langchain_huggingface import HuggingFaceEndpoint
+
+# Check for GPU availability and set the appropriate device for computation.
+DEVICE = "cuda:0" if torch.cuda.is_available() else "cpu"
+
+# Global variables
+conversation_retrieval_chain = None
+chat_history = []
+llm_hub = None
+embeddings = None
+
+# Initialize the language model and the embeddings model
+def init_llm():
+    global llm_hub, embeddings
+    # Set up the environment variable for Hugging Face and initialize the desired model.
+    # tokenfile = open("api_token.txt")
+    # api_token = tokenfile.readline().replace("\n", "")
+    # tokenfile.close()
+    # os.environ["HUGGINGFACEHUB_API_TOKEN"] = api_token
+
+    # Repo name for the model
+    # model_id = "tiiuae/falcon-7b-instruct"
+    model_id = "microsoft/Phi-3.5-mini-instruct"
+    # model_id = "meta-llama/Llama-3.2-1B-Instruct"
+
+    # Load the model through the Hugging Face Inference API
+    llm_hub = HuggingFaceEndpoint(repo_id=model_id, temperature=0.1, max_new_tokens=600, model_kwargs={"max_length": 600})
+    llm_hub.client.api_url = 'https://api-inference.huggingface.co/models/' + model_id
+    # llm_hub.invoke('foo bar')
+
+    # Initialize embeddings using a pre-trained model to represent the text data.
+    embeddings_model = "sentence-transformers/multi-qa-distilbert-cos-v1"
+    # embeddings_model = "sentence-transformers/all-MiniLM-L6-v2"
+    embeddings = HuggingFaceInstructEmbeddings(
+        model_name=embeddings_model,
+        model_kwargs={"device": DEVICE}
+    )
+
+
+# Process a PDF document and build the retrieval chain
+def process_document(document_path):
+    global conversation_retrieval_chain
+
+    # Load the document
+    loader = PyPDFLoader(document_path)
+    documents = loader.load()
+
+    # Split the document into chunks
+    text_splitter = RecursiveCharacterTextSplitter(chunk_size=1024, chunk_overlap=64)
+    texts = text_splitter.split_documents(documents)
+
+    # Create an embeddings database using Chroma from the split text chunks.
+    db = Chroma.from_documents(texts, embedding=embeddings)
+
+
+    # Build the QA chain, which uses the LLM and the retriever to answer questions.
+    # By default, the vector-store retriever uses similarity search.
+    # If the underlying vector store supports maximum marginal relevance search, you can specify that as the search type (search_type="mmr").
+    # You can also pass search kwargs such as k, which sets how many retrieved chunks are sent to the LLM.
+    conversation_retrieval_chain = RetrievalQA.from_chain_type(
+        llm=llm_hub,
+        chain_type="stuff",
+        retriever=db.as_retriever(search_type="mmr", search_kwargs={'k': 6, 'lambda_mult': 0.25}),
+        return_source_documents=False,
+        input_key="question"
+        # chain_type_kwargs={"prompt": prompt}  # uncomment this if you are using a prompt template
+    )
+
+
+# Process a user prompt
+def process_prompt(prompt):
+    global conversation_retrieval_chain
+    global chat_history
+
+    # Query the model
+    output = conversation_retrieval_chain.invoke({"question": prompt, "chat_history": chat_history})
+    answer = output["result"]
+
+    # Update the chat history
+    chat_history.append((prompt, answer))
+
+    # Return the model's response
+    return answer
+
+# Initialize the language model
+init_llm()
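The commented-out block in init_llm reads the Hugging Face token from a local api_token.txt file. On a Space the usual route is a repository secret, which is exposed to the app as an environment variable at runtime, so no token file needs to be committed. A minimal sketch under that assumption; the secret name HUGGINGFACEHUB_API_TOKEN and the explicit huggingfacehub_api_token argument are not taken from this commit:

    # Sketch: pass a token from a Space secret instead of reading api_token.txt
    import os
    from langchain_huggingface import HuggingFaceEndpoint

    model_id = "microsoft/Phi-3.5-mini-instruct"
    llm_hub = HuggingFaceEndpoint(
        repo_id=model_id,
        temperature=0.1,
        max_new_tokens=600,
        huggingfacehub_api_token=os.environ.get("HUGGINGFACEHUB_API_TOKEN"),
    )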