Spaces:

techasad
/

document_chatbot

Sleeping

App Files Community

techasad committed on Mar 1, 2024

Commit

2b48034

verified ·

1 Parent(s): b89b0a0

Update app.py

Browse files

Files changed (1) hide show

app.py +85 -42

app.py CHANGED Viewed

@@ -3,7 +3,7 @@ from PyPDF2 import PdfReader
 import langchain
 from textwrap import dedent
 import pandas as pd
 from langchain_community.callbacks import StreamlitCallbackHandler
 from langchain_openai import ChatOpenAI
 from langchain_community.chat_models import ChatGooglePalm
@@ -30,15 +30,57 @@ from langchain.prompts import (
 #api_key2 = st.secrets["OPENAI_API_KEY"]
-os.environ["GOOGLE_API_KEY"] = "AIzaSyD29fEos3V6S2L-AGSQgNu03GqZEIgJads"
-st.set_page_config(page_title='Personal Chatbot', page_icon='books')
-st.header('Knowledge Query Assistant')
-st.write("Upload your file to begin a chat, or ask any general questions you have")
-st.sidebar.title('Options')
 st.sidebar.subheader("Please Choose the AI Engine")
 use_google = st.sidebar.checkbox("Use Free AI", value =True)
 use_openai = st.sidebar.checkbox("Use OpenAI with your API Key")
@@ -163,7 +205,6 @@ st.sidebar.markdown("[Website](https://tenlancer.com/)")
 ########--Save PDF--########
 def text_to_audio(response, lang):
     audio_buffer = BytesIO()
     audio_file = gTTS(text=response, lang=lang, slow=False)
@@ -173,7 +214,7 @@ def text_to_audio(response, lang):
 def main():
-    try:
         if (use_openai and openai_api_key) or use_google:
             if uploaded_file:
                 db = processing_csv_pdf_docx(uploaded_file)
@@ -181,17 +222,20 @@ def main():
                     st.success(f'Your File: {file.name} is Embedded', icon="✅")
             for msg in st.session_state.messages:
-                st.chat_message(msg["role"]).write(msg["content"])
-                #if msg["role"] == "Assistant":
-                 #   st.chat_message(msg["role"]).audio(msg["audio_content"], format='audio/wav')
                     #st.audio(audio_msg, format='audio/mp3').audio(audio_msg)
             if prompt := st.chat_input(placeholder="Type your question!"):
                 st.session_state.messages.append({"role": "user", "content": prompt})
-                st.chat_message("user").write(prompt)
-                memory = ConversationBufferMemory(memory_key="chat_history", input_key="question", human_prefix= "", ai_prefix= "")
                 user_message = {"role": "user", "content": prompt}
@@ -200,15 +244,15 @@ def main():
                         user_prompt = st.session_state.messages[i]
                         ai_res = st.session_state.messages[i + 1]
-                        current_role = user_prompt["role"]
                         current_content = user_prompt["content"]
-                        next_role = ai_res["role"]
                         next_content = ai_res["content"]
                         # Concatenate role and content for context and output
-                        user = f"{current_role}: {current_content}"
-                        ai = f"{next_role}: {next_content}"
                         memory.save_context({"question": user}, {"output": ai})
@@ -224,12 +268,15 @@ def main():
                 compliment = ['thank you', 'thanks', 'thanks a lot', 'thanks a bunch', 'great', 'ok', 'ok thanks', 'okay', 'great', 'awesome', 'nice']
                 prompt_template =dedent(r"""
-                You are an informative chatbot designed to assist users with queries specifically related to context.
-                Your purpose is to provide accurate information sourced from a document, ensuring relevance and reliability in your responses.
-                Respond with humility and avoid speculative or hypothetical answers. Use the provided context to formulate concise responses, staying within 100 words, and refrain from adding unnecessary information.
-                Ensure that your answers are directly related to the user's query and do not deviate from the provided context.
-                this is the context from study material:
                 ---------
                 {context}
                 ---------
@@ -260,7 +307,7 @@ def main():
                 #chain = load_qa_chain(ChatOpenAI(temperature=0.9, model="gpt-3.5-turbo-0613", streaming=True) , verbose= True, prompt = PROMPT, memory=memory,chain_type="stuff")
-                with st.chat_message("Assistant"):
                     st_cb = StreamlitCallbackHandler(st.container())
                     if prompt.lower() in greetings:
                         response = 'Hi, how are you? I am here to help you get information from your file. How can I assist you?'
@@ -272,8 +319,7 @@ def main():
                         audio_buffer = text_to_audio(response, lang)
                         #st.audio(audio_buffer, format='audio/mp3')
-                        st.session_state.messages.append({"role": "Assistant", "content": response})
-                        #st.session_state.messages.append({"role": "Assistant", "content": response, "audio_content": audio_buffer})
                     elif prompt.lower() in compliment:
                         response = 'My pleasure! If you have any more questions, feel free to ask.'
@@ -285,12 +331,11 @@ def main():
                         audio_buffer = text_to_audio(response, lang)
                         #st.audio(audio_buffer, format='audio/mp3')
-                        st.session_state.messages.append({"role": "Assistant", "content": response})
-                        #st.session_state.messages.append({"role": "Assistant", "content": response, "audio_content": audio_buffer})
                     elif uploaded_file:
                         with st.spinner('Bot is typing ...'):
-                            docs = db.similarity_search(prompt, k=10, fetch_k=30)
                             response = chain.run(input_documents=docs, question=prompt)
@@ -301,8 +346,8 @@ def main():
                             audio_buffer = text_to_audio(response, lang)
                            # st.audio(audio_buffer, format='audio/mp3')
                             #st.session_state.audio.append({"role": "Assistant", "audio": audio_buffer})
-                            #st.session_state.messages.append({"role": "Assistant", "content": response, "audio_content": audio_buffer})
-                            st.session_state.messages.append({"role": "Assistant", "content": response})
                             assistant_message = {"role": "assistant", "content": response}
                     else:
                         with st.spinner('Bot is typing ...'):
@@ -315,27 +360,25 @@ def main():
-                            #audio_buffer = text_to_audio(response, lang)
                             #st.audio(audio_buffer, format='audio/mp3')
                             #st.session_state.audio.append({"role": "Assistant", "audio": audio_buffer})
-                            #st.session_state.messages.append({"role": "Assistant", "content": response, "audio_content": audio_buffer})
-                            st.session_state.messages.append({"role": "Assistant", "content": response})
                             assistant_message = {"role": "assistant", "content": response}
                     st.write(response)
-                    #st.audio(audio_buffer, format='audio/wav')
-    except Exception as e:
-        "Sorry, there was a problem. A corrupted file or;"
-        if use_google:
-            "Google PaLM AI only take English Data and Questions. Or the AI could not find the answer in your provided document."
-        elif use_openai:
-            "Please check your OpenAI API key"
 hide_streamlit_style = """

 import langchain
 from textwrap import dedent
 import pandas as pd
+from langchain_google_genai import ChatGoogleGenerativeAI
 from langchain_community.callbacks import StreamlitCallbackHandler
 from langchain_openai import ChatOpenAI
 from langchain_community.chat_models import ChatGooglePalm
+st.set_page_config(page_title='Personal Chatbot', page_icon='books')
+st.markdown(
+    """
+    <style>
+        [data-testid=stImage]{
+            text-align: center;
+            display: block;
+            margin-left: 10%;
+            margin-right:10%;
+            width: 100%;
+    }
+    img {
+        border-radius: 50%;
+        align: center;
+    }
+    </style>
+    """, unsafe_allow_html=True
+)
+st.image("tenlancer.png", width=80)
+st.markdown("<h3 style='text-align: center; color: white;'> Knowledge Query Assistant </h3>", unsafe_allow_html=True)
+st.markdown(
+    """
+    <style>
+    [data-testid="stChatMessageContent"] p{
+        font-size: 1.2rem;
+        color: #404040
+    }
+    </style>
+    """, unsafe_allow_html=True
+)
+google_api_key = st.secrets["GOOGLE_API_KEY"]
 #api_key2 = st.secrets["OPENAI_API_KEY"]
+os.environ["GOOGLE_API_KEY"] = google_api_key
+st.sidebar.header("options")
 st.sidebar.subheader("Please Choose the AI Engine")
 use_google = st.sidebar.checkbox("Use Free AI", value =True)
 use_openai = st.sidebar.checkbox("Use OpenAI with your API Key")
 ########--Save PDF--########
 def text_to_audio(response, lang):
     audio_buffer = BytesIO()
     audio_file = gTTS(text=response, lang=lang, slow=False)
 def main():
+   # try:
         if (use_openai and openai_api_key) or use_google:
             if uploaded_file:
                 db = processing_csv_pdf_docx(uploaded_file)
                     st.success(f'Your File: {file.name} is Embedded', icon="✅")
             for msg in st.session_state.messages:
+                if msg["role"] == "user":
+                    st.chat_message("user", avatar="user.png").write(msg["content"])
+                if msg["role"] == "Assistant":
+                    st.chat_message("Assistant", avatar="logo.png").write(msg["content"])
+                    st.audio(msg["audio_content"], format='audio/wav')
                     #st.audio(audio_msg, format='audio/mp3').audio(audio_msg)
             if prompt := st.chat_input(placeholder="Type your question!"):
                 st.session_state.messages.append({"role": "user", "content": prompt})
+                st.chat_message("user", avatar="user.png").write(prompt)
+                memory = ConversationBufferMemory(memory_key="chat_history", input_key="question", human_prefix= "User", ai_prefix= "Assistant")
                 user_message = {"role": "user", "content": prompt}
                         user_prompt = st.session_state.messages[i]
                         ai_res = st.session_state.messages[i + 1]
                         current_content = user_prompt["content"]
                         next_content = ai_res["content"]
                         # Concatenate role and content for context and output
+                        user = f" {current_content}"
+                        ai = f" {next_content}"
                         memory.save_context({"question": user}, {"output": ai})
                 compliment = ['thank you', 'thanks', 'thanks a lot', 'thanks a bunch', 'great', 'ok', 'ok thanks', 'okay', 'great', 'awesome', 'nice']
                 prompt_template =dedent(r"""
+                You are a helpful assistant.
+                talk humbly. Answer the question from the provided context. Do not answer from your own training data.
+                Use the following pieces of context to answer the question at the end.
+                If you don't know the answer, just say that you don't know. Do not makeup any answer.
+                Do not answer hypothetically. Do not answer in more than 100 words.
+                Please Do Not say: "Based on the provided context"
+                this is the context:
                 ---------
                 {context}
                 ---------
                 #chain = load_qa_chain(ChatOpenAI(temperature=0.9, model="gpt-3.5-turbo-0613", streaming=True) , verbose= True, prompt = PROMPT, memory=memory,chain_type="stuff")
+                with st.chat_message("Assistant",  avatar="logo.png"):
                     st_cb = StreamlitCallbackHandler(st.container())
                     if prompt.lower() in greetings:
                         response = 'Hi, how are you? I am here to help you get information from your file. How can I assist you?'
                         audio_buffer = text_to_audio(response, lang)
                         #st.audio(audio_buffer, format='audio/mp3')
+                        st.session_state.messages.append({"role": "Assistant", "content": response, "audio_content": audio_buffer})
                     elif prompt.lower() in compliment:
                         response = 'My pleasure! If you have any more questions, feel free to ask.'
                         audio_buffer = text_to_audio(response, lang)
                         #st.audio(audio_buffer, format='audio/mp3')
+                        st.session_state.messages.append({"role": "Assistant", "content": response, "audio_content": audio_buffer})
                     elif uploaded_file:
                         with st.spinner('Bot is typing ...'):
+                            docs = db.similarity_search(prompt, k=5, fetch_k=10)
                             response = chain.run(input_documents=docs, question=prompt)
                             audio_buffer = text_to_audio(response, lang)
                            # st.audio(audio_buffer, format='audio/mp3')
                             #st.session_state.audio.append({"role": "Assistant", "audio": audio_buffer})
+                            st.session_state.messages.append({"role": "Assistant", "content": response, "audio_content": audio_buffer})
                             assistant_message = {"role": "assistant", "content": response}
                     else:
                         with st.spinner('Bot is typing ...'):
+                            audio_buffer = text_to_audio(response, lang)
                             #st.audio(audio_buffer, format='audio/mp3')
                             #st.session_state.audio.append({"role": "Assistant", "audio": audio_buffer})
+                            st.session_state.messages.append({"role": "Assistant", "content": response, "audio_content": audio_buffer})
                             assistant_message = {"role": "assistant", "content": response}
                     st.write(response)
+                st.audio(audio_buffer, format='audio/wav')
+    #except Exception as e:
+     #   "Sorry, there was a problem. A corrupted file or;"
+      #  if use_google:
+       #     "Google PaLM AI only take English Data and Questions. Or the AI could not find the answer in your provided document."
+        #elif use_openai:
+         #   "Please check your OpenAI API key"
 hide_streamlit_style = """