Spaces: Running on Zero

Commit f6e2d8a by jedick
Parent: 7320bf1

Download data during app startup

Files changed:
- app.py +24 -150
- data.py +59 -0
- retriever.py +5 -2
app.py CHANGED

@@ -1,37 +1,42 @@
-import gradio as gr
-from main import GetChatModel, openai_model, model_id
-from graph import BuildGraph
-from retriever import db_dir
-from util import get_sources, get_start_end_months
-from mods.tool_calling_llm import extract_think
-from huggingface_hub import snapshot_download
 from langgraph.checkpoint.memory import MemorySaver
+from huggingface_hub import snapshot_download
 from dotenv import load_dotenv
-import requests
-import zipfile
-import shutil
+import gradio as gr
 import spaces
 import torch
-
-import boto3
 import uuid
 import ast
 import os
 import re
 
+# Local modules
+from main import GetChatModel, openai_model, model_id
+from util import get_sources, get_start_end_months
+from retriever import db_dir, embedding_model_id
+from mods.tool_calling_llm import extract_think
+from data import download_data, extract_data
+from graph import BuildGraph
+
 # Setup environment variables
 load_dotenv(dotenv_path=".env", override=True)
 
 # Download model snapshots from Hugging Face Hub
-print(f"Downloading/loading checkpoints for {model_id}...")
+print(f"Downloading checkpoints for {model_id}...")
 ckpt_dir = snapshot_download(model_id, local_dir_use_symlinks=False)
 print(f"Using checkpoints from {ckpt_dir}")
-
-embedding_model_id = "nomic-ai/nomic-embed-text-v1.5"
-print(f"Downloading/loading checkpoints for {embedding_model_id}...")
+print(f"Downloading checkpoints for {embedding_model_id}...")
 embedding_ckpt_dir = snapshot_download(embedding_model_id, local_dir_use_symlinks=False)
 print(f"Using embedding checkpoints from {embedding_ckpt_dir}")
 
+# Download and extract data if data directory is not present
+if not os.path.isdir(db_dir):
+    print("Downloading data ... ", end = "")
+    download_data()
+    print("done!")
+    print("Extracting data ... ", end = "")
+    extract_data()
+    print("done!")
+
 # Global setting for search type
 search_type = "hybrid"
@@ -39,7 +44,6 @@ search_type = "hybrid"
 # https://www.gradio.app/guides/state-in-blocks
 graph_instances = {"local": {}, "remote": {}}
 
-
 def cleanup_graph(request: gr.Request):
     if request.session_hash in graph_instances["local"]:
         del graph_instances["local"][request.session_hash]
@@ -91,7 +95,7 @@ def run_workflow(input, history, compute_mode, thread_id, session_hash):
     if compute_mode == "local":
         gr.Info(
             f"Please wait for the local model to load",
-            duration=
+            duration=8,
             title=f"Model loading...",
         )
     # Get the chat model and build the graph
@@ -399,7 +403,7 @@ with gr.Blocks(
     🧠 Thinking is enabled for the answer<br>
       🔍 Add **/think** to enable thinking for the query</br>
       🚫 Add **/no_think** to disable all thinking</br>
-    ✨ [
+    ✨ [{embedding_model_id.split("/")[-1]}](https://huggingface.co/{embedding_model_id}) and [{model_id.split("/")[-1]}](https://huggingface.co/{model_id})<br>
     🏠 See the project's [GitHub repository](https://github.com/jedick/R-help-chat)
     """
     return status_text
@@ -459,7 +463,7 @@
             intro = gr.Markdown(get_intro_text())
         with gr.Column(scale=1):
             compute_mode.render()
-            with gr.Group(
+            with gr.Group() as chat_interface:
                 chatbot.render()
                 input.render()
             # Render textboxes for data loading progress
@@ -626,136 +630,6 @@ with gr.Blocks(
         api_name=False,
     )
 
-    # ------------
-    # Data loading
-    # ------------
-
-    def download():
-        """Download the application data"""
-
-        def download_file_from_bucket(bucket_name, s3_key, output_file):
-            """Download file from S3 bucket"""
-
-            # https://thecodinginterface.com/blog/aws-s3-python-boto3
-            session = boto3.session.Session(
-                aws_access_key_id=os.getenv("AWS_ACCESS_KEY_ID"),
-                aws_secret_access_key=os.getenv("AWS_ACCESS_KEY_SECRET"),
-                region_name="us-east-1",
-            )
-            s3_resource = session.resource("s3")
-            bucket = s3_resource.Bucket(bucket_name)
-            bucket.download_file(Key=s3_key, Filename=output_file)
-
-        def download_dropbox_file(shared_url, output_file):
-            """Download file from Dropbox"""
-
-            # Modify the shared URL to enable direct download
-            direct_url = shared_url.replace(
-                "www.dropbox.com", "dl.dropboxusercontent.com"
-            ).replace("?dl=0", "")
-
-            # Send a GET request to the direct URL
-            response = requests.get(direct_url, stream=True)
-
-            if response.status_code == 200:
-                # Write the content to a local file
-                with open(output_file, "wb") as file:
-                    for chunk in response.iter_content(chunk_size=8192):
-                        file.write(chunk)
-                print(f"File downloaded successfully as '{output_file}'")
-            else:
-                print(
-                    f"Failed to download file. HTTP Status Code: {response.status_code}"
-                )
-
-        if not os.path.isdir(db_dir) and not os.path.exists("db.zip"):
-            # For S3 (need AWS_ACCESS_KEY_ID and AWS_ACCESS_KEY_SECRET)
-            download_file_from_bucket("r-help-chat", "db.zip", "db.zip")
-            ## For Dropbox (shared file - key is in URL)
-            # shared_link = "https://www.dropbox.com/scl/fi/jx90g5lorpgkkyyzeurtc/db.zip?rlkey=wvqa3p9hdy4rmod1r8yf2am09&st=l9tsam56&dl=0"
-            # output_filename = "db.zip"
-            # download_dropbox_file(shared_link, output_filename)
-
-    def extract():
-        """Extract the db.zip file"""
-
-        if not os.path.isdir(db_dir):
-
-            file_path = "db.zip"
-            extract_to_path = "./"
-            try:
-                with zipfile.ZipFile(file_path, "r") as zip_ref:
-                    zip_ref.extractall(extract_to_path)
-            except:
-                # If there were any errors, remove zip file and db directory
-                # to initiate a new download when app is reloaded
-
-                try:
-                    os.remove(file_path)
-                    print(f"{file_path} has been deleted.")
-                except FileNotFoundError:
-                    print(f"{file_path} does not exist.")
-                except PermissionError:
-                    print(f"Permission denied to delete {file_path}.")
-                except Exception as e:
-                    print(f"An error occurred: {e}")
-
-                directory_path = "./db"
-
-                try:
-                    # Forcefully and recursively delete a directory, like rm -rf
-                    shutil.rmtree(directory_path)
-                    print(f"Successfully deleted: {directory_path}")
-                except FileNotFoundError:
-                    print(f"Directory not found: {directory_path}")
-                except PermissionError:
-                    print(f"Permission denied: {directory_path}")
-                except Exception as e:
-                    print(f"An error occurred: {e}")
-
-    def visible_if_data_present():
-        """Make component visible if the database directory is present"""
-        visible = os.path.isdir(db_dir)
-        return change_visibility(visible)
-
-    def visible_if_data_missing():
-        """Make component visible if the database directory is missing"""
-        visible = not os.path.isdir(db_dir)
-        return change_visibility(visible)
-
-    false = gr.State(False)
-    true = gr.State(True)
-
-    # When app is launched: show "Loading Data" textbox, download and extract
-    # data if necessary, make chat interface visible or show error textbox, and
-    # update database info
-
-    # fmt: off
-    demo.load(
-        change_visibility, [true], [loading_data], api_name=False
-    ).then(
-        visible_if_data_missing, None, [downloading], api_name=False
-    ).then(
-        download, None, [downloading], api_name=False
-    ).then(
-        change_visibility, [false], [downloading], api_name=False
-    ).then(
-        visible_if_data_missing, None, [extracting], api_name=False
-    ).then(
-        extract, None, [extracting], api_name=False
-    ).then(
-        change_visibility, [false], [extracting], api_name=False
-    ).then(
-        change_visibility, [false], [loading_data], api_name=False
-    ).then(
-        visible_if_data_present, None, [chat_interface], api_name=False
-    ).then(
-        visible_if_data_missing, None, [missing_data], api_name=False
-    ).then(
-        get_info_text, None, [info], api_name=False
-    )
-    # fmt: on
-
 # Clean up graph instances when page is closed/refreshed
 demo.unload(cleanup_graph)
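With this commit, the demo.load() event chain that previously drove data loading is gone: the database is fetched once at import time, before the Gradio UI is built. As a usage sketch (not part of the commit; it assumes the AWS credentials that data.py reads from the environment are set), the new startup path can be exercised outside the app like this:

    import os

    from data import download_data, extract_data
    from retriever import db_dir

    # Mirror the startup logic added to app.py: fetch and unpack db.zip
    # only when the database directory is absent
    if not os.path.isdir(db_dir):
        download_data()  # downloads db.zip from the S3 bucket
        extract_data()   # unzips db.zip into ./db
    print(f"Database directory present: {os.path.isdir(db_dir)}")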
data.py ADDED

@@ -0,0 +1,59 @@
+import requests
+import zipfile
+import shutil
+import boto3
+import os
+
+def download_file_from_bucket(bucket_name, s3_key, output_file):
+    """Download file from S3 bucket"""
+
+    # https://thecodinginterface.com/blog/aws-s3-python-boto3
+    session = boto3.session.Session(
+        aws_access_key_id=os.getenv("AWS_ACCESS_KEY_ID"),
+        aws_secret_access_key=os.getenv("AWS_ACCESS_KEY_SECRET"),
+        region_name="us-east-1",
+    )
+    s3_resource = session.resource("s3")
+    bucket = s3_resource.Bucket(bucket_name)
+    bucket.download_file(Key=s3_key, Filename=output_file)
+
+def download_dropbox_file(shared_url, output_file):
+    """Download file from Dropbox"""
+
+    # Modify the shared URL to enable direct download
+    direct_url = shared_url.replace(
+        "www.dropbox.com", "dl.dropboxusercontent.com"
+    ).replace("?dl=0", "")
+
+    # Send a GET request to the direct URL
+    response = requests.get(direct_url, stream=True)
+
+    if response.status_code == 200:
+        # Write the content to a local file
+        with open(output_file, "wb") as file:
+            for chunk in response.iter_content(chunk_size=8192):
+                file.write(chunk)
+        print(f"File downloaded successfully as '{output_file}'")
+    else:
+        print(
+            f"Failed to download file. HTTP Status Code: {response.status_code}"
+        )
+
+def download_data():
+    """Download the email database"""
+
+    if not os.path.exists("db.zip"):
+        # For S3 (need AWS_ACCESS_KEY_ID and AWS_ACCESS_KEY_SECRET)
+        download_file_from_bucket("r-help-chat", "db.zip", "db.zip")
+        ## For Dropbox (shared file - key is in URL)
+        # shared_link = "https://www.dropbox.com/scl/fi/jx90g5lorpgkkyyzeurtc/db.zip?rlkey=wvqa3p9hdy4rmod1r8yf2am09&st=l9tsam56&dl=0"
+        # output_filename = "db.zip"
+        # download_dropbox_file(shared_link, output_filename)
+
+def extract_data():
+    """Extract the db.zip file"""
+
+    file_path = "db.zip"
+    extract_to_path = "./"
+    with zipfile.ZipFile(file_path, "r") as zip_ref:
+        zip_ref.extractall(extract_to_path)
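Note that extract_data() now lets zipfile errors propagate, whereas the removed app.py code deleted db.zip and the db directory on failure so that a reloaded app would re-download. A hypothetical wrapper (an illustration only; the function name and parameters are made up) that restores that cleanup behavior:

    import os
    import shutil
    import zipfile

    from data import extract_data

    def extract_data_with_cleanup(zip_path="db.zip", db_dir="db"):
        """Extract db.zip; on failure remove the zip and db directory
        so the next app startup triggers a fresh download."""
        try:
            extract_data()
        except (zipfile.BadZipFile, OSError) as err:
            print(f"Extraction failed: {err}")
            if os.path.exists(zip_path):
                os.remove(zip_path)
            shutil.rmtree(db_dir, ignore_errors=True)  # like rm -rf
            raise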
retriever.py CHANGED

@@ -29,6 +29,9 @@ from mods.file_system import LocalFileStore
 # Database directory
 db_dir = "db"
 
+# Embedding model
+embedding_model_id = "nomic-ai/nomic-embed-text-v1.5"
+
 
 def BuildRetriever(
     compute_mode,

@@ -145,13 +148,13 @@ def BuildRetrieverDense(compute_mode: str, top_k=6, embedding_ckpt_dir=None):
     if compute_mode == "local":
         # embedding_function = HuggingFaceEmbeddings(model_name="BAAI/bge-large-en-v1.5", show_progress=True)
         # https://python.langchain.com/api_reference/community/embeddings/langchain_community.embeddings.huggingface.HuggingFaceBgeEmbeddings.html
-        model_name = "nomic-ai/nomic-embed-text-v1.5"
-        id_or_dir = embedding_ckpt_dir if embedding_ckpt_dir else model_name
         model_kwargs = {
             "device": "cuda",
             "trust_remote_code": True,
         }
         encode_kwargs = {"normalize_embeddings": True}
+        # Use embedding model ID or checkpoint directory if given
+        id_or_dir = embedding_ckpt_dir if embedding_ckpt_dir else embedding_model_id
         embedding_function = HuggingFaceBgeEmbeddings(
             model_name=id_or_dir,
             model_kwargs=model_kwargs,
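Defining embedding_model_id once in retriever.py lets app.py (for snapshot_download) and BuildRetrieverDense (for loading) point at the same model. A minimal sketch of that pattern, assuming HuggingFaceBgeEmbeddings comes from langchain_community as imported in retriever.py and a CUDA device is available:

    from huggingface_hub import snapshot_download
    from langchain_community.embeddings import HuggingFaceBgeEmbeddings

    from retriever import embedding_model_id

    # Download the checkpoint first (as app.py does); passing
    # embedding_model_id directly would also load from the Hub
    ckpt_dir = snapshot_download(embedding_model_id)
    embeddings = HuggingFaceBgeEmbeddings(
        model_name=ckpt_dir,
        model_kwargs={"device": "cuda", "trust_remote_code": True},
        encode_kwargs={"normalize_embeddings": True},
    )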