Spaces:

vinuajeesh
/

mybot

Runtime error

vinuajeesh committed on Jun 7

Commit

84d2105

verified ·

1 Parent(s): 9169ab9

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,23 +1,43 @@
 import gradio as gr
-from llama_cpp import Llama
 from huggingface_hub import hf_hub_download
-# Download model from HF Hub to local cache
 model_path = hf_hub_download(
-    repo_id="unsloth/gemma-3-4b-it-GGUF",
-    filename="gemma-3-4b-it.Q4_K_M.gguf"   # or correct filename
 )
-# Load model
-llm = Llama(model_path=model_path, n_ctx=2048)
-# Chat function
 def chat(prompt):
-    output = llm(prompt, max_tokens=512)
-    return output['choices'][0]['text']
-# Gradio UI
-iface = gr.Interface(fn=chat, inputs="text", outputs="text")
 iface.launch()

 import gradio as gr
 from huggingface_hub import hf_hub_download
+from llama_cpp import Llama
+# Download the model from Hugging Face Hub (only first time, then cached)
+print("Downloading model...")
 model_path = hf_hub_download(
+    repo_id="TheBloke/gemma-7b-it-GGUF",
+    filename="gemma-7b-it.Q4_K_M.gguf"
 )
+print("Model downloaded to:", model_path)
+# Load the model with llama-cpp-python
+print("Loading model...")
+llm = Llama(
+    model_path=model_path,
+    n_ctx=2048  # You can adjust this as per your memory limits
+)
+print("Model loaded.")
+# Define a function to interact with the model
 def chat(prompt):
+    print(f"User input: {prompt}")
+    output = llm(
+        prompt,
+        max_tokens=512,
+        stop=["</s>", "User:", "Assistant:"]
+    )
+    reply = output['choices'][0]['text'].strip()
+    print(f"Model reply: {reply}")
+    return reply
+# Create a simple Gradio UI
+iface = gr.Interface(
+    fn=chat,
+    inputs="text",
+    outputs="text",
+    title="Gemma 7B IT Chatbot",
+    description="Running a GGUF model (Gemma 7B IT) on Hugging Face Space using llama-cpp-python"
+)
+# Launch the app
 iface.launch()