Spaces:
Build error
Build error
Update app.py
Browse files
app.py
CHANGED
|
@@ -4,8 +4,16 @@ from huggingface_hub import InferenceClient
|
|
| 4 |
"""
|
| 5 |
For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
|
| 6 |
"""
|
| 7 |
-
client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
|
|
|
|
| 8 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 9 |
|
| 10 |
def respond(
|
| 11 |
message,
|
|
|
|
| 4 |
"""
|
| 5 |
For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
|
| 6 |
"""
|
| 7 |
+
# client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
|
| 8 |
+
# !pip install llama-cpp-python
|
| 9 |
|
| 10 |
+
from llama_cpp import Llama
|
| 11 |
+
|
| 12 |
+
|
| 13 |
+
client = Llama.from_pretrained(
|
| 14 |
+
repo_id="unsloth/DeepSeek-R1-0528-Qwen3-8B-GGUF",
|
| 15 |
+
filename="DeepSeek-R1-0528-Qwen3-8B-Q4_K_M.gguf",
|
| 16 |
+
)
|
| 17 |
|
| 18 |
def respond(
|
| 19 |
message,
|