Update app.py
Browse files
app.py
CHANGED
|
@@ -15,7 +15,7 @@ try:
|
|
| 15 |
print("Loading MiniCPM-V-2_6-gguf model...")
|
| 16 |
llm = Llama.from_pretrained(
|
| 17 |
repo_id="openbmb/MiniCPM-V-2_6-gguf",
|
| 18 |
-
filename="ggml-model-
|
| 19 |
n_ctx=4096,
|
| 20 |
n_threads=os.cpu_count(),
|
| 21 |
n_batch=512, # Increased batch size for prompt processing
|
|
|
|
| 15 |
print("Loading MiniCPM-V-2_6-gguf model...")
|
| 16 |
llm = Llama.from_pretrained(
|
| 17 |
repo_id="openbmb/MiniCPM-V-2_6-gguf",
|
| 18 |
+
filename="ggml-model-Q4_K_M.gguf",
|
| 19 |
n_ctx=4096,
|
| 20 |
n_threads=os.cpu_count(),
|
| 21 |
n_batch=512, # Increased batch size for prompt processing
|