Update app.py
Browse files
app.py
CHANGED
|
@@ -23,6 +23,7 @@ try:
|
|
| 23 |
filename="ggml-model-Q4_K_M.gguf",
|
| 24 |
n_ctx=4096,
|
| 25 |
n_threads=os.cpu_count(),
|
|
|
|
| 26 |
verbose=False, # Set to True for more debug output
|
| 27 |
# `chat_format` can sometimes be inferred from model, but explicitly setting for safety:
|
| 28 |
# MiniCPM-V-2_6-gguf uses a specific chat template.
|
|
|
|
| 23 |
filename="ggml-model-Q4_K_M.gguf",
|
| 24 |
n_ctx=4096,
|
| 25 |
n_threads=os.cpu_count(),
|
| 26 |
+
n_batch=512,
|
| 27 |
verbose=False, # Set to True for more debug output
|
| 28 |
# `chat_format` can sometimes be inferred from model, but explicitly setting for safety:
|
| 29 |
# MiniCPM-V-2_6-gguf uses a specific chat template.
|