shawno committed on
Commit
c1c816a
·
verified ·
1 Parent(s): 9212838

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -0
app.py CHANGED
@@ -23,6 +23,7 @@ try:
23
  filename="ggml-model-Q4_K_M.gguf",
24
  n_ctx=4096,
25
  n_threads=os.cpu_count(),
 
26
  verbose=False, # Set to True for more debug output
27
  # `chat_format` can sometimes be inferred from model, but explicitly setting for safety:
28
  # MiniCPM-V-2_6-gguf uses a specific chat template.
 
23
  filename="ggml-model-Q4_K_M.gguf",
24
  n_ctx=4096,
25
  n_threads=os.cpu_count(),
26
+ n_batch=512,
27
  verbose=False, # Set to True for more debug output
28
  # `chat_format` can sometimes be inferred from model, but explicitly setting for safety:
29
  # MiniCPM-V-2_6-gguf uses a specific chat template.