refine TGI params
Browse files
app_modules/llm_loader.py
CHANGED
|
@@ -191,11 +191,11 @@ class LLMLoader:
|
|
| 191 |
self.llm = HuggingFaceTextGenInference(
|
| 192 |
inference_server_url=HFTGI_SERVER_URL,
|
| 193 |
max_new_tokens=self.max_tokens_limit / 2,
|
| 194 |
-
top_k=
|
| 195 |
top_p=0.95,
|
| 196 |
-
typical_p=0.95,
|
| 197 |
temperature=0.01,
|
| 198 |
-
repetition_penalty=1.
|
| 199 |
callbacks=callbacks,
|
| 200 |
streaming=True,
|
| 201 |
)
|
|
|
|
| 191 |
self.llm = HuggingFaceTextGenInference(
|
| 192 |
inference_server_url=HFTGI_SERVER_URL,
|
| 193 |
max_new_tokens=self.max_tokens_limit / 2,
|
| 194 |
+
# top_k=0,
|
| 195 |
top_p=0.95,
|
| 196 |
+
# typical_p=0.95,
|
| 197 |
temperature=0.01,
|
| 198 |
+
repetition_penalty=1.115,
|
| 199 |
callbacks=callbacks,
|
| 200 |
streaming=True,
|
| 201 |
)
|