Spaces:

Xorbits
/

xinference

Runtime error

aresnow committed on Jul 13, 2023

Commit

da866b5

1 Parent(s): a9bd2fc

modify max tokens

Files changed (1) hide show

app.py CHANGED Viewed

@@ -131,7 +131,7 @@ class GradioApp:
             max_token = gr.Slider(
                 128,
                 1024,
-                value=256,
                 step=1,
                 label=self._locale("Max tokens"),
                 info=self._locale("The maximum number of tokens to generate."),
@@ -462,7 +462,7 @@ async def launch_xinference():
         address=supervisor_address, supervisor_address=supervisor_address
     )
     api = AsyncSupervisorAPI(supervisor_address)
-    supported_models = ["orca", "chatglm2", "chatglm", "vicuna-v1.3"]
     for model in supported_models:
         await api.launch_model(str(uuid.uuid4()), model)

             max_token = gr.Slider(
                 128,
                 1024,
+                value=128,
                 step=1,
                 label=self._locale("Max tokens"),
                 info=self._locale("The maximum number of tokens to generate."),
         address=supervisor_address, supervisor_address=supervisor_address
     )
     api = AsyncSupervisorAPI(supervisor_address)
+    supported_models = ["chatglm2", "chatglm", "vicuna-v1.3", "orca"]
     for model in supported_models:
         await api.launch_model(str(uuid.uuid4()), model)