Spaces:

Eliot0110
/

Travel_Assistant

Sleeping

App Files Files Community

Eliot0110 committed on Aug 5

Commit

3589840

1 Parent(s): c40cb3f

fix: missing definition of chat

Browse files

Files changed (1) hide show

modules/ai_model.py +31 -2

modules/ai_model.py CHANGED Viewed

@@ -140,7 +140,7 @@ class AIModel:
         else:  # text
             return input_type, None, raw_input
-    def run_inference(self, input_type: str, formatted_input: Union[str, Image.Image], prompt: str) -> str:
         try:
             if len(prompt) > 500:
@@ -176,7 +176,7 @@ class AIModel:
                     **inputs,
                     max_new_tokens=256,
                     do_sample=True,
-                    temperature=0.7,
                     top_p=0.9,
                     pad_token_id=self.processor.tokenizer.eos_token_id,
                     use_cache=True
@@ -198,6 +198,35 @@ class AIModel:
         except Exception as e:
             log.error(f"❌ 模型推理失败: {e}", exc_info=True)
             return "抱歉，处理您的请求时遇到技术问题。"
     def _build_limited_prompt(self, processed_text: str, context: str = "") -> str:
         """构建长度受限的prompt - 新增辅助方法"""

         else:  # text
             return input_type, None, raw_input
+    def run_inference(self, input_type: str, formatted_input: Union[str, Image.Image], prompt: str,temperature: float = 0.7) -> str:
         try:
             if len(prompt) > 500:
                     **inputs,
                     max_new_tokens=256,
                     do_sample=True,
+                    temperature=temperature,
                     top_p=0.9,
                     pad_token_id=self.processor.tokenizer.eos_token_id,
                     use_cache=True
         except Exception as e:
             log.error(f"❌ 模型推理失败: {e}", exc_info=True)
             return "抱歉，处理您的请求时遇到技术问题。"
+    def chat_completion(self, model: str, messages: list, **kwargs) -> str:
+        if not self.is_available():
+            log.error("模型未就绪，无法执行 chat_completion")
+            # 对于需要JSON输出的场景，返回一个表示错误的有效JSON字符串
+            if kwargs.get("response_format", {}).get("type") == "json_object":
+                return '{"error": "Model not available"}'
+            return "抱歉，AI 模型当前不可用。"
+        full_prompt = "\n".join([msg.get("content", "") for msg in messages])
+        temperature = kwargs.get("temperature", 0.7)
+        if kwargs.get("response_format", {}).get("type") == "json_object":
+            # 在 prompt 末尾添加指令，强制模型输出 JSON
+            full_prompt += "\n\n请注意：你的回答必须是一个严格的、不含任何额外解释和代码块标记的 JSON 对象。"
+            # 对于JSON生成任务，使用较低的 temperature 以获得更稳定、确定性的结构
+            temperature = 0.1
+        log.debug(f"▶️ 执行 chat_completion (适配器), temperature={temperature}, prompt='{full_prompt[:100]}...'")
+        return self.run_inference(
+            input_type="text",
+            formatted_input=None,
+            prompt=full_prompt,
+            temperature=temperature # 将处理后的 temperature 传递下去
+        )
     def _build_limited_prompt(self, processed_text: str, context: str = "") -> str:
         """构建长度受限的prompt - 新增辅助方法"""