# dq_hosted1 / app.py
import os
import gradio as gr
from typing import List
import logging
import logging.handlers
import traceback
from langchain_openai import ChatOpenAI
from langchain_core.tools import tool
from langchain_core.messages import HumanMessage, AIMessage, SystemMessage, ToolMessage
from langchain_tavily import TavilySearch
# Configuration - set to False to disable detailed logging
ENABLE_DETAILED_LOGGING = True
# Setup logging with rotation (7 days max)
if ENABLE_DETAILED_LOGGING:
# Create formatter
formatter = logging.Formatter('%(asctime)s - %(name)s - %(levelname)s - %(message)s')
# Setup console handler
console_handler = logging.StreamHandler()
console_handler.setFormatter(formatter)
# Setup rotating file handler (7 days, daily rotation)
file_handler = logging.handlers.TimedRotatingFileHandler(
'agent.log',
when='midnight',
interval=1,
backupCount=7, # Keep 7 days of logs
encoding='utf-8'
)
file_handler.setFormatter(formatter)
# Configure root logger
logging.basicConfig(
level=logging.INFO,
handlers=[console_handler, file_handler]
)
else:
logging.basicConfig(level=logging.WARNING)
logger = logging.getLogger(__name__)
# Configuration from environment variables
llm_ip = os.environ.get('public_ip')
llm_port = os.environ.get('port')
llm_key = os.environ.get('api_key')
llm_model = os.environ.get('model')
# Tavily API configuration
tavily_key = os.environ.get('tavily_key', '')
if ENABLE_DETAILED_LOGGING:
logger.info(f"Tavily API key present: {bool(tavily_key)}")
if tavily_key:
logger.info(f"Tavily API key length: {len(tavily_key)}")
else:
logger.warning("No Tavily API key found in environment variables")
# Tool calling agent implementation
class ToolCallingAgentChat:
    """Chat agent that drives an OpenAI-compatible LLM with native tool calling."""
def __init__(self, ip: str, port: str, api_key: str, model: str):
self.ip = ip
self.port = port
self.api_key = api_key
self.model = model
        self.llm = None
        self.llm_with_tools = None
        self.tools = []
self._setup_agent()
def _setup_agent(self):
"""Initialize the tool calling agent"""
try:
if ENABLE_DETAILED_LOGGING:
logger.info(f"=== SETTING UP TOOL CALLING AGENT ===")
logger.info(f"LLM URL: http://{self.ip}:{self.port}/v1")
logger.info(f"Model: {self.model}")
# Create OpenAI-compatible model
self.llm = ChatOpenAI(
base_url=f"http://{self.ip}:{self.port}/v1",
api_key=self.api_key,
model=self.model,
temperature=0.7
)
if ENABLE_DETAILED_LOGGING:
logger.info("LLM created successfully")
            # Define web search tool (only when a Tavily API key is configured)
            if tavily_key:
                if ENABLE_DETAILED_LOGGING:
                    logger.info("Setting up Tavily search tool")
                try:
                    # Create the Tavily client once at setup time rather than
                    # on every call; per-call failures are still handled below
                    tavily_tool = TavilySearch(
                        tavily_api_key=tavily_key,
                        max_results=5,
                        topic="general",
                        include_answer=True,
                        search_depth="advanced"
                    )

                    @tool
                    def web_search(query: str) -> str:
                        """Search the web for current information about any topic. Use this when you need up-to-date information, current events, or real-time data."""
                        try:
                            result = tavily_tool.invoke({"query": query})
                            if ENABLE_DETAILED_LOGGING:
                                logger.info(f"Tavily search successful for query: {query}")
                            # TavilySearch may return a dict; the tool contract is str
                            return str(result)
                        except Exception as e:
                            error_str = str(e).lower()
                            if ENABLE_DETAILED_LOGGING:
                                logger.error(f"Tavily search failed for query '{query}': {e}")
                                logger.error(f"Exception type: {type(e).__name__}")
                            # Check for rate limit or quota issues
                            if any(keyword in error_str for keyword in ['rate limit', 'quota', 'limit exceeded', 'usage limit', 'billing']):
                                if ENABLE_DETAILED_LOGGING:
                                    logger.warning(f"Tavily rate limit/quota exceeded: {e}")
                                return "I can't search the web right now due to rate limits."
                            if ENABLE_DETAILED_LOGGING:
                                logger.error(f"Tavily API error: {e}")
                            return f"I can't search the web right now. Error: {str(e)[:100]}"

                    self.tools = [web_search]
                    if ENABLE_DETAILED_LOGGING:
                        logger.info("Tavily search tool created successfully")
                except Exception as e:
                    if ENABLE_DETAILED_LOGGING:
                        logger.error(f"Failed to create Tavily tool: {e}")
                    self.tools = []
            else:
                if ENABLE_DETAILED_LOGGING:
                    logger.warning("No Tavily API key found, no web search tool available")
                self.tools = []
# Bind tools to the model
if self.tools:
self.llm_with_tools = self.llm.bind_tools(self.tools)
if ENABLE_DETAILED_LOGGING:
logger.info(f"Tools bound to model: {[tool.name for tool in self.tools]}")
else:
self.llm_with_tools = self.llm
if ENABLE_DETAILED_LOGGING:
logger.info("No tools available, using base model")
if ENABLE_DETAILED_LOGGING:
logger.info("Tool calling agent created successfully")
        except Exception as e:
            logger.error("=== AGENT SETUP ERROR ===")
            logger.error(f"Failed to setup agent: {e}")
            logger.error(f"Traceback: {traceback.format_exc()}")
            raise
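    # For reference: a tool-calling AIMessage from the bound model carries a
    # .tool_calls list of dicts shaped roughly like (illustrative values):
    #   [{"name": "web_search", "args": {"query": "..."}, "id": "call_abc123"}]
    # chat() below reads exactly the 'name', 'args', and 'id' keys.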
def update_config(self, ip: str, port: str, api_key: str, model: str):
"""Update LLM configuration"""
if (ip != self.ip or port != self.port or
api_key != self.api_key or model != self.model):
self.ip = ip
self.port = port
self.api_key = api_key
self.model = model
self._setup_agent()
    def chat(self, message: str, history: List[List[str]], system_prompt: str = "") -> str:
        """Generate a chat response, executing tool calls when the model requests them"""
        try:
            if not self.llm_with_tools:
                return "Error: Agent not initialized"
            if ENABLE_DETAILED_LOGGING:
                logger.info("=== USER INPUT ===")
                logger.info(f"Message: {message}")
                logger.info(f"History length: {len(history)}")
            # Convert history to messages for context
            messages = []
            if system_prompt:
                messages.append(SystemMessage(content=system_prompt))
            for user_msg, assistant_msg in history:
                messages.append(HumanMessage(content=user_msg))
                if assistant_msg:  # Only add if assistant responded
                    messages.append(AIMessage(content=assistant_msg))
            # Add current message
            messages.append(HumanMessage(content=message))
            # Get initial response from LLM
            if ENABLE_DETAILED_LOGGING:
                logger.info("=== INVOKING LLM ===")
                logger.info(f"Total messages in context: {len(messages)}")
            response = self.llm_with_tools.invoke(messages)
            if ENABLE_DETAILED_LOGGING:
                logger.info("=== LLM RESPONSE ===")
                logger.info(f"Response type: {type(response)}")
                logger.info(f"Has tool calls: {bool(getattr(response, 'tool_calls', None))}")
            # Check if the LLM wants to call tools
            if getattr(response, 'tool_calls', None):
                if ENABLE_DETAILED_LOGGING:
                    logger.info("=== TOOL CALLS DETECTED ===")
                    logger.info(f"Number of tool calls: {len(response.tool_calls)}")
                # Add the LLM response to messages
                messages.append(response)
                # Execute tool calls; look tools up by name, which also avoids
                # shadowing the imported @tool decorator with a loop variable
                tools_by_name = {t.name: t for t in self.tools}
                for tool_call in response.tool_calls:
                    if ENABLE_DETAILED_LOGGING:
                        logger.info(f"Executing tool: {tool_call['name']} with args: {tool_call['args']}")
                    matched_tool = tools_by_name.get(tool_call['name'])
                    if matched_tool is None:
                        tool_result = f"Tool {tool_call['name']} not found"
                    else:
                        try:
                            tool_result = matched_tool.invoke(tool_call['args'])
                            if ENABLE_DETAILED_LOGGING:
                                logger.info(f"Tool executed successfully: {tool_call['name']}")
                        except Exception as e:
                            tool_result = f"Tool execution failed: {str(e)}"
                            if ENABLE_DETAILED_LOGGING:
                                logger.error(f"Tool execution failed: {e}")
                    # Add tool result to messages
                    messages.append(ToolMessage(
                        content=str(tool_result),
                        tool_call_id=tool_call['id']
                    ))
                # Get final response from LLM after tool execution
                if ENABLE_DETAILED_LOGGING:
                    logger.info("=== GETTING FINAL RESPONSE ===")
                final_response = self.llm_with_tools.invoke(messages)
                final_message = final_response.content
else:
# No tool calls, use the direct response
final_message = response.content
            if ENABLE_DETAILED_LOGGING:
                logger.info("=== FINAL MESSAGE ===")
                logger.info(f"Final message: {final_message}")
return final_message
        except Exception as e:
            error_msg = f"Agent error: {str(e)}"
            logger.error("=== AGENT ERROR ===")
            logger.error(f"Error: {e}")
            logger.error(f"Error type: {type(e)}")
            logger.error(f"Traceback: {traceback.format_exc()}")
            return error_msg
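# Minimal direct-usage sketch (hypothetical values; in this Space the agent is
# driven through the Gradio interface below):
#   agent = ToolCallingAgentChat("127.0.0.1", "8000", "sk-local", "my-model")
#   print(agent.chat("What happened in the news today?", []))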
# Global agent instance
tool_calling_agent = ToolCallingAgentChat(llm_ip, llm_port, llm_key, llm_model)
def generate_response(message: str, history: List[List[str]], system_prompt: str,
                      max_tokens: int, ip: str, port: str, api_key: str, model: str):
    """Generate response using the tool calling agent"""
    global tool_calling_agent
    try:
        # Update agent configuration if changed
        tool_calling_agent.update_config(ip, port, api_key, model)
        # Generate response; max_tokens is accepted from the UI but is not
        # currently forwarded to the backend model
        response = tool_calling_agent.chat(message, history, system_prompt)
        # Stream the response word by word for better UX; splitting on single
        # spaces (instead of .split()) keeps newlines in the output intact
        current_response = ""
        for chunk in response.split(" "):
            current_response += chunk + " "
            yield current_response.rstrip(" ")
except Exception as e:
error_msg = f"Error: {str(e)}"
logger.error(error_msg)
yield error_msg
# Create Gradio ChatInterface
chatbot = gr.ChatInterface(
generate_response,
chatbot=gr.Chatbot(
avatar_images=[
None,
"https://cdn-avatars.huggingface.co/v1/production/uploads/64e6d37e02dee9bcb9d9fa18/o_HhUnXb_PgyYlqJ6gfEO.png"
],
height="64vh"
),
additional_inputs=[
gr.Textbox(
"You are a helpful AI assistant with web search capabilities. Use web search when you need current information, recent events, or real-time data.",
label="System Prompt",
lines=2
),
gr.Slider(50, 2048, label="Max Tokens", value=512,
info="Maximum number of tokens in the response"),
gr.Textbox(llm_ip, label="LLM IP Address",
info="IP address of the OpenAI-compatible LLM server"),
gr.Textbox(llm_port, label="LLM Port",
info="Port of the LLM server"),
gr.Textbox(llm_key, label="API Key", type="password",
info="API key for the LLM server"),
gr.Textbox(llm_model, label="Model Name",
info="Name of the model to use"),
],
title="🚀 Fast Tool Calling Agent with Tavily Search",
description="Chat with a fast tool calling agent that can search the web using Tavily. The agent automatically decides when to search based on your query - much faster than ReAct agents!",
theme="finlaymacklon/smooth_slate"
)
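# queue() enables request queuing so long tool-calling turns don't block the UI.
# To serve outside localhost, something like
#   chatbot.queue().launch(server_name="0.0.0.0", server_port=7860)
# may be needed (illustrative; the defaults are fine on Hugging Face Spaces).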
if __name__ == "__main__":
chatbot.queue().launch()