Update veryfinal.py

veryfinal.py (+227 -343) CHANGED
@@ -1,26 +1,30 @@
 import os, time, random
 from dotenv import load_dotenv
 from typing import List, Dict, Any, TypedDict, Annotated
 import operator

-# Load environment variables
-load_dotenv()
-
 # LangGraph imports
-from langgraph.graph import StateGraph, END
-from langgraph.prebuilt import create_react_agent
 from langgraph.checkpoint.memory import MemorySaver

 # LangChain imports
-from langchain_core.messages import SystemMessage, HumanMessage, AIMessage
 from langchain_core.tools import tool
 from langchain_groq import ChatGroq
 from langchain_google_genai import ChatGoogleGenerativeAI
 from langchain_nvidia_ai_endpoints import ChatNVIDIA
-from langchain_core.rate_limiters import InMemoryRateLimiter

-
-from tavily import TavilyClient

 # Advanced Rate Limiter (SILENT)
 class AdvancedRateLimiter:
@@ -41,385 +45,265 @@ class AdvancedRateLimiter:
         # Record this request
         self.request_times.append(current_time)

-# Initialize rate limiters
 groq_limiter = AdvancedRateLimiter(requests_per_minute=30)
 gemini_limiter = AdvancedRateLimiter(requests_per_minute=2)
-nvidia_limiter = AdvancedRateLimiter(requests_per_minute=5)
-tavily_limiter = AdvancedRateLimiter(requests_per_minute=50)
-
-# Initialize LangChain rate limiters for NVIDIA
-nvidia_rate_limiter = InMemoryRateLimiter(
-    requests_per_second=0.083,  # 5 requests per minute
-    check_every_n_seconds=0.1,
-    max_bucket_size=5
-)
-
-# Initialize LLMs with best free models
-groq_llm = ChatGroq(
-    model="llama-3.3-70b-versatile",
-    api_key=os.getenv("GROQ_API_KEY"),
-    temperature=0
-)
-
-gemini_llm = ChatGoogleGenerativeAI(
-    model="gemini-2.0-flash-thinking-exp",
-    api_key=os.getenv("GOOGLE_API_KEY"),
-    temperature=0
-)
-
-# Best NVIDIA models based on search results
-nvidia_general_llm = ChatNVIDIA(
-    model="meta/llama3-70b-instruct",  # Best general model from NVIDIA
-    api_key=os.getenv("NVIDIA_API_KEY"),
-    temperature=0,
-    max_tokens=4000,
-    rate_limiter=nvidia_rate_limiter
-)
-
-nvidia_code_llm = ChatNVIDIA(
-    model="meta/codellama-70b",  # Best code generation model from NVIDIA
-    api_key=os.getenv("NVIDIA_API_KEY"),
-    temperature=0,
-    max_tokens=4000,
-    rate_limiter=nvidia_rate_limiter
-)
-
-nvidia_math_llm = ChatNVIDIA(
-    model="mistralai/mixtral-8x22b-instruct-v0.1",  # Best reasoning model from NVIDIA
-    api_key=os.getenv("NVIDIA_API_KEY"),
-    temperature=0,
-    max_tokens=4000,
-    rate_limiter=nvidia_rate_limiter
-)
-
-# Initialize Tavily client
-tavily_client = TavilyClient(api_key=os.getenv("TAVILY_API_KEY"))
-
-# Define State
-class AgentState(TypedDict):
-    messages: Annotated[List[HumanMessage | AIMessage], operator.add]
-    query: str
-    agent_type: str
-    final_answer: str

 # Custom Tools
 @tool
-def multiply(a: int, b: int) -> int:
-    """Multiply two numbers"""
     return a * b

 @tool
-def add(a: int, b: int) -> int:
-    """Add two numbers"""
     return a + b

 @tool
-def subtract(a: int, b: int) -> int:
-    """Subtract two numbers"""
     return a - b

 @tool
-def divide(a: int, b: int) -> float:
-    """Divide two numbers"""
     if b == 0:
         raise ValueError("Cannot divide by zero.")
     return a / b

 @tool
-def tavily_search_tool(query: str) -> str:
-    """Search the web using Tavily"""
-    try:
-        tavily_limiter.wait_if_needed()
-        response = tavily_client.search(
-            query=query,
-            include_answer=False
-        )
-
-        # Format results
-        results = []
-        for result in response.get('results', []):
-            results.append(f"Title: {result.get('title', '')}\nContent: {result.get('content', '')}")
-
-        return "\n\n---\n\n".join(results)
-
-    except Exception as e:
-        return f"Tavily search failed: {str(e)}"

 @tool
-def wiki_search_tool(query: str) -> str:
-    """Search Wikipedia for information"""
     try:
         time.sleep(random.uniform(1, 3))
     except Exception as e:
         return f"Wikipedia search failed: {str(e)}"

-
-math_tools = [multiply, add, subtract, divide]
-research_tools = [tavily_search_tool, wiki_search_tool]
-coordinator_tools = [tavily_search_tool, wiki_search_tool]
-
-# Node functions
-def router_node(state: AgentState) -> AgentState:
-    """Route queries to appropriate agent type"""
-    query = state["query"].lower()
-
-    if any(word in query for word in ['calculate', 'math', 'multiply', 'add', 'subtract', 'divide', 'compute']):
-        agent_type = "math"
-    elif any(word in query for word in ['code', 'program', 'python', 'javascript', 'function', 'algorithm']):
-        agent_type = "code"
-    elif any(word in query for word in ['search', 'find', 'research', 'what is', 'who is', 'when', 'where']):
-        agent_type = "research"
-    else:
-        agent_type = "coordinator"
-
-    return {**state, "agent_type": agent_type}
-
-def math_agent_node(state: AgentState) -> AgentState:
-    """Mathematical specialist agent using NVIDIA Mixtral"""
-    nvidia_limiter.wait_if_needed()
-
-    system_message = SystemMessage(content="""You are a mathematical specialist with access to calculation tools.
-    Use the appropriate math tools for calculations.
-    Show your work step by step.
-    Always provide precise numerical answers.
-    Finish with: FINAL ANSWER: [numerical result]""")
-
-    # Create math agent with NVIDIA's best reasoning model
-    math_agent = create_react_agent(nvidia_math_llm, math_tools)
-
-    # Process query
-    messages = [system_message, HumanMessage(content=state["query"])]
-    config = {"configurable": {"thread_id": "math_thread"}}
|
| 199 |
|
|
|
|
|
|
|
| 200 |
try:
|
| 201 |
-
|
| 202 |
-
|
| 203 |
-
|
| 204 |
-
|
| 205 |
-
|
| 206 |
-
|
| 207 |
-
|
| 208 |
-
|
| 209 |
except Exception as e:
|
| 210 |
-
|
| 211 |
-
return {
|
| 212 |
-
**state,
|
| 213 |
-
"messages": state["messages"] + [AIMessage(content=error_msg)],
|
| 214 |
-
"final_answer": error_msg
|
| 215 |
-
}
|
| 216 |
|
| 217 |
-
|
| 218 |
-
|
| 219 |
-
|
| 220 |
-
|
| 221 |
-
system_message = SystemMessage(content="""You are an expert coding AI specialist.
|
| 222 |
-
Generate clean, efficient, and well-documented code.
|
| 223 |
-
Explain your code solutions clearly.
|
| 224 |
-
Always provide working code examples.
|
| 225 |
-
Finish with: FINAL ANSWER: [your code solution]""")
|
| 226 |
-
|
| 227 |
-
# Create code agent with NVIDIA's best code model
|
| 228 |
-
code_agent = create_react_agent(nvidia_code_llm, [])
|
| 229 |
-
|
| 230 |
-
# Process query
|
| 231 |
-
messages = [system_message, HumanMessage(content=state["query"])]
|
| 232 |
-
config = {"configurable": {"thread_id": "code_thread"}}
|
| 233 |
|
|
|
|
|
|
|
| 234 |
try:
|
| 235 |
-
|
| 236 |
-
|
| 237 |
-
|
| 238 |
-
|
| 239 |
-
|
| 240 |
-
|
| 241 |
-
|
| 242 |
-
|
| 243 |
except Exception as e:
|
| 244 |
-
|
| 245 |
-
return {
|
| 246 |
-
**state,
|
| 247 |
-
"messages": state["messages"] + [AIMessage(content=error_msg)],
|
| 248 |
-
"final_answer": error_msg
|
| 249 |
-
}
|

-def research_agent_node(state: AgentState) -> AgentState:
-    """Research specialist agent using Gemini"""
-    gemini_limiter.wait_if_needed()
-
-    system_message = SystemMessage(content="""You are a research specialist with access to web search and Wikipedia.
-    Use appropriate search tools to gather comprehensive information.
-    Always cite sources and provide well-researched answers.
-    Synthesize information from multiple sources when possible.
-    Finish with: FINAL ANSWER: [your researched answer]""")
-
-    # Create research agent
-    research_agent = create_react_agent(gemini_llm, research_tools)
-
-    # Process query
-    messages = [system_message, HumanMessage(content=state["query"])]
-    config = {"configurable": {"thread_id": "research_thread"}}
-
     try:
-        result = research_agent.invoke({"messages": messages}, config)
-        final_message = result["messages"][-1].content
-
-        return {
-            **state,
-            "messages": state["messages"] + [AIMessage(content=final_message)],
-            "final_answer": final_message
         }
-    except Exception as e:
-        error_msg = f"Research agent error: {str(e)}"
-        return {
-            **state,
-            "messages": state["messages"] + [AIMessage(content=error_msg)],
-            "final_answer": error_msg
-        }
-
-def coordinator_agent_node(state: AgentState) -> AgentState:
-    """Coordinator agent using NVIDIA Llama3"""
-    nvidia_limiter.wait_if_needed()
-
-    system_message = SystemMessage(content="""You are the main coordinator agent.
-    Analyze queries and provide comprehensive responses.
-    Use search tools for factual information when needed.
-    Always finish with: FINAL ANSWER: [your final answer]""")
-
-    # Create coordinator agent with NVIDIA's best general model
-    coordinator_agent = create_react_agent(nvidia_general_llm, coordinator_tools)
-
-    # Process query
-    messages = [system_message, HumanMessage(content=state["query"])]
-    config = {"configurable": {"thread_id": "coordinator_thread"}}
-
-    try:
-        result = coordinator_agent.invoke({"messages": messages}, config)
-        final_message = result["messages"][-1].content

-        return {
-            **state,
-            "messages": state["messages"] + [AIMessage(content=final_message)],
-            "final_answer": final_message
-        }
     except Exception as e:
-        error_msg = f"Coordinator agent error: {str(e)}"
-        return {
-            **state,
-            "messages": state["messages"] + [AIMessage(content=error_msg)],
-            "final_answer": error_msg
-        }

-# Conditional routing
-def route_agent(state: AgentState) -> str:
-    """Return the node name for the chosen agent type"""
-    agent_type = state["agent_type"]

-    if agent_type == "math":
-        return "math_agent"
-    elif agent_type == "code":
-        return "code_agent"
-    elif agent_type == "research":
-        return "research_agent"
     else:
-        return "coordinator_agent"

-# LangGraph Multi-Agent System
-class LangGraphMultiAgentSystem:
-    def __init__(self):
-        self.request_count = 0
-        self.last_request_time = time.time()
-        self.graph = self._create_graph()

-    def _create_graph(self):
-        """Create the LangGraph workflow"""
-        workflow = StateGraph(AgentState)
-
-        # Add nodes
-        workflow.add_node("router", router_node)
-        workflow.add_node("math_agent", math_agent_node)
-        workflow.add_node("code_agent", code_agent_node)
-        workflow.add_node("research_agent", research_agent_node)
-        workflow.add_node("coordinator_agent", coordinator_agent_node)
-
-        # Route from router to the specialist agents
-        workflow.set_entry_point("router")
-        workflow.add_conditional_edges(
-            "router",
-            route_agent,
-            {
-                "math_agent": "math_agent",
-                "code_agent": "code_agent",
-                "research_agent": "research_agent",
-                "coordinator_agent": "coordinator_agent"
-            }
-        )
-
-        # All agents end the workflow
-        workflow.add_edge("math_agent", END)
-        workflow.add_edge("code_agent", END)
-        workflow.add_edge("research_agent", END)
-        workflow.add_edge("coordinator_agent", END)
-
-        # Compile the graph
-        memory = MemorySaver()
-        return workflow.compile(checkpointer=memory)

-    def process_query(self, query: str) -> str:
-        """Process a query through the multi-agent graph"""
-        self.request_count += 1
-
-        try:
-            # Pace requests to stay inside free-tier limits
-            time.sleep(random.uniform(3, 10))
-
-            # Initial state
-            initial_state = {
-                "messages": [HumanMessage(content=query)],
-                "query": query,
-                "agent_type": "",
-                "final_answer": ""
-            }
-
-            # Configuration for the graph
-            config = {"configurable": {"thread_id": f"thread_{self.request_count}"}}

-
-            # Run the graph
-            final_state = self.graph.invoke(initial_state, config)
-            return final_state.get("final_answer", "No response generated")
-
-        except Exception as e:
-            return f"Error: {str(e)}"

-# …
-def …():
-    """…"""

-    …
-    if "FINAL ANSWER:" in full_response:
-        final_answer = full_response.split("FINAL ANSWER:")[-1].strip()
-        return final_answer
-    else:
-        return full_response.strip()

 if __name__ == "__main__":
-    …
+"""LangGraph Agent with FAISS Vector Store and Custom Tools"""
 import os, time, random
 from dotenv import load_dotenv
 from typing import List, Dict, Any, TypedDict, Annotated
 import operator

 # LangGraph imports
+from langgraph.graph import START, StateGraph, MessagesState
+from langgraph.prebuilt import tools_condition
+from langgraph.prebuilt import ToolNode
 from langgraph.checkpoint.memory import MemorySaver

 # LangChain imports
+from langchain_core.messages import SystemMessage, HumanMessage
 from langchain_core.tools import tool
 from langchain_groq import ChatGroq
 from langchain_google_genai import ChatGoogleGenerativeAI
 from langchain_nvidia_ai_endpoints import ChatNVIDIA
+from langchain_community.tools.tavily_search import TavilySearchResults
+from langchain_community.document_loaders import WikipediaLoader, ArxivLoader
+from langchain_community.vectorstores import FAISS
+from langchain_nvidia_ai_endpoints import NVIDIAEmbeddings
+from langchain.tools.retriever import create_retriever_tool
+from langchain_text_splitters import RecursiveCharacterTextSplitter
+from langchain_community.document_loaders import JSONLoader

+load_dotenv()

 # Advanced Rate Limiter (SILENT)
 class AdvancedRateLimiter:

         # Record this request
         self.request_times.append(current_time)

+# Initialize rate limiters
 groq_limiter = AdvancedRateLimiter(requests_per_minute=30)
 gemini_limiter = AdvancedRateLimiter(requests_per_minute=2)
+nvidia_limiter = AdvancedRateLimiter(requests_per_minute=5)

 # Custom Tools
 @tool
+def multiply(a: int, b: int) -> int:
+    """Multiply two numbers.
+    Args:
+        a: first int
+        b: second int
+    """
     return a * b

 @tool
+def add(a: int, b: int) -> int:
+    """Add two numbers.
+
+    Args:
+        a: first int
+        b: second int
+    """
     return a + b

 @tool
+def subtract(a: int, b: int) -> int:
+    """Subtract two numbers.
+
+    Args:
+        a: first int
+        b: second int
+    """
     return a - b

 @tool
+def divide(a: int, b: int) -> float:
+    """Divide two numbers.
+
+    Args:
+        a: first int
+        b: second int
+    """
     if b == 0:
         raise ValueError("Cannot divide by zero.")
     return a / b

 @tool
+def modulus(a: int, b: int) -> int:
+    """Get the modulus of two numbers.
+
+    Args:
+        a: first int
+        b: second int
+    """
+    return a % b

 @tool
+def wiki_search(query: str) -> str:
+    """Search Wikipedia for a query and return maximum 2 results.
+
+    Args:
+        query: The search query."""
     try:
         time.sleep(random.uniform(1, 3))
+        search_docs = WikipediaLoader(query=query, load_max_docs=2).load()
+        formatted_search_docs = "\n\n---\n\n".join(
+            [
+                f'<Document source="{doc.metadata["source"]}" page="{doc.metadata.get("page", "")}"/>\n{doc.page_content}\n</Document>'
+                for doc in search_docs
+            ])
+        return formatted_search_docs
     except Exception as e:
         return f"Wikipedia search failed: {str(e)}"

+@tool
+def web_search(query: str) -> str:
+    """Search Tavily for a query and return maximum 3 results.
+
+    Args:
+        query: The search query."""
     try:
+        time.sleep(random.uniform(2, 5))
+        search_docs = TavilySearchResults(max_results=3).invoke(query)
+        formatted_search_docs = "\n\n---\n\n".join(
+            [
+                f'<Document source="{doc.get("url", "")}" />\n{doc.get("content", "")}\n</Document>'
+                for doc in search_docs
+            ])
+        return formatted_search_docs
     except Exception as e:
+        return f"Web search failed: {str(e)}"

+@tool
+def arvix_search(query: str) -> str:
+    """Search arXiv for a query and return maximum 3 results.
+
+    Args:
+        query: The search query."""
     try:
+        time.sleep(random.uniform(1, 4))
+        search_docs = ArxivLoader(query=query, load_max_docs=3).load()
+        formatted_search_docs = "\n\n---\n\n".join(
+            [
+                f'<Document source="{doc.metadata["source"]}" page="{doc.metadata.get("page", "")}"/>\n{doc.page_content[:1000]}\n</Document>'
+                for doc in search_docs
+            ])
+        return formatted_search_docs
     except Exception as e:
+        return f"ArXiv search failed: {str(e)}"

+# Load and process JSONL data for FAISS vector store
+def setup_faiss_vector_store():
+    """Setup FAISS vector database from JSONL metadata"""
     try:
+        jq_schema = """
+        {
+            page_content: .Question,
+            metadata: {
+                task_id: .task_id,
+                Level: .Level,
+                Final_answer: ."Final answer",
+                file_name: .file_name,
+                Steps: .["Annotator Metadata"].Steps,
+                Number_of_steps: .["Annotator Metadata"]["Number of steps"],
+                How_long: .["Annotator Metadata"]["How long did this take?"],
+                Tools: .["Annotator Metadata"].Tools,
+                Number_of_tools: .["Annotator Metadata"]["Number of tools"]
+            }
         }
+        """

+        # Load documents
+        json_loader = JSONLoader(file_path="metadata.jsonl", jq_schema=jq_schema, json_lines=True, text_content=False)
+        json_docs = json_loader.load()
+
+        # Split documents
+        text_splitter = RecursiveCharacterTextSplitter(chunk_size=512, chunk_overlap=200)
+        json_chunks = text_splitter.split_documents(json_docs)
+
+        # Create FAISS vector store
+        embeddings = NVIDIAEmbeddings(
+            model="nvidia/nv-embedqa-e5-v5",
+            api_key=os.getenv("NVIDIA_API_KEY")
+        )
+        vector_store = FAISS.from_documents(json_chunks, embeddings)
+
+        return vector_store
     except Exception as e:
+        print(f"FAISS vector store setup failed: {e}")
+        return None
+
+# Load system prompt
+try:
+    with open("system_prompt.txt", "r", encoding="utf-8") as f:
+        system_prompt = f.read()
+except FileNotFoundError:
+    system_prompt = """You are a helpful assistant tasked with answering questions using a set of tools.
+Now, I will ask you a question. Report your thoughts, and finish your answer with the following template:
+FINAL ANSWER: [YOUR FINAL ANSWER].
+YOUR FINAL ANSWER should be a number OR as few words as possible OR a comma separated list of numbers and/or strings. If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise. If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise. If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string.
+Your answer should only start with "FINAL ANSWER: ", then follows with the answer."""
+
+# System message
+sys_msg = SystemMessage(content=system_prompt)

+# Setup FAISS vector store and retriever
+vector_store = setup_faiss_vector_store()
+if vector_store:
+    retriever = vector_store.as_retriever(search_type="similarity", search_kwargs={"k": 3})
+    retriever_tool = create_retriever_tool(
+        retriever=retriever,
+        name="Question_Search",
+        description="A tool to retrieve similar questions from a vector store.",
+    )
+else:
+    retriever_tool = None
+
+# All tools
+all_tools = [
+    multiply,
+    add,
+    subtract,
+    divide,
+    modulus,
+    wiki_search,
+    web_search,
+    arvix_search,
+]
+
+if retriever_tool:
+    all_tools.append(retriever_tool)
+
+# Build graph function
+def build_graph(provider: str = "groq"):
+    """Build the LangGraph with rate limiting"""

+    # Initialize LLMs with best free models
+    if provider == "google":
+        llm = ChatGoogleGenerativeAI(model="gemini-2.0-flash-thinking-exp", temperature=0)
+    elif provider == "groq":
+        llm = ChatGroq(model="llama-3.3-70b-versatile", temperature=0)
+    elif provider == "nvidia":
+        llm = ChatNVIDIA(model="meta/llama-3.1-70b-instruct", temperature=0)
     else:
+        raise ValueError("Invalid provider. Choose 'google', 'groq' or 'nvidia'.")

+    # Bind tools to LLM
+    llm_with_tools = llm.bind_tools(all_tools)
+
+    # Node functions
+    def assistant(state: MessagesState):
+        """Assistant node with rate limiting"""
+        if provider == "groq":
+            groq_limiter.wait_if_needed()
+        elif provider == "google":
+            gemini_limiter.wait_if_needed()
+        elif provider == "nvidia":
+            nvidia_limiter.wait_if_needed()
+
+        return {"messages": [llm_with_tools.invoke(state["messages"])]}

+    def retriever_node(state: MessagesState):
+        """Retriever node"""
+        if vector_store and len(state["messages"]) > 0:
+            try:
+                similar_questions = vector_store.similarity_search(state["messages"][-1].content, k=1)
+                if similar_questions:
+                    example_msg = HumanMessage(
+                        content=f"Here I provide a similar question and answer for reference: \n\n{similar_questions[0].page_content}",
+                    )
+                    return {"messages": [sys_msg] + state["messages"] + [example_msg]}
+            except Exception as e:
+                print(f"Retriever error: {e}")

+        return {"messages": [sys_msg] + state["messages"]}

+    # Build graph
+    builder = StateGraph(MessagesState)
+    builder.add_node("retriever", retriever_node)
+    builder.add_node("assistant", assistant)
+    builder.add_node("tools", ToolNode(all_tools))
+    builder.add_edge(START, "retriever")
+    builder.add_edge("retriever", "assistant")
+    builder.add_conditional_edges("assistant", tools_condition)
+    builder.add_edge("tools", "assistant")

+    # Compile graph with memory
+    memory = MemorySaver()
+    return builder.compile(checkpointer=memory)

+# Test
 if __name__ == "__main__":
+    question = "What are the names of the US presidents who were assassinated?"
+    # Build the graph
+    graph = build_graph(provider="groq")
+    # Run the graph
+    messages = [HumanMessage(content=question)]
+    config = {"configurable": {"thread_id": "test_thread"}}
+    result = graph.invoke({"messages": messages}, config)
+    for m in result["messages"]:
+        m.pretty_print()
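
A minimal sketch of how the new build_graph() entry point might be driven from a separate script (for instance, the Space's app.py). The build_graph API, the provider names, and the "FINAL ANSWER:" convention all come from the file above; the wrapper name answer_question, the thread id, and the sample question are illustrative assumptions, not part of this commit.

# Hypothetical driver for build_graph(); the wrapper name, thread id,
# and sample question below are illustrative only.
from langchain_core.messages import HumanMessage

from veryfinal import build_graph

def answer_question(question: str, provider: str = "groq") -> str:
    """Run one question through the compiled graph and strip the
    FINAL ANSWER: prefix that the system prompt asks the model to emit."""
    graph = build_graph(provider=provider)
    # Each conversation needs its own thread id for the MemorySaver checkpointer
    config = {"configurable": {"thread_id": "demo_thread"}}
    result = graph.invoke({"messages": [HumanMessage(content=question)]}, config)
    reply = result["messages"][-1].content
    if "FINAL ANSWER:" in reply:
        return reply.split("FINAL ANSWER:")[-1].strip()
    return reply.strip()

if __name__ == "__main__":
    print(answer_question("What is 25 multiplied by 17?"))

Because the graph is compiled with a MemorySaver checkpointer, reusing one thread_id carries earlier messages into later calls; a fresh id per question keeps runs independent.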
|