Abbasid committed on
Commit d5ef142 · verified · 1 Parent(s): 83ebef7

Update agent.py

Files changed (1)
  1. agent.py +120 -146
agent.py CHANGED
@@ -8,10 +8,9 @@ import re
  import subprocess
  import textwrap
  import base64
- from datetime import datetime, timedelta
  from io import BytesIO
  from pathlib import Path
- from typing import List

  # Third-party libraries
  import requests
@@ -23,9 +22,9 @@ from langchain.schema import Document
  from langchain.tools.retriever import create_retriever_tool
  from langchain_community.vectorstores import FAISS
  from langchain_community.tools.tavily_search import TavilySearchResults
- from langchain_community.document_loaders import WikipediaLoader, ArxivLoader # Added loaders
  from langchain_core.messages import SystemMessage, HumanMessage, AIMessage
- from langchain_core.tools import tool
  from langchain_google_genai import ChatGoogleGenerativeAI
  from langchain_groq import ChatGroq
  from langchain_huggingface import HuggingFaceEmbeddings, HuggingFaceEndpoint, ChatHuggingFace
@@ -42,185 +41,143 @@ load_dotenv()
  JSONL_PATH = Path("metadata.jsonl")
  FAISS_CACHE = Path("faiss_index.pkl")
  EMBED_MODEL = "sentence-transformers/all-mpnet-base-v2"
- RETRIEVER_K = 5 # Number of similar documents to retrieve
- CACHE_TTL = 600 # Cache API calls for 10 minutes
- # Global cache object for API calls
  API_CACHE = TTLCache(maxsize=256, ttl=CACHE_TTL)

  # ----------------------------------------------------------
- # Section 2: The Agent Class
  # ----------------------------------------------------------
- class MyAgent:
-     """
-     Encapsulates the agent's state, including LLMs, retriever, and tools.
-     This class-based approach ensures clean management of dependencies.
-     """

-     def __init__(self, provider: str = "groq"):
-         """
-         Initializes the agent, setting up LLMs and the FAISS retriever.
-         Args:
-             provider (str): The LLM provider to use ('google', 'groq', 'huggingface').
-         """
-         print(f"Initializing agent with provider: {provider}")
-
-         self.llm = self._build_llm(provider)
-         self.vision_llm = ChatGroq(model_name="meta-llama/llama-4-maverick-17b-128e-instruct", temperature=0)
-         self.retriever = self._get_retriever()
-
-     def _get_retriever(self):
-         """Builds or loads the FAISS retriever from a local cache."""
-         embeddings = HuggingFaceEmbeddings(model_name=EMBED_MODEL)
-
-         if FAISS_CACHE.exists():
-             print(f"Loading FAISS index from cache: {FAISS_CACHE}")
-             with open(FAISS_CACHE, "rb") as f:
-                 vector_store = pickle.load(f)
-         else:
-             print("FAISS cache not found. Building new index from metadata.jsonl...")
-             if not JSONL_PATH.exists():
-                 raise FileNotFoundError(f"{JSONL_PATH} not found. Cannot build vector store.")
-             docs = [Document(page_content=f"Question: {rec['Question']}\n\nFinal answer: {rec['Final answer']}", metadata={"source": rec["task_id"]}) for rec in (json.loads(line) for line in open(JSONL_PATH, "rt", encoding="utf-8"))]
-             if not docs: raise ValueError("No documents found in metadata.jsonl.")
-             vector_store = FAISS.from_documents(docs, embeddings)
-             with open(FAISS_CACHE, "wb") as f: pickle.dump(vector_store, f)
-             print(f"FAISS index built and saved to cache: {FAISS_CACHE}")
-
-         return vector_store.as_retriever(search_kwargs={"k": RETRIEVER_K})
-
-     def _build_llm(self, provider: str):
-         """Helper to build the main text-based LLM based on the chosen provider."""
-         if provider == "google": return ChatGoogleGenerativeAI(model="gemini-1.5-pro-latest", temperature=0)
-         elif provider == "groq": return ChatGroq(model_name="meta-llama/llama-4-maverick-17b-128e-instruct", temperature=0)
-         elif provider == "huggingface": return ChatHuggingFace(llm=HuggingFaceEndpoint(repo_id="Qwen/Qwen2.5-Coder-32B-Instruct", temperature=0))
-         else: raise ValueError("Provider must be 'google', 'groq', or 'huggingface'")
-
-     def _cached_get(self, key: str, fetch_fn):
-         """Helper for caching API calls."""
-         if key in API_CACHE: return API_CACHE[key]
-         val = fetch_fn()
-         API_CACHE[key] = val
-         return val
-
-     # --- Tool Definitions as Class Methods ---
-
-     @tool
-     def python_repl(self, code: str) -> str:
-         """Executes a string of Python code and returns the stdout/stderr."""
-         code = textwrap.dedent(code).strip()
-         try:
-             result = subprocess.run(["python", "-c", code], capture_output=True, text=True, timeout=10, check=False)
-             if result.returncode == 0: return f"Execution successful.\nSTDOUT:\n```\n{result.stdout}\n```"
-             else: return f"Execution failed.\nSTDOUT:\n```\n{result.stdout}\n```\nSTDERR:\n```\n{result.stderr}\n```"
-         except subprocess.TimeoutExpired: return "Execution timed out (>10s)."
-
-     @tool
-     def describe_image(self, image_source: str) -> str:
-         """Describes an image from a local file path or a URL using Gemini vision."""
-         try:
-             if image_source.startswith("http"):
-                 img = Image.open(BytesIO(requests.get(image_source, timeout=10).content))
-             else:
-                 img = Image.open(image_source)
-             buffered = BytesIO()
-             img.convert("RGB").save(buffered, format="JPEG")
-             b64_string = base64.b64encode(buffered.getvalue()).decode()
-             msg = HumanMessage(content=[{"type": "text", "text": "Describe this image in detail."}, {"type": "image_url", "image_url": {"url": f"data:image/jpeg;base64,{b64_string}"}}])
-             return self.vision_llm.invoke([msg]).content
-         except Exception as e: return f"Error processing image: {e}"
-
-     @tool
-     def web_search(self, query: str) -> str:
-         """Performs a web search using Tavily and returns a compilation of results."""
-         key = f"web:{query}"
-         results = self._cached_get(key, lambda: TavilySearchResults(max_results=5).invoke(query))
-         return "\n\n---\n\n".join([f"Source: {res['url']}\nContent: {res['content']}" for res in results])
-
-     @tool
-     def wiki_search(self, query: str) -> str:
-         """Searches Wikipedia and returns the top 2 results."""
-         key = f"wiki:{query}"
-         docs = self._cached_get(key, lambda: WikipediaLoader(query=query, load_max_docs=2, doc_content_chars_max=2000).load())
-         return "\n\n---\n\n".join([f"Source: {d.metadata['source']}\n\n{d.page_content}" for d in docs])
-
-     @tool
-     def arxiv_search(self, query: str) -> str:
-         """Searches Arxiv for scientific papers and returns the top 2 results."""
-         key = f"arxiv:{query}"
-         docs = self._cached_get(key, lambda: ArxivLoader(query=query, load_max_docs=2).load())
-         return "\n\n---\n\n".join([f"Source: {d.metadata['source']}\nPublished: {d.metadata['Published']}\nTitle: {d.metadata['Title']}\n\nSummary:\n{d.page_content}" for d in docs])
-
-     def get_tools(self) -> list:
-         """Returns a list of all tools available to the agent."""
-         tools_list = [
-             self.python_repl,
-             self.describe_image,
-             self.web_search,
-             self.wiki_search,
-             self.arxiv_search,
-         ]
-         retriever_tool = create_retriever_tool(
-             retriever=self.retriever,
-             name="retrieve_examples",
-             description="Retrieve solved questions and answers similar to the user's query.",
-         )
-         tools_list.append(retriever_tool)
-         return tools_list

  # ----------------------------------------------------------
  # Section 3: System Prompt
  # ----------------------------------------------------------
-
  SYSTEM_PROMPT = (
  """You are an expert-level research assistant designed to answer questions accurately.

  **Your Reasoning Process:**
- 1. **Think Step-by-Step:** Before answering, break down the user's question into a series of logical steps. Plan which tools you need to use for each step.
- 2. **Use Your Tools:** Execute your plan by calling one tool at a time. Analyze the results from the tool to see if you have enough information.
- 3. **Iterate if Necessary:** If the first tool call doesn't give you the full answer, continue to use other tools until you are confident you have all the necessary information.
- 4. **Synthesize the Final Answer:** Once you have gathered all the information, and only then, formulate a concise final answer.

  **Output Format:**
- - Your final response to the user MUST strictly follow this format and nothing else:
  `FINAL ANSWER: [Your concise and accurate answer here]`

  **Crucial Instructions:**
- - If the tools you have **cannot possibly answer the question** (e.g., the question asks you to listen to an audio file, watch a video, or read a local file you cannot access), you MUST respond by stating the limitation.
  - In case of a limitation, your response should be:
  `FINAL ANSWER: I am unable to answer this question because it requires a capability I do not possess, such as [describe the missing capability].`
-
- **Example of handling a limitation:**
- - User Question: "Please summarize the attached PDF."
- - Your Response: `FINAL ANSWER: I am unable to answer this question because it requires a capability I do not possess, such as reading local PDF files.`
  """
  )

  # ----------------------------------------------------------
  # Section 4: Factory Function for Agent Executor
  # ----------------------------------------------------------
- def create_agent_executor(provider: str = "google"):
-     """Factory function to create and compile the LangGraph agent executor."""
-     my_agent_instance = MyAgent(provider=provider)
-     tools_list = my_agent_instance.get_tools()
-     llm_with_tools = my_agent_instance.llm.bind_tools(tools_list)

      def retriever_node(state: MessagesState):
-         """First node: retrieves examples and prepends them to the message history."""
          user_query = state["messages"][-1].content
-         docs = my_agent_instance.retriever.invoke(user_query)
          messages = [SystemMessage(content=SYSTEM_PROMPT)]
          if docs:
              example_text = "\n\n---\n\n".join(d.page_content for d in docs)
-             example_msg = AIMessage(content=f"I have found {len(docs)} similar solved examples:\n\n{example_text}", name="ExampleRetriever")
-             messages.append(example_msg)
          messages.extend(state["messages"])
          return {"messages": messages}

      def assistant_node(state: MessagesState):
-         """Main assistant node: calls the LLM with the current state to decide the next action."""
          result = llm_with_tools.invoke(state["messages"])
          return {"messages": [result]}

      builder = StateGraph(MessagesState)
      builder.add_node("retriever", retriever_node)
      builder.add_node("assistant", assistant_node)
@@ -236,10 +193,27 @@ def create_agent_executor(provider: str = "google"):
      return agent_executor

  # ----------------------------------------------------------
- # Section 5: Direct Execution Block for Testing
  # ----------------------------------------------------------
  if __name__ == "__main__":
-     """direct testing of the agent's logic."""
      print("--- Running Agent in Test Mode ---")
      agent = create_agent_executor(provider="google")
      question = "According to wikipedia, what is the main difference between a lama and an alpaca?"

  import subprocess
  import textwrap
  import base64
+ import functools # Used to pre-fill arguments for our tool functions
  from io import BytesIO
  from pathlib import Path

  # Third-party libraries
  import requests

  from langchain.tools.retriever import create_retriever_tool
  from langchain_community.vectorstores import FAISS
  from langchain_community.tools.tavily_search import TavilySearchResults
+ from langchain_community.document_loaders import WikipediaLoader, ArxivLoader
  from langchain_core.messages import SystemMessage, HumanMessage, AIMessage
+ from langchain_core.tools import Tool, tool # Import Tool for manual tool creation
  from langchain_google_genai import ChatGoogleGenerativeAI
  from langchain_groq import ChatGroq
  from langchain_huggingface import HuggingFaceEmbeddings, HuggingFaceEndpoint, ChatHuggingFace

  JSONL_PATH = Path("metadata.jsonl")
  FAISS_CACHE = Path("faiss_index.pkl")
  EMBED_MODEL = "sentence-transformers/all-mpnet-base-v2"
+ RETRIEVER_K = 5
+ CACHE_TTL = 600
  API_CACHE = TTLCache(maxsize=256, ttl=CACHE_TTL)

+ # Global helper for caching API calls
+ def cached_get(key: str, fetch_fn):
+     if key in API_CACHE: return API_CACHE[key]
+     val = fetch_fn()
+     API_CACHE[key] = val
+     return val
+
  # ----------------------------------------------------------
+ # Section 2: Standalone Tool Functions (No 'self' parameter)
  # ----------------------------------------------------------

+ @tool
+ def python_repl(code: str) -> str:
+     """Executes a string of Python code and returns the stdout/stderr."""
+     code = textwrap.dedent(code).strip()
+     try:
+         result = subprocess.run(["python", "-c", code], capture_output=True, text=True, timeout=10, check=False)
+         if result.returncode == 0: return f"Execution successful.\nSTDOUT:\n```\n{result.stdout}\n```"
+         else: return f"Execution failed.\nSTDOUT:\n```\n{result.stdout}\n```\nSTDERR:\n```\n{result.stderr}\n```"
+     except subprocess.TimeoutExpired: return "Execution timed out (>10s)."
+
+ # These functions now accept their dependencies (like an llm instance or a cache function) as arguments.
+ @tool
+ def describe_image_func(image_source: str, vision_llm_instance) -> str:
+     """Describes an image from a local file path or a URL using a provided vision LLM."""
+     try:
+         if image_source.startswith("http"): img = Image.open(BytesIO(requests.get(image_source, timeout=10).content))
+         else: img = Image.open(image_source)
+         buffered = BytesIO()
+         img.convert("RGB").save(buffered, format="JPEG")
+         b64_string = base64.b64encode(buffered.getvalue()).decode()
+         msg = HumanMessage(content=[{"type": "text", "text": "Describe this image in detail."}, {"type": "image_url", "image_url": {"url": f"data:image/jpeg;base64,{b64_string}"}}])
+         return vision_llm_instance.invoke([msg]).content
+     except Exception as e: return f"Error processing image: {e}"
+ @tool
+ def web_search_func(query: str, cache_func) -> str:
+     """Performs a web search using Tavily and returns a compilation of results."""
+     key = f"web:{query}"
+     results = cache_func(key, lambda: TavilySearchResults(max_results=5).invoke(query))
+     return "\n\n---\n\n".join([f"Source: {res['url']}\nContent: {res['content']}" for res in results])
+ @tool
+ def wiki_search_func(query: str, cache_func) -> str:
+     """Searches Wikipedia and returns the top 2 results."""
+     key = f"wiki:{query}"
+     docs = cache_func(key, lambda: WikipediaLoader(query=query, load_max_docs=2, doc_content_chars_max=2000).load())
+     return "\n\n---\n\n".join([f"Source: {d.metadata['source']}\n\n{d.page_content}" for d in docs])
+ @tool
+ def arxiv_search_func(query: str, cache_func) -> str:
+     """Searches Arxiv for scientific papers and returns the top 2 results."""
+     key = f"arxiv:{query}"
+     docs = cache_func(key, lambda: ArxivLoader(query=query, load_max_docs=2).load())
+     return "\n\n---\n\n".join([f"Source: {d.metadata['source']}\nPublished: {d.metadata['Published']}\nTitle: {d.metadata['Title']}\n\nSummary:\n{d.page_content}" for d in docs])

  # ----------------------------------------------------------
  # Section 3: System Prompt
  # ----------------------------------------------------------
  SYSTEM_PROMPT = (
  """You are an expert-level research assistant designed to answer questions accurately.

  **Your Reasoning Process:**
+ 1. **Think Step-by-Step:** Break down the user's question into logical steps. Plan which tools you need.
+ 2. **Use Your Tools:** Execute your plan by calling one tool at a time. Analyze the results.
+ 3. **Iterate:** If needed, use more tools until you have enough information.
+ 4. **Synthesize:** Formulate a concise final answer based on the information.

  **Output Format:**
+ - Your final response MUST strictly follow this format:
  `FINAL ANSWER: [Your concise and accurate answer here]`

  **Crucial Instructions:**
+ - If your tools **cannot possibly answer the question** (e.g., it requires watching a video or listening to audio), you MUST respond by stating the limitation.
  - In case of a limitation, your response should be:
  `FINAL ANSWER: I am unable to answer this question because it requires a capability I do not possess, such as [describe the missing capability].`
  """
  )

  # ----------------------------------------------------------
  # Section 4: Factory Function for Agent Executor
  # ----------------------------------------------------------
+ def create_agent_executor(provider: str = "groq"):
+     """
+     Factory function to create and compile the LangGraph agent executor.
+     This version creates tools from standalone functions to ensure model compatibility.
+     """
+     print(f"Initializing agent with provider: {provider}")
+
+     # Step 1: Build LLMs
+     if provider == "google": main_llm = ChatGoogleGenerativeAI(model="gemini-1.5-pro-latest", temperature=0)
+     elif provider == "groq": main_llm = ChatGroq(model_name="meta-llama/llama-4-maverick-17b-128e-instruct", temperature=0)
+     elif provider == "huggingface": main_llm = ChatHuggingFace(llm=HuggingFaceEndpoint(repo_id="mistralai/Mixtral-8x7B-Instruct-v0.1", temperature=0.1))
+     else: raise ValueError("Invalid provider selected")
+     vision_llm = ChatGroq(model_name="meta-llama/llama-4-maverick-17b-128e-instruct", temperature=0)
+
+     # Step 2: Build Retriever
+     embeddings = HuggingFaceEmbeddings(model_name=EMBED_MODEL)
+     if FAISS_CACHE.exists():
+         with open(FAISS_CACHE, "rb") as f: vector_store = pickle.load(f)
+     else:
+         docs = [Document(page_content=f"Question: {rec['Question']}\n\nFinal answer: {rec['Final answer']}", metadata={"source": rec["task_id"]}) for rec in (json.loads(line) for line in open(JSONL_PATH, "rt", encoding="utf-8"))]
+         vector_store = FAISS.from_documents(docs, embeddings)
+         with open(FAISS_CACHE, "wb") as f: pickle.dump(vector_store, f)
+     retriever = vector_store.as_retriever(search_kwargs={"k": RETRIEVER_K})
+
+     # Step 3: Create the final list of tools
+     # We use functools.partial to "bake in" the dependencies (like the LLM or cache) into our standalone functions.
+     # This creates new functions with a simpler signature that the agent can easily call.
+     tools_list = [
+         python_repl,
+         Tool(name="describe_image", func=functools.partial(describe_image_func, vision_llm_instance=vision_llm), description="Describes an image from a local file path or a URL."),
+         Tool(name="web_search", func=functools.partial(web_search_func, cache_func=cached_get), description="Performs a web search using Tavily."),
+         Tool(name="wiki_search", func=functools.partial(wiki_search_func, cache_func=cached_get), description="Searches Wikipedia."),
+         Tool(name="arxiv_search", func=functools.partial(arxiv_search_func, cache_func=cached_get), description="Searches Arxiv for scientific papers."),
+         create_retriever_tool(retriever=retriever, name="retrieve_examples", description="Retrieve solved questions similar to the user's query."),
+     ]
+
+     llm_with_tools = main_llm.bind_tools(tools_list)

+     # Step 4: Define Graph Nodes
      def retriever_node(state: MessagesState):
          user_query = state["messages"][-1].content
+         docs = retriever.invoke(user_query)
          messages = [SystemMessage(content=SYSTEM_PROMPT)]
          if docs:
              example_text = "\n\n---\n\n".join(d.page_content for d in docs)
+             messages.append(AIMessage(content=f"I have found {len(docs)} similar solved examples:\n\n{example_text}", name="ExampleRetriever"))
          messages.extend(state["messages"])
          return {"messages": messages}

      def assistant_node(state: MessagesState):
          result = llm_with_tools.invoke(state["messages"])
          return {"messages": [result]}

+     # Step 5: Build Graph
      builder = StateGraph(MessagesState)
      builder.add_node("retriever", retriever_node)
      builder.add_node("assistant", assistant_node)

      return agent_executor

  # ----------------------------------------------------------
+ # Section 5: Pre-flight check and Direct Execution Block
  # ----------------------------------------------------------
+ def test_llm_connection(provider: str = "google"):
+     """Performs a quick test to see if the LLM provider is accessible."""
+     print(f"--- Performing pre-flight check for LLM provider: {provider} ---")
+     try:
+         if provider == "google": llm, name = ChatGoogleGenerativeAI(model="gemini-1.5-pro-latest"), "Google Gemini"
+         elif provider == "groq": llm, name = ChatGroq(model_name="llama3-70b-8192"), "Groq"
+         elif provider == "huggingface": llm, name = ChatHuggingFace(llm=HuggingFaceEndpoint(repo_id="mistralai/Mixtral-8x7B-Instruct-v0.1")), "Hugging Face"
+         else: return "❌ **LLM Status:** Invalid provider configured."
+         llm.invoke("hello")
+         success_message = f"✅ **LLM Status:** Connection to {name} is successful."
+         print(success_message)
+         return success_message
+     except Exception as e:
+         error_message = f"❌ **LLM Status:** FAILED to connect. Check API keys/credits. Details: {e}"
+         print(error_message)
+         return error_message
+
  if __name__ == "__main__":
+     """Allows for direct testing of the agent's logic."""
      print("--- Running Agent in Test Mode ---")
      agent = create_agent_executor(provider="google")
      question = "According to wikipedia, what is the main difference between a lama and an alpaca?"