Spaces:

HASHIRUAgentX
/

hashiruAI

Running

App Files Files Community

helloparthshah committed on May 12

Commit

1476939

1 Parent(s): 0e323dc

Giving agent access to the model costs

Browse files

Files changed (5) hide show

src/manager/agent_manager.py +2 -2
src/manager/budget_manager.py +1 -0
src/manager/manager.py +3 -2
src/tools/default_tools/agent_cost_manager.py +78 -0
src/tools/default_tools/agent_creater_tool.py +7 -76

src/manager/agent_manager.py CHANGED Viewed

@@ -141,8 +141,8 @@ class AgentManager():
     def validate_budget(self, amount: float) -> None:
         if not self.budget_manager.can_spend(amount):
-            raise ValueError(f"Do not have enough budget to create the tool. "
-                        +f"Creating the tool costs {amount} but only {self.budget_manager.get_current_remaining_budget()} is remaining")
     def create_agent_class(self, agent_name: str, base_model: str, system_prompt: str, description: str = "", create_cost: float = 0, invoke_cost: float = 0,
                     **additional_params) -> Agent:

     def validate_budget(self, amount: float) -> None:
+        """Raise ValueError if the budget manager reports that `amount` cannot be spent.
+
+        The check is delegated to `self.budget_manager.can_spend(amount)`; the
+        error message includes the requested amount and the value returned by
+        `self.budget_manager.get_current_remaining_budget()`.
+        Returns None when the amount can be spent.
+        """
         if not self.budget_manager.can_spend(amount):
+            raise ValueError(f"Do not have enough budget to create/use the agent. "
+                        +f"Creating/Using the agent costs {amount} but only {self.budget_manager.get_current_remaining_budget()} is remaining")
     def create_agent_class(self, agent_name: str, base_model: str, system_prompt: str, description: str = "", create_cost: float = 0, invoke_cost: float = 0,
                     **additional_params) -> Agent:

src/manager/budget_manager.py CHANGED Viewed

@@ -1,6 +1,7 @@
 from src.manager.utils.singleton import singleton
 import torch
 import psutil
 @singleton
 class BudgetManager():
     TOTAL_BUDGET = 100

 from src.manager.utils.singleton import singleton
 import torch
 import psutil
 @singleton
 class BudgetManager():
     TOTAL_BUDGET = 100

src/manager/manager.py CHANGED Viewed

@@ -163,6 +163,7 @@ class GeminiManager:
         top_k = min(k, len(memories))
         # Semantic Retrieval with GPU
         device = 'cuda' if torch.cuda.is_available() else 'cpu'
         model = SentenceTransformer('all-MiniLM-L6-v2', device=device)
         doc_embeddings = model.encode(memories, convert_to_tensor=True, device=device)
         query_embedding = model.encode(query, convert_to_tensor=True, device=device)
@@ -195,13 +196,13 @@ class GeminiManager:
         logger.debug(f"Chat history: {chat_history}")
         try:
             response = suppress_output(self.generate_response)(chat_history)
         except Exception as e:
-            logger.debug(f"Error generating response: {e}")
             messages.append({
                 "role": "assistant",
                 "content": f"Error generating response: {e}"
             })
-            logger.error(f"Error generating response: {e}")
             yield messages
             return
         logger.debug(f"Response: {response}")

         top_k = min(k, len(memories))
         # Semantic Retrieval with GPU
         device = 'cuda' if torch.cuda.is_available() else 'cpu'
+        print(f"Using device: {device}")
         model = SentenceTransformer('all-MiniLM-L6-v2', device=device)
         doc_embeddings = model.encode(memories, convert_to_tensor=True, device=device)
         query_embedding = model.encode(query, convert_to_tensor=True, device=device)
         logger.debug(f"Chat history: {chat_history}")
         try:
             response = suppress_output(self.generate_response)(chat_history)
+            print(f"Response: {response}")
         except Exception as e:
             messages.append({
                 "role": "assistant",
                 "content": f"Error generating response: {e}"
             })
+            logger.error(f"Error generating response", e)
             yield messages
             return
         logger.debug(f"Response: {response}")

src/tools/default_tools/agent_cost_manager.py ADDED Viewed

	@@ -0,0 +1,78 @@

+__all__ = ['AgentCostManager']
+class AgentCostManager():
+    """Tool that reports the creation and invocation cost of each base model.
+
+    The cost table lives in the class attribute `costs`; `run` returns it
+    wrapped in a status/message/output dict, and `get_costs` returns it directly.
+    """
+    # No dependencies are declared for this tool.
+    dependencies = []
+    # Schema describing the tool: it takes no parameters (empty `properties`
+    # and empty `required`).
+    inputSchema = {
+        "name": "AgentCostManager",
+        "description": "Retrieves the cost of creating and invoking an agent. Please make sure to use this before creating an agent.",
+        "parameters": {
+            "type": "object",
+            "properties": {},
+            "required": [],
+        }
+    }
+    # Maps base model name -> {"description", "create_cost", "invoke_cost"}.
+    # NOTE(review): cost units are presumably the same units BudgetManager
+    # tracks -- confirm against the budget code.
+    costs = {
+        "llama3.2": {
+            "description": "3 Billion parameter model",
+            "create_cost": 10,
+            "invoke_cost": 20,
+        },
+        "mistral": {
+            "description": "7 Billion parameter model",
+            "create_cost": 20,
+            "invoke_cost": 50,
+        },
+        "gemini-2.5-flash-preview-04-17": {
+            "description": "Adaptive thinking, cost efficiency",
+            "create_cost": 20,
+            "invoke_cost": 50
+        },
+        "gemini-2.5-pro-preview-03-25": {
+            "description": "Enhanced thinking and reasoning, multimodal understanding, advanced coding, and more",
+            "create_cost": 20,
+            "invoke_cost": 50
+        },
+        "gemini-2.0-flash": {
+            "description": "Next generation features, speed, thinking, realtime streaming, and multimodal generation",
+            "create_cost": 20,
+            "invoke_cost": 50
+        },
+        "gemini-2.0-flash-lite": {
+            "description": "Cost efficiency and low latency",
+            "create_cost": 20,
+            "invoke_cost": 50
+        },
+        "gemini-1.5-flash": {
+            "description": "Fast and versatile performance across a diverse variety of tasks",
+            "create_cost": 20,
+            "invoke_cost": 50
+        },
+        "gemini-1.5-flash-8b": {
+            "description": "High volume and lower intelligence tasks",
+            "create_cost": 20,
+            "invoke_cost": 50
+        },
+        "gemini-1.5-pro": {
+            "description": "Complex reasoning tasks requiring more intelligence",
+            "create_cost": 20,
+            "invoke_cost": 50
+        },
+        "gemini-2.0-flash-live-001": {
+            "description": "Low-latency bidirectional voice and video interactions",
+            "create_cost": 20,
+            "invoke_cost": 50
+        }
+    }
+    def get_costs(self):
+        """Return the `costs` table itself (the same dict object, not a copy)."""
+        return self.costs
+    def run(self, **kwargs):
+        """Return the cost table in a status/message/output dict.
+
+        Any keyword arguments are accepted and ignored.
+        """
+        return {
+            "status": "success",
+            "message": "Cost of creating and invoking an agent",
+            "output": self.costs,
+        }

src/tools/default_tools/agent_creater_tool.py CHANGED Viewed

@@ -1,6 +1,7 @@
 from src.manager.agent_manager import AgentManager
 from src.manager.config.model_selector import choose_best_model
 from src.manager.utils.runtime_selector import detect_runtime_environment
 __all__ = ['AgentCreator']
 class AgentCreator():
@@ -20,7 +21,7 @@ class AgentCreator():
                 },
                 "base_model": {
                     "type": "string",
-                    "description": "A base model from which the new agent mode is to be created. Available models are: llama3.2, mistral, gemini-2.5-flash-preview-04-17, gemini-2.5-pro-preview-03-25, gemini-2.0-flash, gemini-2.0-flash-lite, gemini-1.5-flash, gemini-1.5-flash-8b, gemini-1.5-pro, and gemini-2.0-flash-live-001"
                 },
                 "system_prompt": {
                     "type": "string",
@@ -31,78 +32,7 @@ class AgentCreator():
                     "description": "Description of the agent. This is a string that describes the agent and its capabilities. It should be a single line description.",
                 },
             },
-            "required": ["agent_name", "system_prompt", "description"],
-            #"required": ["agent_name", "base_model", "system_prompt", "description"],
-        },
-        "creates": {
-            "selector": "base_model",
-            "types": {
-                "llama3.2":{
-                    "description": "3 Billion parameter model",
-                    "create_cost": 10,
-                    "invoke_cost": 20,
-                },
-                "mistral":{
-                    "description": "7 Billion parameter model",
-                    "create_cost": 20,
-                    "invoke_cost": 50,
-                },
-                "gemini-2.5-flash-preview-04-17": {
-                    "description": "Adaptive thinking, cost efficiency",
-                    "create_cost": 20,
-                    "invoke_cost": 50
-                },
-                "gemini-2.5-pro-preview-03-25": {
-                    "description": "Enhanced thinking and reasoning, multimodal understanding, advanced coding, and more",
-                    "create_cost": 20,
-                    "invoke_cost": 50
-                },
-                "gemini-2.0-flash": {
-                    "description": "Next generation features, speed, thinking, realtime streaming, and multimodal generation",
-                    "create_cost": 20,
-                    "invoke_cost": 50
-                },
-                "gemini-2.0-flash-lite": {
-                    "description": "Cost efficiency and low latency",
-                    "create_cost": 20,
-                    "invoke_cost": 50
-                },
-                "gemini-1.5-flash": {
-                    "description": "Fast and versatile performance across a diverse variety of tasks",
-                    "create_cost": 20,
-                    "invoke_cost": 50
-                },
-                "gemini-1.5-flash-8b": {
-                    "description": "High volume and lower intelligence tasks",
-                    "create_cost": 20,
-                    "invoke_cost": 50
-                },
-                "gemini-1.5-pro": {
-                    "description": "Complex reasoning tasks requiring more intelligence",
-                    "create_cost": 20,
-                    "invoke_cost": 50
-                },
-                # "gemini-embedding-exp": {
-                #     "description": "Measuring the relatedness of text strings",
-                #     "create_cost": 20,
-                #     "invoke_cost": 50
-                # },
-                # "imagen-3.0-generate-002": {
-                #     "description": "Our most advanced image generation model",
-                #     "create_cost": 20,
-                #     "invoke_cost": 50
-                # },
-                # "veo-2.0-generate-001": {
-                #     "description": "High quality video generation",
-                #     "create_cost": 20,
-                #     "invoke_cost": 50
-                # },
-                "gemini-2.0-flash-live-001": {
-                    "description": "Low-latency bidirectional voice and video interactions",
-                    "create_cost": 20,
-                    "invoke_cost": 50
-                }
-            }
         }
     }
@@ -118,11 +48,12 @@ class AgentCreator():
         system_prompt = kwargs.get("system_prompt")
         description = kwargs.get("description")
-        create_cost = self.inputSchema["creates"]["types"][base_model]["create_cost"]
-        if base_model not in self.inputSchema["creates"]["types"]:
             print(f"[WARN] Auto-selected model '{base_model}' not in schema. Falling back to gemini-2.0-flash")
             base_model = "gemini-2.0-flash"
-        invoke_cost = self.inputSchema["creates"]["types"][base_model]["invoke_cost"]
         agent_manager = AgentManager()
         try:

 from src.manager.agent_manager import AgentManager
 from src.manager.config.model_selector import choose_best_model
 from src.manager.utils.runtime_selector import detect_runtime_environment
+from src.tools.default_tools.agent_cost_manager import AgentCostManager
 __all__ = ['AgentCreator']
 class AgentCreator():
                 },
                 "base_model": {
                     "type": "string",
+                    "description": "A base model from which the new agent mode is to be created. Check the available models using the AgentCostManager tool.",
                 },
                 "system_prompt": {
                     "type": "string",
                     "description": "Description of the agent. This is a string that describes the agent and its capabilities. It should be a single line description.",
                 },
             },
+            "required": ["agent_name", "base_model", "system_prompt", "description"],
         }
     }
         system_prompt = kwargs.get("system_prompt")
         description = kwargs.get("description")
+        model_costs = AgentCostManager().get_costs()
+        create_cost = model_costs[base_model]["create_cost"]
+        if base_model not in model_costs:
             print(f"[WARN] Auto-selected model '{base_model}' not in schema. Falling back to gemini-2.0-flash")
             base_model = "gemini-2.0-flash"
+        invoke_cost = model_costs[base_model]["invoke_cost"]
         agent_manager = AgentManager()
         try: