hashiruAI

Sleeping

App Files Community

helloparthshah committed on May 23

Commit

657847e

1 Parent(s): 979f76c

updated costs

Browse files

Files changed (2) hide show

src/manager/agent_manager.py +4 -4
src/tools/default_tools/agent_cost_manager.py +18 -18

src/manager/agent_manager.py CHANGED Viewed

@@ -111,6 +111,7 @@ class GeminiAgent(Agent):
         # Initialize the Gemini API
         self.client = genai.Client(api_key=self.api_key)
         # Call parent constructor after API setup
         super().__init__(agent_name,
@@ -125,9 +126,8 @@ class GeminiAgent(Agent):
         self.messages = []
     def ask_agent(self, prompt):
-        response = self.client.models.generate_content(
-            model=self.base_model,
-            contents=prompt,
             config=types.GenerateContentConfig(
                 system_instruction=self.system_prompt,
             )
@@ -369,7 +369,7 @@ class AgentManager():
         if not self.is_cloud_invocation_enabled and agent.get_type() == "cloud":
             raise ValueError("Cloud invocation mode is disabled.")
-        n_tokens = len(prompt.split())/1000
         self.validate_budget(agent.invoke_resource_cost,
                              agent.invoke_expense_cost*n_tokens)

         # Initialize the Gemini API
         self.client = genai.Client(api_key=self.api_key)
+        self.chat = self.client.chats.create(model=base_model)
         # Call parent constructor after API setup
         super().__init__(agent_name,
         self.messages = []
     def ask_agent(self, prompt):
+        response = self.chat.send_message(
+            message=prompt,
             config=types.GenerateContentConfig(
                 system_instruction=self.system_prompt,
             )
         if not self.is_cloud_invocation_enabled and agent.get_type() == "cloud":
             raise ValueError("Cloud invocation mode is disabled.")
+        n_tokens = len(prompt.split())/1000000
         self.validate_budget(agent.invoke_resource_cost,
                              agent.invoke_expense_cost*n_tokens)

src/tools/default_tools/agent_cost_manager.py CHANGED Viewed

@@ -32,43 +32,43 @@ class AgentCostManager():
         },
         "gemini-2.5-flash-preview-04-17": {
             "description": "Adaptive thinking, cost efficiency",
-            "create_expense_cost": 0.005,
-            "invoke_expense_cost": 0.00017
         },
-        "gemini-2.5-pro-preview-03-25": {
             "description": "Enhanced thinking and reasoning, multimodal understanding, advanced coding, and more",
-            "create_expense_cost": 0.005,
-            "invoke_expense_cost": 0.0001275
         },
         "gemini-2.0-flash": {
-            "description": "Next generation features, speed, thinking, realtime streaming, and multimodal generation",
-            "create_expense_cost": 0.005,
-            "invoke_expense_cost": 0.00017
         },
         "gemini-2.0-flash-lite": {
             "description": "Cost efficiency and low latency",
-            "create_expense_cost": 0.005,
-            "invoke_expense_cost": 0.00017
         },
         "gemini-1.5-flash": {
             "description": "Fast and versatile performance across a diverse variety of tasks",
-            "create_expense_cost": 0.005,
-            "invoke_expense_cost": 0.00017
         },
         "gemini-1.5-flash-8b": {
             "description": "High volume and lower intelligence tasks",
-            "create_expense_cost": 0.005,
-            "invoke_expense_cost": 0.00017
         },
         "gemini-1.5-pro": {
             "description": "Complex reasoning tasks requiring more intelligence",
-            "create_expense_cost": 0.005,
-            "invoke_expense_cost": 0.0001275
         },
         "gemini-2.0-flash-live-001": {
             "description": "Low-latency bidirectional voice and video interactions",
-            "create_expense_cost": 0.005,
-            "invoke_expense_cost": 0.000635
         }
     }

         },
         "gemini-2.5-flash-preview-04-17": {
             "description": "Adaptive thinking, cost efficiency",
+            "create_expense_cost": 0,
+            "invoke_expense_cost": 0.15,
         },
+        "gemini-2.5-pro-preview-05-06": {
             "description": "Enhanced thinking and reasoning, multimodal understanding, advanced coding, and more",
+            "create_expense_cost": 0,
+            "invoke_expense_cost": 1.25,
         },
         "gemini-2.0-flash": {
+            "description": "Next generation features, speed.",
+            "create_expense_cost": 0,
+            "invoke_expense_cost": 0.10,
         },
         "gemini-2.0-flash-lite": {
             "description": "Cost efficiency and low latency",
+            "create_expense_cost": 0,
+            "invoke_expense_cost": 0.075
         },
         "gemini-1.5-flash": {
             "description": "Fast and versatile performance across a diverse variety of tasks",
+            "create_expense_cost": 0,
+            "invoke_expense_cost": 0.075,
         },
         "gemini-1.5-flash-8b": {
             "description": "High volume and lower intelligence tasks",
+            "create_expense_cost": 0,
+            "invoke_expense_cost": 0.0375,
         },
         "gemini-1.5-pro": {
             "description": "Complex reasoning tasks requiring more intelligence",
+            "create_expense_cost": 0,
+            "invoke_expense_cost": 1.25,
         },
         "gemini-2.0-flash-live-001": {
             "description": "Low-latency bidirectional voice and video interactions",
+            "create_expense_cost": 0,
+            "invoke_expense_cost": 0.50,
         }
     }