hashiruAI / src /tools /default_tools /agent_cost_manager.py
Kunal Pai
Refactor LambdaAgent to use OpenAI client and update cost manager with new Lambda model expenses
fcdfb63
__all__ = ['AgentCostManager']
class AgentCostManager():
dependencies = []
inputSchema = {
"name": "AgentCostManager",
"description": "Retrieves the cost of creating and invoking an agent. Also includes the strengths of each model. Please make sure to use this before creating an agent.",
"parameters": {
"type": "object",
"properties": {},
"required": [],
}
}
costs = {
"llama3.2": {
"description": "Avg Accuracy: 49.75%, Latency 0.9s, 63.4% on multi-task understanding, 40.8% on rewriting, 78.6% on reasoning.",
"create_resource_cost": 10,
"invoke_resource_cost": 40,
},
"mistral": {
"description": "Avg Accuracy: 51.3%, Latency 9.7s, 51% on LegalBench, 60.1% on multi-task understanding, 69.9% on TriviaQA, 67.9% on reasoning",
"create_resource_cost": 20,
"invoke_resource_cost": 100,
},
"deepseek-r1": {
"description": "Avg Accuracy: 77.3%, Latency: 120s, 69.9% on LegalBench, 71.1% on multi-task understanding, 92.2% on Math",
"create_resource_cost": 20,
"invoke_resource_cost": 150,
},
"gemini-2.5-flash-preview-05-20": {
"description": "Avg Accuracy: 75.8%, 82.8% on LegalBench, 81.6% on multi-task understanding, 91.6% on Math",
"create_expense_cost": 0,
"invoke_expense_cost": 0.15,
"output_expense_cost": 0.60,
},
"gemini-2.5-pro-exp-03-25": {
"description": "Avg Accuracy: 64.3%, 83.6% on LegalBench, 84.1% on multi-task understanding, 95.2% on Math, 63.8% on Coding",
"create_expense_cost": 0,
"invoke_expense_cost": 1.25,
"output_expense_cost": 10.00,
},
"gemini-2.0-flash": {
"description": "Avg Accuracy: 64.3%, 79.9% on LegalBench, 77.4% on multi-task understanding, 90.9% on Math, 34.5% on Coding",
"create_expense_cost": 0,
"invoke_expense_cost": 0.10,
"output_expense_cost": 0.40,
},
"gemini-2.0-flash-lite": {
"description": "Avg Accuracy: 64.1%, 71.6% on multi-task understanding, 86.8% on Math, 28.9% on Coding",
"create_expense_cost": 0,
"invoke_expense_cost": 0.075,
"output_expense_cost": 0.30,
},
"gemini-1.5-flash": {
"description": "62.0% on LegalBench, 61.0% on MMLU, 59.0% on MATH",
"create_expense_cost": 0,
"invoke_expense_cost": 0.075,
"output_expense_cost": 0.30,
},
"gemini-1.5-flash-8b": {
"description": "High volume and lower intelligence tasks",
"create_expense_cost": 0,
"invoke_expense_cost": 0.0375,
"output_expense_cost": 0.15,
},
"groq-qwen-qwq-32b": {
"description": "79.5% on AIME24, is comparable to o1-mini and DeepSeek-R1 on all reasonig tasks",
"create_expense_cost": 0,
"invoke_expense_cost": 0.29,
"output_expense_cost": 0.39,
},
"lambda-hermes3-8b": {
"description": "High volume and lower intelligence tasks, 60.0% on MMLU, 58.0% on MATH",
"create_expense_cost": 0,
"invoke_expense_cost": 0.025,
"output_expense_cost": 0.04,
},
}
def get_costs(self):
return self.costs
def run(self, **kwargs):
return {
"status": "success",
"message": "Cost of creating and invoking an agent",
"output": self.costs,
}