__all__ = ['AgentCostManager'] class AgentCostManager(): dependencies = [] inputSchema = { "name": "AgentCostManager", "description": "Retrieves the cost of creating and invoking an agent. Also includes the strengths of each model. Please make sure to use this before creating an agent.", "parameters": { "type": "object", "properties": {}, "required": [], } } costs = { "llama3.2": { "description": "Avg Accuracy: 49.75%, Latency 0.9s, 63.4% on multi-task understanding, 40.8% on rewriting, 78.6% on reasoning.", "create_resource_cost": 10, "invoke_resource_cost": 40, }, "mistral": { "description": "Avg Accuracy: 51.3%, Latency 9.7s, 51% on LegalBench, 60.1% on multi-task understanding, 69.9% on TriviaQA, 67.9% on reasoning", "create_resource_cost": 20, "invoke_resource_cost": 100, }, "deepseek-r1": { "description": "Avg Accuracy: 77.3%, Latency: 120s, 69.9% on LegalBench, 71.1% on multi-task understanding, 92.2% on Math", "create_resource_cost": 20, "invoke_resource_cost": 150, }, "gemini-2.5-flash-preview-05-20": { "description": "Avg Accuracy: 75.8%, 82.8% on LegalBench, 81.6% on multi-task understanding, 91.6% on Math", "create_expense_cost": 0, "invoke_expense_cost": 0.15, "output_expense_cost": 0.60, }, "gemini-2.5-pro-exp-03-25": { "description": "Avg Accuracy: 64.3%, 83.6% on LegalBench, 84.1% on multi-task understanding, 95.2% on Math, 63.8% on Coding", "create_expense_cost": 0, "invoke_expense_cost": 1.25, "output_expense_cost": 10.00, }, "gemini-2.0-flash": { "description": "Avg Accuracy: 64.3%, 79.9% on LegalBench, 77.4% on multi-task understanding, 90.9% on Math, 34.5% on Coding", "create_expense_cost": 0, "invoke_expense_cost": 0.10, "output_expense_cost": 0.40, }, "gemini-2.0-flash-lite": { "description": "Avg Accuracy: 64.1%, 71.6% on multi-task understanding, 86.8% on Math, 28.9% on Coding", "create_expense_cost": 0, "invoke_expense_cost": 0.075, "output_expense_cost": 0.30, }, "gemini-1.5-flash": { "description": "62.0% on LegalBench, 61.0% on MMLU, 59.0% on MATH", "create_expense_cost": 0, "invoke_expense_cost": 0.075, "output_expense_cost": 0.30, }, "gemini-1.5-flash-8b": { "description": "High volume and lower intelligence tasks", "create_expense_cost": 0, "invoke_expense_cost": 0.0375, "output_expense_cost": 0.15, }, "groq-qwen-qwq-32b": { "description": "79.5% on AIME24, is comparable to o1-mini and DeepSeek-R1 on all reasonig tasks", "create_expense_cost": 0, "invoke_expense_cost": 0.29, "output_expense_cost": 0.39, }, "lambda-hermes3-8b": { "description": "High volume and lower intelligence tasks, 60.0% on MMLU, 58.0% on MATH", "create_expense_cost": 0, "invoke_expense_cost": 0.025, "output_expense_cost": 0.04, }, } def get_costs(self): return self.costs def run(self, **kwargs): return { "status": "success", "message": "Cost of creating and invoking an agent", "output": self.costs, }