hashiruAI

Running

hashiruAI / src /tools /default_tools /agent_cost_manager.py

Kunal Pai

Refactor LambdaAgent to use OpenAI client and update cost manager with new Lambda model expenses

fcdfb63 9 days ago

3.69 kB

	__all__ = ['AgentCostManager']


	class AgentCostManager():
	dependencies = []

	inputSchema = {
	"name": "AgentCostManager",
	"description": "Retrieves the cost of creating and invoking an agent. Also includes the strengths of each model. Please make sure to use this before creating an agent.",
	"parameters": {
	"type": "object",
	"properties": {},
	"required": [],
	}
	}

	costs = {
	"llama3.2": {
	"description": "Avg Accuracy: 49.75%, Latency 0.9s, 63.4% on multi-task understanding, 40.8% on rewriting, 78.6% on reasoning.",
	"create_resource_cost": 10,
	"invoke_resource_cost": 40,
	},
	"mistral": {
	"description": "Avg Accuracy: 51.3%, Latency 9.7s, 51% on LegalBench, 60.1% on multi-task understanding, 69.9% on TriviaQA, 67.9% on reasoning",
	"create_resource_cost": 20,
	"invoke_resource_cost": 100,
	},
	"deepseek-r1": {
	"description": "Avg Accuracy: 77.3%, Latency: 120s, 69.9% on LegalBench, 71.1% on multi-task understanding, 92.2% on Math",
	"create_resource_cost": 20,
	"invoke_resource_cost": 150,
	},
	"gemini-2.5-flash-preview-05-20": {
	"description": "Avg Accuracy: 75.8%, 82.8% on LegalBench, 81.6% on multi-task understanding, 91.6% on Math",
	"create_expense_cost": 0,
	"invoke_expense_cost": 0.15,
	"output_expense_cost": 0.60,
	},
	"gemini-2.5-pro-exp-03-25": {
	"description": "Avg Accuracy: 64.3%, 83.6% on LegalBench, 84.1% on multi-task understanding, 95.2% on Math, 63.8% on Coding",
	"create_expense_cost": 0,
	"invoke_expense_cost": 1.25,
	"output_expense_cost": 10.00,
	},
	"gemini-2.0-flash": {
	"description": "Avg Accuracy: 64.3%, 79.9% on LegalBench, 77.4% on multi-task understanding, 90.9% on Math, 34.5% on Coding",
	"create_expense_cost": 0,
	"invoke_expense_cost": 0.10,
	"output_expense_cost": 0.40,
	},
	"gemini-2.0-flash-lite": {
	"description": "Avg Accuracy: 64.1%, 71.6% on multi-task understanding, 86.8% on Math, 28.9% on Coding",
	"create_expense_cost": 0,
	"invoke_expense_cost": 0.075,
	"output_expense_cost": 0.30,
	},
	"gemini-1.5-flash": {
	"description": "62.0% on LegalBench, 61.0% on MMLU, 59.0% on MATH",
	"create_expense_cost": 0,
	"invoke_expense_cost": 0.075,
	"output_expense_cost": 0.30,
	},
	"gemini-1.5-flash-8b": {
	"description": "High volume and lower intelligence tasks",
	"create_expense_cost": 0,
	"invoke_expense_cost": 0.0375,
	"output_expense_cost": 0.15,
	},
	"groq-qwen-qwq-32b": {
	"description": "79.5% on AIME24, is comparable to o1-mini and DeepSeek-R1 on all reasonig tasks",
	"create_expense_cost": 0,
	"invoke_expense_cost": 0.29,
	"output_expense_cost": 0.39,
	},
	"lambda-hermes3-8b": {
	"description": "High volume and lower intelligence tasks, 60.0% on MMLU, 58.0% on MATH",
	"create_expense_cost": 0,
	"invoke_expense_cost": 0.025,
	"output_expense_cost": 0.04,
	},
	}

	def get_costs(self):
	return self.costs

	def run(self, **kwargs):
	return {
	"status": "success",
	"message": "Cost of creating and invoking an agent",
	"output": self.costs,
	}