File size: 3,122 Bytes
1476939
 
 
 
 
 
 
 
dc94b28
1476939
 
 
 
 
 
 
 
 
dc94b28
904d53f
7e51da8
1476939
 
dc94b28
904d53f
7e51da8
1476939
2c0c391
dc94b28
904d53f
7e51da8
2c0c391
7d69384
dc94b28
657847e
 
1476939
7d69384
dc94b28
657847e
 
1476939
 
dc94b28
657847e
 
1476939
 
dc94b28
657847e
 
1476939
 
dc94b28
657847e
 
1476939
 
 
657847e
 
1476939
1b3d55c
 
 
 
 
1476939
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
# Public API of this module: only the tool class is exported on star-import.
__all__ = ["AgentCostManager"]


class AgentCostManager:
    """Tool that reports the cost table for creating and invoking agents.

    The table is a static, class-level mapping from model name to a small
    record holding a human-readable ``description`` plus a creation cost and
    an invocation cost.  Two key families appear in the table:

    * ``create_resource_cost`` / ``invoke_resource_cost``
    * ``create_expense_cost`` / ``invoke_expense_cost``

    NOTE(review): presumably "resource" entries are charged against a compute
    budget and "expense" entries against a monetary budget -- confirm with the
    code that consumes this table.

    Both accessors return an independent deep copy of the table, so callers
    may freely modify what they receive without affecting the shared
    class-level data or other callers.
    """

    # No other tools are required by this one.
    dependencies = []

    # Tool descriptor: name, description and an (empty) parameter schema.
    inputSchema = {
        "name": "AgentCostManager",
        "description": "Retrieves the cost of creating and invoking an agent. Also includes the strengths of each model. Please make sure to use this before creating an agent.",
        "parameters": {
            "type": "object",
            "properties": {},
            "required": [],
        }
    }

    # Model name -> {description, create_*_cost, invoke_*_cost}.
    costs = {
        "llama3.2": {
            "description": "Avg Accuracy: 49.75%, Latency 0.9s, 63.4% on multi-task understanding, 40.8% on rewriting, 78.6% on reasoning.",
            "create_resource_cost": 10,
            "invoke_resource_cost": 40,
        },
        "mistral": {
            "description": "Avg Accuracy: 51.3%, Latency 9.7s, 51% on LegalBench, 60.1% on multi-task understanding, 69.9% on TriviaQA, 67.9% on reasoning",
            "create_resource_cost": 20,
            "invoke_resource_cost": 100,
        },
        "deepseek-r1": {
            "description": "Avg Accuracy: 77.3%, Latency: 120s, 69.9% on LegalBench, 71.1% on multi-task understanding, 92.2% on Math",
            "create_resource_cost": 20,
            "invoke_resource_cost": 150,
        },
        "gemini-2.5-flash-preview-05-20": {
            "description": "Avg Accuracy: 75.8%, 82.8% on LegalBench, 81.6% on multi-task understanding, 91.6% on Math",
            "create_expense_cost": 0,
            "invoke_expense_cost": 0.15,
        },
        "gemini-2.5-pro-exp-03-25": {
            "description": "Avg Accuracy: 64.3%, 83.6% on LegalBench, 84.1% on multi-task understanding, 95.2% on Math, 63.8% on Coding",
            "create_expense_cost": 0,
            "invoke_expense_cost": 1.25,
        },
        "gemini-2.0-flash": {
            "description": "Avg Accuracy: 64.3%, 79.9% on LegalBench, 77.4% on multi-task understanding, 90.9% on Math, 34.5% on Coding",
            "create_expense_cost": 0,
            "invoke_expense_cost": 0.10,
        },
        "gemini-2.0-flash-lite": {
            "description": "Avg Accuracy: 64.1%, 71.6% on multi-task understanding, 86.8% on Math, 28.9% on Coding",
            "create_expense_cost": 0,
            "invoke_expense_cost": 0.075,
        },
        "gemini-1.5-flash": {
            "description": "62.0% on LegalBench, 61.0% on MMLU, 59.0% on MATH",
            "create_expense_cost": 0,
            "invoke_expense_cost": 0.075,
        },
        "gemini-1.5-flash-8b": {
            "description": "High volume and lower intelligence tasks",
            "create_expense_cost": 0,
            "invoke_expense_cost": 0.0375,
        },
        "groq-qwen-qwq-32b": {
            "description": "Avg Accuracy: 60.0%, 70.0% on multi-task understanding, 80.0% on Math",
            "create_expense_cost": 0,
            "invoke_expense_cost": 0.05,
        },
    }

    def _costs_snapshot(self):
        """Return a deep copy of ``self.costs``.

        Handing out the class-level dict itself would let any caller that
        pops a model or edits a price change the table for everyone else.
        """
        # Function-scope import keeps this block self-contained.
        from copy import deepcopy

        return deepcopy(self.costs)

    def get_costs(self):
        """Return the cost table as a mapping of model name to cost record.

        Returns:
            A fresh dict equal to ``costs``; mutating it has no effect on the
            shared table.
        """
        return self._costs_snapshot()

    def run(self, **kwargs):
        """Return the cost table wrapped in a status envelope.

        Args:
            **kwargs: Accepted and ignored; the input schema declares no
                parameters.

        Returns:
            A dict with ``"status"`` set to ``"success"``, a fixed
            ``"message"``, and ``"output"`` holding a fresh copy of the cost
            table.
        """
        return {
            "status": "success",
            "message": "Cost of creating and invoking an agent",
            "output": self._costs_snapshot(),
        }