helloparthshah committed on
Commit
904d53f
·
1 Parent(s): 7e51da8

Updated the create_resource_cost values, since Ollama does use resources when creating a model

Browse files
Projects/test ADDED
@@ -0,0 +1 @@
 
 
1
+ Subproject commit d433face249d65807f57e82932629098e2124fce
src/tools/default_tools/agent_cost_manager.py CHANGED
@@ -17,17 +17,17 @@ class AgentCostManager():
17
  costs = {
18
  "llama3.2": {
19
  "description": "Avg Accuracy: 49.75%, Latency 0.9s, 63.4% on multi-task understanding, 40.8% on rewriting, 78.6% on reasoning.",
20
- "create_resource_cost": 0,
21
  "invoke_resource_cost": 40,
22
  },
23
  "mistral": {
24
  "description": "Avg Accuracy: 51.3%, Latency 9.7s, 51% on LegalBench, 60.1% on multi-task understanding, 69.9% on TriviaQA, 67.9% on reasoning",
25
- "create_resource_cost": 0,
26
  "invoke_resource_cost": 100,
27
  },
28
  "deepseek-r1": {
29
  "description": "Avg Accuracy: 77.3%, Latency: 120s, 69.9% on LegalBench, 71.1% on multi-task understanding, 92.2% on Math",
30
- "create_resource_cost": 0,
31
  "invoke_resource_cost": 150,
32
  },
33
  "gemini-2.5-flash-preview-05-20": {
 
17
  costs = {
18
  "llama3.2": {
19
  "description": "Avg Accuracy: 49.75%, Latency 0.9s, 63.4% on multi-task understanding, 40.8% on rewriting, 78.6% on reasoning.",
20
+ "create_resource_cost": 10,
21
  "invoke_resource_cost": 40,
22
  },
23
  "mistral": {
24
  "description": "Avg Accuracy: 51.3%, Latency 9.7s, 51% on LegalBench, 60.1% on multi-task understanding, 69.9% on TriviaQA, 67.9% on reasoning",
25
+ "create_resource_cost": 20,
26
  "invoke_resource_cost": 100,
27
  },
28
  "deepseek-r1": {
29
  "description": "Avg Accuracy: 77.3%, Latency: 120s, 69.9% on LegalBench, 71.1% on multi-task understanding, 92.2% on Math",
30
+ "create_resource_cost": 20,
31
  "invoke_resource_cost": 150,
32
  },
33
  "gemini-2.5-flash-preview-05-20": {