Spaces:
Running
Running
Commit
·
904d53f
1
Parent(s):
7e51da8
Updated costs, since Ollama does use resources when creating a model
Browse files
Projects/test
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
Subproject commit d433face249d65807f57e82932629098e2124fce
|
src/tools/default_tools/agent_cost_manager.py
CHANGED
@@ -17,17 +17,17 @@ class AgentCostManager():
|
|
17 |
costs = {
|
18 |
"llama3.2": {
|
19 |
"description": "Avg Accuracy: 49.75%, Latency 0.9s, 63.4% on multi-task understanding, 40.8% on rewriting, 78.6% on reasoning.",
|
20 |
-
"create_resource_cost":
|
21 |
"invoke_resource_cost": 40,
|
22 |
},
|
23 |
"mistral": {
|
24 |
"description": "Avg Accuracy: 51.3%, Latency 9.7s, 51% on LegalBench, 60.1% on multi-task understanding, 69.9% on TriviaQA, 67.9% on reasoning",
|
25 |
-
"create_resource_cost":
|
26 |
"invoke_resource_cost": 100,
|
27 |
},
|
28 |
"deepseek-r1": {
|
29 |
"description": "Avg Accuracy: 77.3%, Latency: 120s, 69.9% on LegalBench, 71.1% on multi-task understanding, 92.2% on Math",
|
30 |
-
"create_resource_cost":
|
31 |
"invoke_resource_cost": 150,
|
32 |
},
|
33 |
"gemini-2.5-flash-preview-05-20": {
|
|
|
17 |
costs = {
|
18 |
"llama3.2": {
|
19 |
"description": "Avg Accuracy: 49.75%, Latency 0.9s, 63.4% on multi-task understanding, 40.8% on rewriting, 78.6% on reasoning.",
|
20 |
+
"create_resource_cost": 10,
|
21 |
"invoke_resource_cost": 40,
|
22 |
},
|
23 |
"mistral": {
|
24 |
"description": "Avg Accuracy: 51.3%, Latency 9.7s, 51% on LegalBench, 60.1% on multi-task understanding, 69.9% on TriviaQA, 67.9% on reasoning",
|
25 |
+
"create_resource_cost": 20,
|
26 |
"invoke_resource_cost": 100,
|
27 |
},
|
28 |
"deepseek-r1": {
|
29 |
"description": "Avg Accuracy: 77.3%, Latency: 120s, 69.9% on LegalBench, 71.1% on multi-task understanding, 92.2% on Math",
|
30 |
+
"create_resource_cost": 20,
|
31 |
"invoke_resource_cost": 150,
|
32 |
},
|
33 |
"gemini-2.5-flash-preview-05-20": {
|