Spaces:
Running
Running
Commit ·
904d53f
1
Parent(s): 7e51da8
Updated costs, since Ollama does use resources when creating a model
Browse files
Projects/test
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
Subproject commit d433face249d65807f57e82932629098e2124fce
|
src/tools/default_tools/agent_cost_manager.py
CHANGED
|
@@ -17,17 +17,17 @@ class AgentCostManager():
|
|
| 17 |
costs = {
|
| 18 |
"llama3.2": {
|
| 19 |
"description": "Avg Accuracy: 49.75%, Latency 0.9s, 63.4% on multi-task understanding, 40.8% on rewriting, 78.6% on reasoning.",
|
| 20 |
-
"create_resource_cost":
|
| 21 |
"invoke_resource_cost": 40,
|
| 22 |
},
|
| 23 |
"mistral": {
|
| 24 |
"description": "Avg Accuracy: 51.3%, Latency 9.7s, 51% on LegalBench, 60.1% on multi-task understanding, 69.9% on TriviaQA, 67.9% on reasoning",
|
| 25 |
-
"create_resource_cost":
|
| 26 |
"invoke_resource_cost": 100,
|
| 27 |
},
|
| 28 |
"deepseek-r1": {
|
| 29 |
"description": "Avg Accuracy: 77.3%, Latency: 120s, 69.9% on LegalBench, 71.1% on multi-task understanding, 92.2% on Math",
|
| 30 |
-
"create_resource_cost":
|
| 31 |
"invoke_resource_cost": 150,
|
| 32 |
},
|
| 33 |
"gemini-2.5-flash-preview-05-20": {
|
|
|
|
| 17 |
costs = {
|
| 18 |
"llama3.2": {
|
| 19 |
"description": "Avg Accuracy: 49.75%, Latency 0.9s, 63.4% on multi-task understanding, 40.8% on rewriting, 78.6% on reasoning.",
|
| 20 |
+
"create_resource_cost": 10,
|
| 21 |
"invoke_resource_cost": 40,
|
| 22 |
},
|
| 23 |
"mistral": {
|
| 24 |
"description": "Avg Accuracy: 51.3%, Latency 9.7s, 51% on LegalBench, 60.1% on multi-task understanding, 69.9% on TriviaQA, 67.9% on reasoning",
|
| 25 |
+
"create_resource_cost": 20,
|
| 26 |
"invoke_resource_cost": 100,
|
| 27 |
},
|
| 28 |
"deepseek-r1": {
|
| 29 |
"description": "Avg Accuracy: 77.3%, Latency: 120s, 69.9% on LegalBench, 71.1% on multi-task understanding, 92.2% on Math",
|
| 30 |
+
"create_resource_cost": 20,
|
| 31 |
"invoke_resource_cost": 150,
|
| 32 |
},
|
| 33 |
"gemini-2.5-flash-preview-05-20": {
|