saisha09 committed on
Commit
b915149
·
1 Parent(s): 0144997

Update models_cost: raise tokens_sec for API models and use a flat create/invoke cost (20/50) for API models

Browse files
Files changed (1) hide show
  1. src/models_cost.py +13 -8
src/models_cost.py CHANGED
@@ -40,41 +40,47 @@ class ModelRegistry:
40
  },
41
  "gemini-2.0-flash": {
42
  "size": 6,
43
- "tokens_sec": 60,
44
  "type": "api",
45
  "description": "Fast and efficient API model"
46
  },
47
  "gemini-2.5-pro-preview-03-25": {
48
  "size": 10,
49
- "tokens_sec": 45,
50
  "type": "api",
51
  "description": "High-reasoning API model"
52
  },
53
  "gemini-1.5-flash": {
54
  "size": 7,
55
- "tokens_sec": 55,
56
  "type": "api",
57
  "description": "Fast general-purpose model"
58
  },
59
  "gemini-2.0-flash-lite": {
60
  "size": 5,
61
- "tokens_sec": 58,
62
  "type": "api",
63
  "description": "Low-latency, cost-efficient API model"
64
  },
65
  "gemini-2.0-flash-live-001": {
66
  "size": 9,
67
- "tokens_sec": 52,
68
  "type": "api",
69
  "description": "Voice/video low-latency API model"
70
  }
71
  }
72
 
 
73
  models = {}
74
  for name, model in raw_models.items():
75
  is_api = model["type"] == "api"
76
- create_cost = self.estimate_create_cost(model["size"], is_api)
77
- invoke_cost = self.estimate_invoke_cost(model["tokens_sec"], is_api)
 
 
 
 
 
78
 
79
  models[name] = ModelInfo(
80
  name=name,
@@ -85,7 +91,6 @@ class ModelRegistry:
85
  create_cost=create_cost,
86
  invoke_cost=invoke_cost
87
  )
88
-
89
  return models
90
 
91
  def get_filtered_models(self) -> Dict[str, ModelInfo]:
 
40
  },
41
  "gemini-2.0-flash": {
42
  "size": 6,
43
+ "tokens_sec": 170,
44
  "type": "api",
45
  "description": "Fast and efficient API model"
46
  },
47
  "gemini-2.5-pro-preview-03-25": {
48
  "size": 10,
49
+ "tokens_sec": 148,
50
  "type": "api",
51
  "description": "High-reasoning API model"
52
  },
53
  "gemini-1.5-flash": {
54
  "size": 7,
55
+ "tokens_sec": 190,
56
  "type": "api",
57
  "description": "Fast general-purpose model"
58
  },
59
  "gemini-2.0-flash-lite": {
60
  "size": 5,
61
+ "tokens_sec": 208,
62
  "type": "api",
63
  "description": "Low-latency, cost-efficient API model"
64
  },
65
  "gemini-2.0-flash-live-001": {
66
  "size": 9,
67
+ "tokens_sec": 190,
68
  "type": "api",
69
  "description": "Voice/video low-latency API model"
70
  }
71
  }
72
 
73
+
74
  models = {}
75
  for name, model in raw_models.items():
76
  is_api = model["type"] == "api"
77
+
78
+ if is_api:
79
+ # Flat cost for all API models
80
+ create_cost, invoke_cost = 20, 50
81
+ else:
82
+ create_cost = self.estimate_create_cost(model["size"], is_api=False)
83
+ invoke_cost = self.estimate_invoke_cost(model["tokens_sec"], is_api=False)
84
 
85
  models[name] = ModelInfo(
86
  name=name,
 
91
  create_cost=create_cost,
92
  invoke_cost=invoke_cost
93
  )
 
94
  return models
95
 
96
  def get_filtered_models(self) -> Dict[str, ModelInfo]: