yasu-oh
committed on
Commit
·
47f79b3
1
Parent(s):
fd1928a
INF_MULT
Browse files
app.py
CHANGED
@@ -13,6 +13,7 @@ QUANTIZE = {
|
|
13 |
"Q5_K_M": 5.7,
|
14 |
"Q6_K": 6.6,
|
15 |
}
|
|
|
16 |
|
17 |
def get_model_api_info(model_name: str) -> dict:
|
18 |
"""
|
@@ -107,7 +108,7 @@ def estimate_gpu_memory(model_name: str) -> str:
|
|
107 |
# GPUメモリサイズの計算
|
108 |
total_params = sum(parameters.values())
|
109 |
for quant, multiplier in QUANTIZE.items():
|
110 |
-
gpu_memory = total_params * multiplier / 8 / (1024 ** 3) *
|
111 |
result_lines.append(f"【{quant}】約 {gpu_memory:.2f} GB")
|
112 |
|
113 |
result_lines.append("となります。")
|
|
|
13 |
"Q5_K_M": 5.7,
|
14 |
"Q6_K": 6.6,
|
15 |
}
|
16 |
+
INF_MULT = 1.25
|
17 |
|
18 |
def get_model_api_info(model_name: str) -> dict:
|
19 |
"""
|
|
|
108 |
# GPUメモリサイズの計算
|
109 |
total_params = sum(parameters.values())
|
110 |
for quant, multiplier in QUANTIZE.items():
|
111 |
+
gpu_memory = total_params * multiplier / 8 / (1024 ** 3) * INF_MULT
|
112 |
result_lines.append(f"【{quant}】約 {gpu_memory:.2f} GB")
|
113 |
|
114 |
result_lines.append("となります。")
|