Update app.py
Browse files
app.py
CHANGED
@@ -14,8 +14,8 @@ def load_model():
|
|
14 |
model = AutoModelForCausalLM.from_pretrained(
|
15 |
"umar141/Gemma_1B_Baro_v2_vllm",
|
16 |
torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
|
17 |
-
|
18 |
-
)
|
19 |
return tokenizer, model
|
20 |
|
21 |
tokenizer, model = load_model()
|
|
|
14 |
model = AutoModelForCausalLM.from_pretrained(
|
15 |
"umar141/Gemma_1B_Baro_v2_vllm",
|
16 |
torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
|
17 |
+
|
18 |
+
).to("cuda" if torch.cuda.is_available() else "cpu")
|
19 |
return tokenizer, model
|
20 |
|
21 |
tokenizer, model = load_model()
|