umar141 committed on
Commit
07d710e
·
verified ·
1 Parent(s): 43ab288

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -14,8 +14,8 @@ def load_model():
14
  model = AutoModelForCausalLM.from_pretrained(
15
  "umar141/Gemma_1B_Baro_v2_vllm",
16
  torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
17
- device_map="auto" # Automatically puts model on CUDA if available
18
- )
19
  return tokenizer, model
20
 
21
  tokenizer, model = load_model()
 
14
  model = AutoModelForCausalLM.from_pretrained(
15
  "umar141/Gemma_1B_Baro_v2_vllm",
16
  torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
17
+
18
+ ).to("cuda" if torch.cuda.is_available() else "cpu")
19
  return tokenizer, model
20
 
21
  tokenizer, model = load_model()