Spaces:

Fas1
/

capybara_fas_ai

Runtime error

Fas1 committed 13 days ago

Commit

03955fe

verified ·

1 Parent(s): 77d15ad

ы

Files changed (1) hide show

app.py CHANGED Viewed

@@ -2,7 +2,6 @@ import os
 import gradio as gr
 import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
-from accelerate import dispatch_model
 # Токен, если модель приватная
 hf_token = os.getenv("HF_TOKEN", None)
@@ -20,16 +19,11 @@ model = AutoModelForCausalLM.from_pretrained(
     model_path,
     token=hf_token,
     torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
     trust_remote_code=True,
 )
-# Dispatch model to devices with offloading
 os.makedirs("offload", exist_ok=True)
-model = dispatch_model(
-    model,
-    device_map="auto",
-    offload_state_dict=True,
-)
 # Создаём пайплайн
 pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)

 import gradio as gr
 import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
 # Токен, если модель приватная
 hf_token = os.getenv("HF_TOKEN", None)
     model_path,
     token=hf_token,
     torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
+    device_map="auto",
     trust_remote_code=True,
 )
 os.makedirs("offload", exist_ok=True)
 # Создаём пайплайн
 pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)