Fas1 committed on
Commit
03955fe
·
verified ·
1 Parent(s): 77d15ad
Files changed (1) hide show
  1. app.py +1 -7
app.py CHANGED
@@ -2,7 +2,6 @@ import os
2
  import gradio as gr
3
  import torch
4
  from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
5
- from accelerate import dispatch_model
6
 
7
  # Токен, если модель приватная
8
  hf_token = os.getenv("HF_TOKEN", None)
@@ -20,16 +19,11 @@ model = AutoModelForCausalLM.from_pretrained(
20
  model_path,
21
  token=hf_token,
22
  torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
 
23
  trust_remote_code=True,
24
  )
25
 
26
- # Dispatch model to devices with offloading
27
  os.makedirs("offload", exist_ok=True)
28
- model = dispatch_model(
29
- model,
30
- device_map="auto",
31
- offload_state_dict=True,
32
- )
33
 
34
  # Создаём пайплайн
35
  pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)
 
2
  import gradio as gr
3
  import torch
4
  from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
 
5
 
6
  # Токен, если модель приватная
7
  hf_token = os.getenv("HF_TOKEN", None)
 
19
  model_path,
20
  token=hf_token,
21
  torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
22
+ device_map="auto",
23
  trust_remote_code=True,
24
  )
25
 
 
26
  os.makedirs("offload", exist_ok=True)
 
 
 
 
 
27
 
28
  # Создаём пайплайн
29
  pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)