DocterXray-v1.2

Runtime error

Aekanun committed on Nov 26, 2024

Commit

2500471

1 Parent(s): 2a60823

rev app

Files changed (1) hide show

app.py CHANGED Viewed

@@ -70,7 +70,7 @@ else:
 #         traceback.print_exc()  # เพิ่มการแสดง stack trace
 #         return False
-@spaces.GPU
 def load_model():
     global model, tokenizer
     print("กำลังโหลดโมเดล...")
@@ -81,7 +81,8 @@ def load_model():
         print("กำลังโหลด tokenizer...")
         base_model, _tokenizer = FastVisionModel.from_pretrained(
             "unsloth/Llama-3.2-11B-Vision-Instruct",
-            use_gradient_checkpointing = "unsloth"
         )
         tokenizer = _tokenizer  # กำหนดค่าให้ตัวแปร global โดยตรง
@@ -96,7 +97,8 @@ def load_model():
         print("กำลังโหลดโมเดล fine-tuned...")
         model = AutoModelForVision2Seq.from_pretrained(
             "Aekanun/Llama-3.2-11B-Vision-Instruct-XRay",
-            load_in_4bit=True,
             torch_dtype=torch.float16
         ).to('cuda')

 #         traceback.print_exc()  # เพิ่มการแสดง stack trace
 #         return False
+###@spaces.GPU
 def load_model():
     global model, tokenizer
     print("กำลังโหลดโมเดล...")
         print("กำลังโหลด tokenizer...")
         base_model, _tokenizer = FastVisionModel.from_pretrained(
             "unsloth/Llama-3.2-11B-Vision-Instruct",
+            use_gradient_checkpointing = "unsloth",
+            device_map="auto"  ### เพิ่มตรงนี้
         )
         tokenizer = _tokenizer  # กำหนดค่าให้ตัวแปร global โดยตรง
         print("กำลังโหลดโมเดล fine-tuned...")
         model = AutoModelForVision2Seq.from_pretrained(
             "Aekanun/Llama-3.2-11B-Vision-Instruct-XRay",
+            device_map="auto",  ### เพิ่มตรงนี้
+            ###load_in_4bit=True,
             torch_dtype=torch.float16
         ).to('cuda')