Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -70,6 +70,25 @@ class BasicAgent:
|
|
70 |
device_map="auto",
|
71 |
)
|
72 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
73 |
# Verify where model actually loaded
|
74 |
if hasattr(self.model, 'device'):
|
75 |
print(f"✅ Model loaded on device: {self.model.device}")
|
|
|
70 |
device_map="auto",
|
71 |
)
|
72 |
|
73 |
+
if hasattr(self.model, 'tokenizer') and self.model.tokenizer is not None:
|
74 |
+
# Set left padding for better batching with causal models
|
75 |
+
self.model.tokenizer.padding_side = "left"
|
76 |
+
# Ensure pad token is set
|
77 |
+
if self.model.tokenizer.pad_token is None:
|
78 |
+
self.model.tokenizer.pad_token = self.model.tokenizer.eos_token
|
79 |
+
# Set default padding behavior for FlashAttention
|
80 |
+
self.model.tokenizer.pad_to_multiple_of = 8
|
81 |
+
print("✅ Applied tokenizer padding fix for FlashAttention alignment")
|
82 |
+
|
83 |
+
# If the model has a processor with tokenizer, fix that too
|
84 |
+
if hasattr(self.model, 'processor') and hasattr(self.model.processor, 'tokenizer'):
|
85 |
+
self.model.processor.tokenizer.padding_side = "left"
|
86 |
+
if self.model.processor.tokenizer.pad_token is None:
|
87 |
+
self.model.processor.tokenizer.pad_token = self.model.processor.tokenizer.eos_token
|
88 |
+
self.model.processor.tokenizer.pad_to_multiple_of = 8
|
89 |
+
print("✅ Applied processor tokenizer padding fix")
|
90 |
+
|
91 |
+
|
92 |
# Verify where model actually loaded
|
93 |
if hasattr(self.model, 'device'):
|
94 |
print(f"✅ Model loaded on device: {self.model.device}")
|