zmeeks committed on
Commit
2418331
·
verified ·
1 Parent(s): 30b42bb

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +19 -0
app.py CHANGED
@@ -70,6 +70,25 @@ class BasicAgent:
70
  device_map="auto",
71
  )
72
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
73
  # Verify where model actually loaded
74
  if hasattr(self.model, 'device'):
75
  print(f"✅ Model loaded on device: {self.model.device}")
 
70
  device_map="auto",
71
  )
72
 
73
+ if hasattr(self.model, 'tokenizer') and self.model.tokenizer is not None:
74
+ # Set left padding for better batching with causal models
75
+ self.model.tokenizer.padding_side = "left"
76
+ # Ensure pad token is set
77
+ if self.model.tokenizer.pad_token is None:
78
+ self.model.tokenizer.pad_token = self.model.tokenizer.eos_token
79
+ # Set default padding behavior for FlashAttention
80
+ self.model.tokenizer.pad_to_multiple_of = 8
81
+ print("✅ Applied tokenizer padding fix for FlashAttention alignment")
82
+
83
+ # If the model has a processor with tokenizer, fix that too
84
+ if hasattr(self.model, 'processor') and hasattr(self.model.processor, 'tokenizer'):
85
+ self.model.processor.tokenizer.padding_side = "left"
86
+ if self.model.processor.tokenizer.pad_token is None:
87
+ self.model.processor.tokenizer.pad_token = self.model.processor.tokenizer.eos_token
88
+ self.model.processor.tokenizer.pad_to_multiple_of = 8
89
+ print("✅ Applied processor tokenizer padding fix")
90
+
91
+
92
  # Verify where model actually loaded
93
  if hasattr(self.model, 'device'):
94
  print(f"✅ Model loaded on device: {self.model.device}")