sitammeur committed on
Commit
5d77312
·
verified ·
1 Parent(s): 7a84512

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -14,14 +14,14 @@ import gradio as gr
14
 
15
 
16
  # Enable flash attention
17
- subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "TRUE"}, shell=True)
18
 
19
  # Load the visual document retrieval model (ColQwen2)
20
  model = ColQwen2.from_pretrained(
21
  "vidore/colqwen2-v1.0",
22
  torch_dtype=torch.bfloat16,
23
  device_map="cuda:0",
24
- attn_implementation="flash_attention_2",
25
  ).eval()
26
  processor = ColQwen2Processor.from_pretrained("vidore/colqwen2-v1.0")
27
 
 
14
 
15
 
16
  # Enable flash attention
17
+ # subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "TRUE"}, shell=True)
18
 
19
  # Load the visual document retrieval model (ColQwen2)
20
  model = ColQwen2.from_pretrained(
21
  "vidore/colqwen2-v1.0",
22
  torch_dtype=torch.bfloat16,
23
  device_map="cuda:0",
24
+ # attn_implementation="flash_attention_2",
25
  ).eval()
26
  processor = ColQwen2Processor.from_pretrained("vidore/colqwen2-v1.0")
27