davanstrien HF staff committed on
Commit
803024b
·
verified ·
1 Parent(s): 948c8ce

use smaller model

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -20,12 +20,12 @@ os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "1"
20
 
21
 
22
  model = Qwen2_5_VLForConditionalGeneration.from_pretrained(
23
- "Qwen/Qwen2.5-VL-7B-Instruct",
24
  torch_dtype=torch.bfloat16,
25
  attn_implementation="flash_attention_2",
26
  device_map="auto",
27
  )
28
- processor = AutoProcessor.from_pretrained("Qwen/Qwen2.5-VL-7B-Instruct")
29
 
30
 
31
  class GeneralRetrievalQuery(BaseModel):
 
20
 
21
 
22
  model = Qwen2_5_VLForConditionalGeneration.from_pretrained(
23
+ "Qwen/Qwen2.5-VL-3B-Instruct",
24
  torch_dtype=torch.bfloat16,
25
  attn_implementation="flash_attention_2",
26
  device_map="auto",
27
  )
28
+ processor = AutoProcessor.from_pretrained("Qwen/Qwen2.5-VL-3B-Instruct")
29
 
30
 
31
  class GeneralRetrievalQuery(BaseModel):