syedfaisalabrar committed on
Commit
4b68d34
·
verified ·
1 Parent(s): e7bec8c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -20,11 +20,12 @@ path = "OpenGVLab/InternVL2_5-4B"
20
  model = AutoModel.from_pretrained(
21
  path,
22
  cache_dir=cache_folder,
23
- torch_dtype=torch.bfloat16 if torch.cuda.is_available() else torch.float32,
 
24
  low_cpu_mem_usage=True,
25
  use_flash_attn=True,
26
  trust_remote_code=True
27
- ).eval().to("cpu")
28
 
29
  tokenizer = AutoTokenizer.from_pretrained(
30
  path,
 
20
  model = AutoModel.from_pretrained(
21
  path,
22
  cache_dir=cache_folder,
23
+ torch_dtype=torch.bfloat16,
24
+ load_in_8bit=True,
25
  low_cpu_mem_usage=True,
26
  use_flash_attn=True,
27
  trust_remote_code=True
28
+ ).eval()
29
 
30
  tokenizer = AutoTokenizer.from_pretrained(
31
  path,