Update handler.py
Browse files - handler.py +1 -1
handler.py
CHANGED
@@ -14,7 +14,7 @@ class EndpointHandler():
|
|
14 |
device_map="cuda:0", # or "mps" if on Apple Silicon
|
15 |
attn_implementation="flash_attention_2" if is_flash_attn_2_available() else None,
|
16 |
).eval()
|
17 |
-
self.processor = ColQwen2Processor.from_pretrained(path
|
18 |
# self.model = torch.compile(self.model)
|
19 |
print(f"Model and processor loaded {'with' if is_flash_attn_2_available() else 'without'} FA2")
|
20 |
|
|
|
14 |
device_map="cuda:0", # or "mps" if on Apple Silicon
|
15 |
attn_implementation="flash_attention_2" if is_flash_attn_2_available() else None,
|
16 |
).eval()
|
17 |
+
self.processor = ColQwen2Processor.from_pretrained(path) #, max_num_visual_tokens=8192) # temporary
|
18 |
# self.model = torch.compile(self.model)
|
19 |
print(f"Model and processor loaded {'with' if is_flash_attn_2_available() else 'without'} FA2")
|
20 |
|