Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -1,4 +1,4 @@
|
|
1 |
-
from transformers import MllamaForConditionalGeneration, AutoProcessor, TextIteratorStreamer , AutoModel,Qwen2VLForConditionalGeneration, AutoModelForImageTextToText
|
2 |
from qwen_vl_utils import process_vision_info
|
3 |
from PIL import Image
|
4 |
import requests
|
@@ -18,8 +18,8 @@ logging.basicConfig(level=logging.INFO)
|
|
18 |
logger = logging.getLogger(__name__)
|
19 |
|
20 |
# Load model and processor
|
21 |
-
ckpt ="
|
22 |
-
model =
|
23 |
processor = AutoProcessor.from_pretrained(ckpt,trust_remote_code=True)
|
24 |
|
25 |
class DocumentState:
|
@@ -49,7 +49,7 @@ def process_pdf_file(file_path):
|
|
49 |
if page_text.strip():
|
50 |
text += f"Page {page_num + 1}:\n{page_text}\n\n"
|
51 |
|
52 |
-
zoom =
|
53 |
mat = fitz.Matrix(zoom, zoom)
|
54 |
pix = page.get_pixmap(matrix=mat, alpha=False)
|
55 |
img_data = pix.tobytes("png")
|
|
|
1 |
+
from transformers import MllamaForConditionalGeneration, AutoProcessor, TextIteratorStreamer , AutoModel,Qwen2VLForConditionalGeneration, AutoModelForImageTextToText , Qwen2_5_VLForConditionalGeneration
|
2 |
from qwen_vl_utils import process_vision_info
|
3 |
from PIL import Image
|
4 |
import requests
|
|
|
18 |
logger = logging.getLogger(__name__)
|
19 |
|
20 |
# Load model and processor
|
21 |
+
ckpt ="Qwen/Qwen2.5-VL-7B-Instruct"
|
22 |
+
model = Qwen2_5_VLForConditionalGeneration.from_pretrained(ckpt, torch_dtype=torch.bfloat16,trust_remote_code=True).to("cuda")
|
23 |
processor = AutoProcessor.from_pretrained(ckpt,trust_remote_code=True)
|
24 |
|
25 |
class DocumentState:
|
|
|
49 |
if page_text.strip():
|
50 |
text += f"Page {page_num + 1}:\n{page_text}\n\n"
|
51 |
|
52 |
+
zoom = 3
|
53 |
mat = fitz.Matrix(zoom, zoom)
|
54 |
pix = page.get_pixmap(matrix=mat, alpha=False)
|
55 |
img_data = pix.tobytes("png")
|