Ritvik19's picture
Add all files and directories
c8a32e7
raw
history blame contribute delete
473 Bytes
from typing import List
from marker.schema.page import Page
def get_image_filename(page: Page, image_idx):
    """Return the PNG filename used for one image of a page.

    The name has the form ``<page.pnum>_image_<image_idx>.png``.

    Args:
        page: Object exposing a ``pnum`` attribute (presumably the page
            number -- confirm against ``marker.schema.page.Page``).
        image_idx: Index of the image within the page; it is interpolated
            into the name as-is.

    Returns:
        The filename string for the image.
    """
    prefix = page.pnum
    return f"{prefix}_image_{image_idx}.png"
def images_to_dict(pages: List[Page]):
    """Collect the images of all pages into one filename-keyed dict.

    Each image is stored under the name produced by
    ``get_image_filename(page, index)``, where ``index`` is the image's
    position within ``page.images``.

    Args:
        pages: Pages to scan. A page whose ``images`` attribute is ``None``
            contributes nothing.

    Returns:
        A dict mapping generated filename to image object, in page order
        and then image order. If two images yield the same filename, the
        later one replaces the earlier one.
    """
    filename_to_image = {}
    for current_page in pages:
        page_images = current_page.images
        if page_images is not None:
            # Keys are generated per (page, position) pair.
            filename_to_image.update(
                (get_image_filename(current_page, position), picture)
                for position, picture in enumerate(page_images)
            )
    return filename_to_image