naver-hyperclovax
/

HyperCLOVAX-SEED-Vision-Instruct-3B

hyperclovax_vlm

Model card Files Files and versions Community

BDLEE committed about 5 hours ago

Commit

41a5265

·

verified ·

1 Parent(s): e9d93a4

Update preprocessor.py

Files changed (1) hide show

preprocessor.py +8 -7

preprocessor.py CHANGED Viewed

@@ -241,20 +241,21 @@ def resize_longside(
 def select_best_resolution(original_size: tuple, possible_resolutions: list) -> tuple:
-    """
     Selects the best-fit resolution from a list of possible resolutions based on the original image size.
-    This function, adapted from LLaVA-Next
-    (https://github.com/huggingface/transformers/blob/v4.40.2/src/transformers/models/llava_next/image_processing_llava_next.py),
-    evaluates each resolution by computing its effective and wasted area compared to the original size.
     The optimal resolution is the one that maximizes the effective area while minimizing unused (wasted) space.
     Args:
         original_size (tuple): The original image size in the format (height, width).
         possible_resolutions (list): A list of candidate resolutions in the format [(height1, width1), (height2, width2), ...].
     Returns:
         tuple: The best-fit resolution in the format (height, width).
     """
     original_height, original_width = original_size
     best_fit = None

 def select_best_resolution(original_size: tuple, possible_resolutions: list) -> tuple:
+    """
     Selects the best-fit resolution from a list of possible resolutions based on the original image size.
+    This function evaluates each resolution by computing its effective and wasted area compared to the original size.
     The optimal resolution is the one that maximizes the effective area while minimizing unused (wasted) space.
     Args:
         original_size (tuple): The original image size in the format (height, width).
         possible_resolutions (list): A list of candidate resolutions in the format [(height1, width1), (height2, width2), ...].
     Returns:
         tuple: The best-fit resolution in the format (height, width).
+    This function includes code adapted from the file image_processing_llava_next.py in the LLaVA-Next
+    project(https://github.com/huggingface/transformers/blob/v4.40.2/src/transformers/models/llava_next/image_processing_llava_next.py),
+    which is licensed under apache-2.0.
     """
     original_height, original_width = original_size
     best_fit = None