Spaces:

cwhuh
/

ponix-generator

Running on Zero

App Files Files Community

cwhuh committed on Mar 10

Commit

2c61b33

1 Parent(s): ac860b2

add : llm wrapper

Browse files

Files changed (1) hide show

llm_wrapper.py +99 -99

llm_wrapper.py CHANGED Viewed

@@ -1,101 +1,101 @@
-# import logging
-# from PIL import Image
-# from io import BytesIO
-# import requests, os, json, time
-# from google import genai
-# prompt_base_path = "src/llm_wrapper/prompt"
-# client = genai.Client(api_key=os.getenv("GEMINI_API_KEY"))
-# def encode_image(image_source):
-#     """
-#     이미지 경로가 URL이든 로컬 파일이든 Pillow Image 객체이든 동일하게 처리하는 함수.
-#     이미지를 열어 google.genai.types.Part 객체로 변환합니다.
-#     Pillow에서 지원되지 않는 포맷에 대해서는 예외를 발생시킵니다.
-#     """
-#     try:
-#         # 이미 Pillow 이미지 객체인 경우 그대로 사용
-#         if isinstance(image_source, Image.Image):
-#             image = image_source
-#         else:
-#             # URL에서 이미지 다운로드
-#             if isinstance(image_source, str) and (
-#                 image_source.startswith("http://")
-#                 or image_source.startswith("https://")
-#             ):
-#                 response = requests.get(image_source)
-#                 image = Image.open(BytesIO(response.content))
-#             # 로컬 파일에서 이미지 열기
-#             else:
-#                 image = Image.open(image_source)
-#         # 이미지 포맷이 None인 경우 (메모리에서 생성된 이미지 등)
-#         if image.format is None:
-#             image_format = "JPEG"
-#         else:
-#             image_format = image.format
-#         # 이미지 포맷이 지원되지 않는 경우 예외 발생
-#         if image_format not in Image.registered_extensions().values():
-#             raise ValueError(f"Unsupported image format: {image_format}.")
-#         buffered = BytesIO()
-#         # PIL에서 지원되지 않는 포맷이나 다양한 채널을 RGB로 변환 후 저장
-#         if image.mode in ("RGBA", "P", "CMYK"):  # RGBA, 팔레트, CMYK 등은 RGB로 변환
-#             image = image.convert("RGB")
-#         image.save(buffered, format="JPEG")
-#         return genai.types.Part.from_bytes(data=buffered.getvalue(), mime_type="image/jpeg")
-#     except requests.exceptions.RequestException as e:
-#         raise ValueError(f"Failed to download the image from URL: {e}")
-#     except IOError as e:
-#         raise ValueError(f"Failed to process the image file: {e}")
-#     except ValueError as e:
-#         raise ValueError(e)
-# def run_gemini(
-#     target_prompt: str,
-#     prompt_in_path: str,
-#     img_in_data: str = None,
-#     model: str = "gemini-2.0-flash",
-# ) -> str:
-#     """
-#     GEMINI API를 동기 방식으로 호출하여 문자열 응답을 받습니다.
-#     retry 논리는 제거되었습니다.
-#     """
-#     with open(os.path.join(prompt_base_path, prompt_in_path), "r", encoding="utf-8") as file:
-#         prompt_dict = json.load(file)
-#     system_prompt = prompt_dict["system_prompt"]
-#     user_prompt_head = prompt_dict["user_prompt"]["head"]
-#     user_prompt_tail = prompt_dict["user_prompt"]["tail"]
-#     user_prompt_text = "\n".join([user_prompt_head, target_prompt, user_prompt_tail])
-#     input_content = [user_prompt_text]
-#     if img_in_data is not None:
-#         encoded_image = encode_image(img_in_data)
-#         input_content.append(encoded_image)
-#     logging.info("Requested API for chat completion response (sync call)...")
-#     start_time = time.time()
-#     # 동기 방식: client.models.generate_content(...)
-#     chat_completion = client.models.generate_content(
-#         model=model,
-#         contents=input_content,
-#     )
-#     chat_output = chat_completion.parsed
-#     input_token = chat_completion.usage_metadata.prompt_token_count
-#     output_token = chat_completion.usage_metadata.candidates_token_count
-#     pricing = input_token / 1000000 * 0.1 * 1500 + output_token / 1000000 * 0.7 * 1500
-#     logging.info(
-#         f"[GEMINI] Request completed (sync). Time taken: {time.time()-start_time:.2f}s / Pricing(KRW): {pricing:.2f}"
-#     )
-#     return chat_output, chat_completion

+import logging
+from PIL import Image
+from io import BytesIO
+import requests, os, json, time
+from google import genai
+prompt_base_path = "src/llm_wrapper/prompt"
+client = genai.Client(api_key=os.getenv("GEMINI_API_KEY"))
def encode_image(image_source, timeout: float = 30.0):
    """Convert an image into a JPEG-encoded ``google.genai.types.Part``.

    URLs, local files and in-memory Pillow images are all handled the same
    way: the image is opened, normalised to a JPEG-writable mode and
    re-encoded as JPEG.

    Args:
        image_source: A ``PIL.Image.Image`` instance, an ``http://`` /
            ``https://`` URL string, or anything ``PIL.Image.open`` accepts
            (for example a local file path).
        timeout: Seconds to wait for the HTTP download before giving up.
            Only used when ``image_source`` is a URL.

    Returns:
        A ``genai.types.Part`` holding the JPEG bytes with MIME type
        ``image/jpeg``.

    Raises:
        ValueError: If the download fails (including non-2xx responses), the
            data cannot be opened or re-encoded by Pillow, or the detected
            format is not registered with Pillow.
    """
    # Modes that were previously passed to the JPEG encoder unchanged and
    # that it can write directly; everything else is converted to RGB first.
    jpeg_passthrough_modes = ("1", "L", "RGB", "RGBX", "YCbCr")

    try:
        if isinstance(image_source, Image.Image):
            # Already a Pillow image: use it as-is.
            image = image_source
        elif isinstance(image_source, str) and image_source.startswith(
            ("http://", "https://")
        ):
            # Remote image: bound the wait and reject HTTP error responses
            # instead of handing an error page to Pillow.
            response = requests.get(image_source, timeout=timeout)
            response.raise_for_status()
            image = Image.open(BytesIO(response.content))
        else:
            # Local file (or any other source Pillow can open).
            image = Image.open(image_source)

        # Images created in memory carry no format; treat them as JPEG.
        image_format = "JPEG" if image.format is None else image.format
        if image_format not in Image.registered_extensions().values():
            raise ValueError(f"Unsupported image format: {image_format}.")

        # JPEG cannot store alpha, palette, 16/32-bit or float data, so any
        # mode outside the pass-through set (RGBA, P, CMYK, LA, I;16, F, ...)
        # is converted to RGB before saving.
        if image.mode not in jpeg_passthrough_modes:
            image = image.convert("RGB")

        buffered = BytesIO()
        image.save(buffered, format="JPEG")
        return genai.types.Part.from_bytes(data=buffered.getvalue(), mime_type="image/jpeg")
    except requests.exceptions.RequestException as e:
        # Must precede the IOError handler: RequestException subclasses IOError.
        raise ValueError(f"Failed to download the image from URL: {e}") from e
    except IOError as e:
        raise ValueError(f"Failed to process the image file: {e}") from e
    # ValueError raised above propagates unchanged, keeping its traceback.
def run_gemini(
    target_prompt: str,
    prompt_in_path: str,
    img_in_data=None,
    model: str = "gemini-2.0-flash",
) -> tuple:
    """Call the Gemini API synchronously and return its response.

    The prompt template is a JSON file under ``prompt_base_path`` containing
    ``system_prompt`` and ``user_prompt.head`` / ``user_prompt.tail``. The
    user message is ``head``, ``target_prompt`` and ``tail`` joined by
    newlines. No retry logic is applied.

    Args:
        target_prompt: Text inserted between the template's head and tail.
        prompt_in_path: Path of the prompt JSON file, relative to
            ``prompt_base_path``.
        img_in_data: Optional image to attach; anything ``encode_image``
            accepts (Pillow image, URL, or local path). ``None`` sends text
            only.
        model: Gemini model name passed to the API.

    Returns:
        A ``(chat_output, chat_completion)`` tuple. ``chat_output`` is the
        response's ``parsed`` value when the SDK populated it, otherwise the
        response text. ``chat_completion`` is the raw SDK response object.

    Raises:
        OSError: If the prompt file cannot be opened.
        KeyError: If the prompt JSON lacks one of the expected keys.
        ValueError: If the prompt file is not valid JSON or the image cannot
            be encoded.
    """
    prompt_path = os.path.join(prompt_base_path, prompt_in_path)
    with open(prompt_path, "r", encoding="utf-8") as file:
        prompt_dict = json.load(file)

    system_prompt = prompt_dict["system_prompt"]
    user_prompt_head = prompt_dict["user_prompt"]["head"]
    user_prompt_tail = prompt_dict["user_prompt"]["tail"]
    user_prompt_text = "\n".join([user_prompt_head, target_prompt, user_prompt_tail])

    input_content = [user_prompt_text]
    if img_in_data is not None:
        input_content.append(encode_image(img_in_data))

    logging.info("Requested API for chat completion response (sync call)...")
    start_time = time.time()
    # Synchronous call. The system prompt was previously loaded but never
    # sent; it is now passed as the system instruction (skipped when empty).
    chat_completion = client.models.generate_content(
        model=model,
        contents=input_content,
        config=genai.types.GenerateContentConfig(system_instruction=system_prompt or None),
    )
    elapsed = time.time() - start_time

    # `parsed` is only filled in when a response schema is configured; fall
    # back to the plain text so callers do not receive None for a normal reply.
    chat_output = chat_completion.parsed
    if chat_output is None:
        chat_output = chat_completion.text

    # Usage metadata (or individual counts) can be absent, e.g. when no
    # candidate was produced; treat missing counts as zero for the estimate.
    usage = chat_completion.usage_metadata
    input_token = (usage.prompt_token_count or 0) if usage is not None else 0
    output_token = (usage.candidates_token_count or 0) if usage is not None else 0
    # NOTE(review): 0.1 / 0.7 look like USD per million input/output tokens
    # and 1500 a USD->KRW rate -- confirm against current pricing.
    pricing = input_token / 1000000 * 0.1 * 1500 + output_token / 1000000 * 0.7 * 1500
    logging.info(
        f"[GEMINI] Request completed (sync). Time taken: {elapsed:.2f}s / Pricing(KRW): {pricing:.2f}"
    )
    return chat_output, chat_completion