Spaces:

cwhuh
/

ponix-generator

Running on Zero

App Files Community

cwhuh committed on Mar 10

Commit

889c270

1 Parent(s): 52ee639

chore

Browse files

Files changed (2) hide show

llm_wrapper.py +99 -99
requirements.txt +1 -2

llm_wrapper.py CHANGED Viewed

@@ -1,101 +1,101 @@
-import logging
-from PIL import Image
-from io import BytesIO
-import requests, os, json, time
-from google import genai
-prompt_base_path = "src/llm_wrapper/prompt"
-client = genai.Client(api_key=os.getenv("GEMINI_API_KEY"))
-def encode_image(image_source):
-    """
-    이미지 경로가 URL이든 로컬 파일이든 Pillow Image 객체이든 동일하게 처리하는 함수.
-    이미지를 열어 google.genai.types.Part 객체로 변환합니다.
-    Pillow에서 지원되지 않는 포맷에 대해서는 예외를 발생시킵니다.
-    """
-    try:
-        # 이미 Pillow 이미지 객체인 경우 그대로 사용
-        if isinstance(image_source, Image.Image):
-            image = image_source
-        else:
-            # URL에서 이미지 다운로드
-            if isinstance(image_source, str) and (
-                image_source.startswith("http://")
-                or image_source.startswith("https://")
-            ):
-                response = requests.get(image_source)
-                image = Image.open(BytesIO(response.content))
-            # 로컬 파일에서 이미지 열기
-            else:
-                image = Image.open(image_source)
-        # 이미지 포맷이 None인 경우 (메모리에서 생성된 이미지 등)
-        if image.format is None:
-            image_format = "JPEG"
-        else:
-            image_format = image.format
-        # 이미지 포맷이 지원되지 않는 경우 예외 발생
-        if image_format not in Image.registered_extensions().values():
-            raise ValueError(f"Unsupported image format: {image_format}.")
-        buffered = BytesIO()
-        # PIL에서 지원되지 않는 포맷이나 다양한 채널을 RGB로 변환 후 저장
-        if image.mode in ("RGBA", "P", "CMYK"):  # RGBA, 팔레트, CMYK 등은 RGB로 변환
-            image = image.convert("RGB")
-        image.save(buffered, format="JPEG")
-        return genai.types.Part.from_bytes(data=buffered.getvalue(), mime_type="image/jpeg")
-    except requests.exceptions.RequestException as e:
-        raise ValueError(f"Failed to download the image from URL: {e}")
-    except IOError as e:
-        raise ValueError(f"Failed to process the image file: {e}")
-    except ValueError as e:
-        raise ValueError(e)
-def run_gemini(
-    target_prompt: str,
-    prompt_in_path: str,
-    img_in_data: str = None,
-    model: str = "gemini-2.0-flash",
-) -> str:
-    """
-    GEMINI API를 동기 방식으로 호출하여 문자열 응답을 받습니다.
-    retry 논리는 제거되었습니다.
-    """
-    with open(os.path.join(prompt_base_path, prompt_in_path), "r", encoding="utf-8") as file:
-        prompt_dict = json.load(file)
-    system_prompt = prompt_dict["system_prompt"]
-    user_prompt_head = prompt_dict["user_prompt"]["head"]
-    user_prompt_tail = prompt_dict["user_prompt"]["tail"]
-    user_prompt_text = "\n".join([user_prompt_head, target_prompt, user_prompt_tail])
-    input_content = [user_prompt_text]
-    if img_in_data is not None:
-        encoded_image = encode_image(img_in_data)
-        input_content.append(encoded_image)
-    logging.info("Requested API for chat completion response (sync call)...")
-    start_time = time.time()
-    # 동기 방식: client.models.generate_content(...)
-    chat_completion = client.models.generate_content(
-        model=model,
-        contents=input_content,
-    )
-    chat_output = chat_completion.parsed
-    input_token = chat_completion.usage_metadata.prompt_token_count
-    output_token = chat_completion.usage_metadata.candidates_token_count
-    pricing = input_token / 1000000 * 0.1 * 1500 + output_token / 1000000 * 0.7 * 1500
-    logging.info(
-        f"[GEMINI] Request completed (sync). Time taken: {time.time()-start_time:.2f}s / Pricing(KRW): {pricing:.2f}"
-    )
-    return chat_output, chat_completion

+# import logging
+# from PIL import Image
+# from io import BytesIO
+# import requests, os, json, time
+# from google import genai
+# prompt_base_path = "src/llm_wrapper/prompt"
+# client = genai.Client(api_key=os.getenv("GEMINI_API_KEY"))
+# def encode_image(image_source):
+#     """
+#     이미지 경로가 URL이든 로컬 파일이든 Pillow Image 객체이든 동일하게 처리하는 함수.
+#     이미지를 열어 google.genai.types.Part 객체로 변환합니다.
+#     Pillow에서 지원되지 않는 포맷에 대해서는 예외를 발생시킵니다.
+#     """
+#     try:
+#         # 이미 Pillow 이미지 객체인 경우 그대로 사용
+#         if isinstance(image_source, Image.Image):
+#             image = image_source
+#         else:
+#             # URL에서 이미지 다운로드
+#             if isinstance(image_source, str) and (
+#                 image_source.startswith("http://")
+#                 or image_source.startswith("https://")
+#             ):
+#                 response = requests.get(image_source)
+#                 image = Image.open(BytesIO(response.content))
+#             # 로컬 파일에서 이미지 열기
+#             else:
+#                 image = Image.open(image_source)
+#         # 이미지 포맷이 None인 경우 (메모리에서 생성된 이미지 등)
+#         if image.format is None:
+#             image_format = "JPEG"
+#         else:
+#             image_format = image.format
+#         # 이미지 포맷이 지원되지 않는 경우 예외 발생
+#         if image_format not in Image.registered_extensions().values():
+#             raise ValueError(f"Unsupported image format: {image_format}.")
+#         buffered = BytesIO()
+#         # PIL에서 지원되지 않는 포맷이나 다양한 채널을 RGB로 변환 후 저장
+#         if image.mode in ("RGBA", "P", "CMYK"):  # RGBA, 팔레트, CMYK 등은 RGB로 변환
+#             image = image.convert("RGB")
+#         image.save(buffered, format="JPEG")
+#         return genai.types.Part.from_bytes(data=buffered.getvalue(), mime_type="image/jpeg")
+#     except requests.exceptions.RequestException as e:
+#         raise ValueError(f"Failed to download the image from URL: {e}")
+#     except IOError as e:
+#         raise ValueError(f"Failed to process the image file: {e}")
+#     except ValueError as e:
+#         raise ValueError(e)
+# def run_gemini(
+#     target_prompt: str,
+#     prompt_in_path: str,
+#     img_in_data: str = None,
+#     model: str = "gemini-2.0-flash",
+# ) -> str:
+#     """
+#     GEMINI API를 동기 방식으로 호출하여 문자열 응답을 받습니다.
+#     retry 논리는 제거되었습니다.
+#     """
+#     with open(os.path.join(prompt_base_path, prompt_in_path), "r", encoding="utf-8") as file:
+#         prompt_dict = json.load(file)
+#     system_prompt = prompt_dict["system_prompt"]
+#     user_prompt_head = prompt_dict["user_prompt"]["head"]
+#     user_prompt_tail = prompt_dict["user_prompt"]["tail"]
+#     user_prompt_text = "\n".join([user_prompt_head, target_prompt, user_prompt_tail])
+#     input_content = [user_prompt_text]
+#     if img_in_data is not None:
+#         encoded_image = encode_image(img_in_data)
+#         input_content.append(encoded_image)
+#     logging.info("Requested API for chat completion response (sync call)...")
+#     start_time = time.time()
+#     # 동기 방식: client.models.generate_content(...)
+#     chat_completion = client.models.generate_content(
+#         model=model,
+#         contents=input_content,
+#     )
+#     chat_output = chat_completion.parsed
+#     input_token = chat_completion.usage_metadata.prompt_token_count
+#     output_token = chat_completion.usage_metadata.candidates_token_count
+#     pricing = input_token / 1000000 * 0.1 * 1500 + output_token / 1000000 * 0.7 * 1500
+#     logging.info(
+#         f"[GEMINI] Request completed (sync). Time taken: {time.time()-start_time:.2f}s / Pricing(KRW): {pricing:.2f}"
+#     )
+#     return chat_output, chat_completion

requirements.txt CHANGED Viewed

@@ -4,5 +4,4 @@ torch
 transformers==4.42.4
 xformers
 sentencepiece
-peft==0.12.0
-google-genai

 transformers==4.42.4
 xformers
 sentencepiece
+peft==0.12.0