cwhuh committed on
Commit
dc592b9
ยท
1 Parent(s): eb9cbe1

fix : google-genai -> openai

Browse files
__pycache__/live_preview_helpers.cpython-310.pyc CHANGED
Binary files a/__pycache__/live_preview_helpers.cpython-310.pyc and b/__pycache__/live_preview_helpers.cpython-310.pyc differ
 
__pycache__/llm_wrapper.cpython-310.pyc CHANGED
Binary files a/__pycache__/llm_wrapper.cpython-310.pyc and b/__pycache__/llm_wrapper.cpython-310.pyc differ
 
llm_wrapper.py CHANGED
@@ -1,105 +1,43 @@
1
- import logging
2
- from PIL import Image
3
- from io import BytesIO
4
- import requests, os, json, time
5
-
6
- from google import genai
7
 
8
  prompt_base_path = ""
9
- client = genai.Client(api_key=os.getenv("GEMINI_API_KEY"))
10
-
11
-
12
- def encode_image(image_source):
13
- """
14
- ์ด๋ฏธ์ง€ ๊ฒฝ๋กœ๊ฐ€ URL์ด๋“  ๋กœ์ปฌ ํŒŒ์ผ์ด๋“  Pillow Image ๊ฐ์ฒด์ด๋“  ๋™์ผํ•˜๊ฒŒ ์ฒ˜๋ฆฌํ•˜๋Š” ํ•จ์ˆ˜.
15
- ์ด๋ฏธ์ง€๋ฅผ ์—ด์–ด google.genai.types.Part ๊ฐ์ฒด๋กœ ๋ณ€ํ™˜ํ•ฉ๋‹ˆ๋‹ค.
16
- Pillow์—์„œ ์ง€์›๋˜์ง€ ์•Š๋Š” ํฌ๋งท์— ๋Œ€ํ•ด์„œ๋Š” ์˜ˆ์™ธ๋ฅผ ๋ฐœ์ƒ์‹œํ‚ต๋‹ˆ๋‹ค.
17
- """
18
- try:
19
- # ์ด๋ฏธ Pillow ์ด๋ฏธ์ง€ ๊ฐ์ฒด์ธ ๊ฒฝ์šฐ ๊ทธ๋Œ€๋กœ ์‚ฌ์šฉ
20
- if isinstance(image_source, Image.Image):
21
- image = image_source
22
- else:
23
- # URL์—์„œ ์ด๋ฏธ์ง€ ๋‹ค์šด๋กœ๋“œ
24
- if isinstance(image_source, str) and (
25
- image_source.startswith("http://")
26
- or image_source.startswith("https://")
27
- ):
28
- response = requests.get(image_source)
29
- image = Image.open(BytesIO(response.content))
30
- # ๋กœ์ปฌ ํŒŒ์ผ์—์„œ ์ด๋ฏธ์ง€ ์—ด๊ธฐ
31
- else:
32
- image = Image.open(image_source)
33
-
34
- # ์ด๋ฏธ์ง€ ํฌ๋งท์ด None์ธ ๊ฒฝ์šฐ (๋ฉ”๋ชจ๋ฆฌ์—์„œ ์ƒ์„ฑ๋œ ์ด๋ฏธ์ง€ ๋“ฑ)
35
- if image.format is None:
36
- image_format = "JPEG"
37
- else:
38
- image_format = image.format
39
-
40
- # ์ด๋ฏธ์ง€ ํฌ๋งท์ด ์ง€์›๋˜์ง€ ์•Š๋Š” ๊ฒฝ์šฐ ์˜ˆ์™ธ ๋ฐœ์ƒ
41
- if image_format not in Image.registered_extensions().values():
42
- raise ValueError(f"Unsupported image format: {image_format}.")
43
-
44
- buffered = BytesIO()
45
- # PIL์—์„œ ์ง€์›๋˜์ง€ ์•Š๋Š” ํฌ๋งท์ด๋‚˜ ๋‹ค์–‘ํ•œ ์ฑ„๋„์„ RGB๋กœ ๋ณ€ํ™˜ ํ›„ ์ €์žฅ
46
- if image.mode in ("RGBA", "P", "CMYK"): # RGBA, ํŒ”๋ ˆํŠธ, CMYK ๋“ฑ์€ RGB๋กœ ๋ณ€ํ™˜
47
- image = image.convert("RGB")
48
- image.save(buffered, format="JPEG")
49
-
50
- return genai.types.Part.from_bytes(data=buffered.getvalue(), mime_type="image/jpeg")
51
 
52
- except requests.exceptions.RequestException as e:
53
- raise ValueError(f"Failed to download the image from URL: {e}")
54
- except IOError as e:
55
- raise ValueError(f"Failed to process the image file: {e}")
56
- except ValueError as e:
57
- raise ValueError(e)
58
 
59
 
60
  def run_gemini(
61
  target_prompt: str,
62
  prompt_in_path: str,
63
- img_in_data: str = None,
64
- model: str = "gemini-2.0-flash",
65
  ) -> str:
66
  """
67
- GEMINI API๋ฅผ ๋™๊ธฐ ๋ฐฉ์‹์œผ๋กœ ํ˜ธ์ถœํ•˜์—ฌ ๋ฌธ์ž์—ด ์‘๋‹ต์„ ๋ฐ›์Šต๋‹ˆ๋‹ค.
68
- retry ๋…ผ๋ฆฌ๋Š” ์ œ๊ฑฐ๋˜์—ˆ์Šต๋‹ˆ๋‹ค.
69
  """
70
- with open(os.path.join(prompt_base_path, prompt_in_path), "r", encoding="utf-8") as file:
 
 
 
 
71
  prompt_dict = json.load(file)
72
 
73
  system_prompt = prompt_dict["system_prompt"]
74
- user_prompt_head = prompt_dict["user_prompt"]["head"]
75
- user_prompt_tail = prompt_dict["user_prompt"]["tail"]
76
-
77
- user_prompt_text = "\n".join([user_prompt_head, target_prompt, user_prompt_tail])
78
- input_content = [user_prompt_text]
79
-
80
- if img_in_data is not None:
81
- encoded_image = encode_image(img_in_data)
82
- input_content.append(encoded_image)
83
-
84
- logging.info("Requested API for chat completion response (sync call)...")
85
- start_time = time.time()
86
-
87
- # ๋™๊ธฐ ๋ฐฉ์‹: client.models.generate_content(...)
88
- chat_completion = client.models.generate_content(
89
- model=model,
90
- contents=input_content,
91
- config={
92
- "system_instruction": system_prompt,
93
- }
94
  )
95
- print(f"Chat Completion: {chat_completion}")
96
-
97
- chat_output = chat_completion.candidates[0].content.parts[0].text
98
- input_token = chat_completion.usage_metadata.prompt_token_count
99
- output_token = chat_completion.usage_metadata.candidates_token_count
100
- pricing = input_token / 1000000 * 0.1 * 1500 + output_token / 1000000 * 0.7 * 1500
101
 
102
- logging.info(
103
- f"[GEMINI] Request completed (sync). Time taken: {time.time()-start_time:.2f}s / Pricing(KRW): {pricing:.2f}"
 
 
 
 
 
 
 
104
  )
 
105
  return chat_output
 
1
+ import openai, os, json
 
 
 
 
 
2
 
3
  prompt_base_path = ""
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4
 
5
+ client = openai.OpenAI(
6
+ api_key=os.getenv("GEMINI_API_KEY"),
7
+ base_url="https://generativelanguage.googleapis.com/v1beta/openai/",
8
+ )
 
 
9
 
10
 
11
def run_gemini(
    target_prompt: str,
    prompt_in_path: str,
    llm_model: str = "gemini-2.0-flash-exp",
) -> str:
    """Call a Gemini model via the OpenAI-compatible endpoint and return its reply.

    Loads a JSON prompt template, sandwiches ``target_prompt`` between the
    template's user-prompt ``head`` and ``tail`` sections, and sends the
    result as a single chat completion request.

    Args:
        target_prompt: Text to insert into the user prompt template.
        prompt_in_path: Path, joined onto ``prompt_base_path``, of a JSON
            file with keys ``system_prompt`` and ``user_prompt`` (the latter
            containing ``head`` and ``tail`` strings).
        llm_model: Model identifier passed to the API.

    Returns:
        The assistant message content of the first choice.
    """
    # Load the prompt template.
    with open(
        os.path.join(prompt_base_path, prompt_in_path), "r", encoding="utf-8"
    ) as file:
        prompt_dict = json.load(file)

    system_prompt = prompt_dict["system_prompt"]
    user_prompt_head = prompt_dict["user_prompt"]["head"]
    user_prompt_tail = prompt_dict["user_prompt"]["tail"]

    user_prompt_text = "\n".join([user_prompt_head, target_prompt, user_prompt_tail])
    input_content = [{"type": "text", "text": user_prompt_text}]

    # Use the stable chat-completions endpoint: the beta ``parse`` helper is
    # intended for structured outputs (``response_format=...``) and is
    # unnecessary for a plain text reply.
    chat_completion = client.chat.completions.create(
        model=llm_model,
        messages=[
            {"role": "system", "content": system_prompt},
            {"role": "user", "content": input_content},
        ],
    )
    return chat_completion.choices[0].message.content
requirements.txt CHANGED
@@ -5,5 +5,5 @@ transformers==4.42.4
5
  xformers
6
  sentencepiece
7
  peft==0.12.0
8
- google-genai
9
- gradio
 
5
  xformers
6
  sentencepiece
7
  peft==0.12.0
8
+ openai
9
+ gradio==4.43.0