kai-vision

Runtime error

App Files Community

seawolf2357 committed on Jun 24, 2024

Commit

d87e79b

verified ·

1 Parent(s): 655b8e8

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -10

app.py CHANGED Viewed

@@ -8,6 +8,7 @@ import re
 import requests
 from PIL import Image
 import io
 # 로깅 설정
 logging.basicConfig(level=logging.DEBUG, format='%(asctime)s:%(levelname)s:%(name)s: %(message)s', handlers=[logging.StreamHandler()])
@@ -36,21 +37,22 @@ def modify_caption(caption: str) -> str:
     return re.sub(pattern, replace_fn, caption, count=1, flags=re.IGNORECASE)
-def create_captions_rich(image: Image.Image) -> str:
     prompt = "caption en"
-    # 이미지 데이터를 전처리하여 processor에 전달
     image_tensor = processor(images=image, return_tensors="pt").pixel_values.to("cpu")
-    # 이미지 범위 조정 [0, 1]에서 [0, 255]로
     image_tensor = (image_tensor * 255).type(torch.uint8)
     model_inputs = processor(text=prompt, images=image_tensor, return_tensors="pt").to("cpu")
     input_len = model_inputs["input_ids"].shape[-1]
-    with torch.no_grad():
-        generation = model.generate(**model_inputs, max_new_tokens=256, do_sample=False)
-        generation = generation[0][input_len:]
-        decoded = processor.decode(generation, skip_special_tokens=True)
-        modified_caption = modify_caption(decoded)
     return modified_caption
 # 특정 채널 ID 설정
@@ -64,9 +66,12 @@ class MyClient(discord.Client):
     async def on_ready(self):
         logging.info(f'{self.user}로 로그인되었습니다!')
-        subprocess.Popen(["python", "web.py"])
         logging.info("Web.py 서버가 시작되었습니다.")
     async def on_message(self, message):
         if message.author == self.user:
             return
@@ -90,7 +95,7 @@ class MyClient(discord.Client):
 async def process_image(image_url, message):
     image = await download_image(image_url)
-    caption = create_captions_rich(image)
     return f"{message.author.mention}, 인식된 이미지 설명: {caption}"
 async def download_image(url):

 import requests
 from PIL import Image
 import io
+import asyncio
 # 로깅 설정
 logging.basicConfig(level=logging.DEBUG, format='%(asctime)s:%(levelname)s:%(name)s: %(message)s', handlers=[logging.StreamHandler()])
     return re.sub(pattern, replace_fn, caption, count=1, flags=re.IGNORECASE)
+async def create_captions_rich(image: Image.Image) -> str:
     prompt = "caption en"
     image_tensor = processor(images=image, return_tensors="pt").pixel_values.to("cpu")
     image_tensor = (image_tensor * 255).type(torch.uint8)
     model_inputs = processor(text=prompt, images=image_tensor, return_tensors="pt").to("cpu")
     input_len = model_inputs["input_ids"].shape[-1]
+    loop = asyncio.get_event_loop()
+    generation = await loop.run_in_executor(
+        None,
+        lambda: model.generate(**model_inputs, max_new_tokens=256, do_sample=False)
+    )
+    generation = generation[0][input_len:]
+    decoded = processor.decode(generation, skip_special_tokens=True)
+    modified_caption = modify_caption(decoded)
     return modified_caption
 # 특정 채널 ID 설정
     async def on_ready(self):
         logging.info(f'{self.user}로 로그인되었습니다!')
+        asyncio.create_task(self.start_gradio_server())
         logging.info("Web.py 서버가 시작되었습니다.")
+    async def start_gradio_server(self):
+        subprocess.run(["python", "web.py"], check=True)
     async def on_message(self, message):
         if message.author == self.user:
             return
 async def process_image(image_url, message):
     image = await download_image(image_url)
+    caption = await create_captions_rich(image)
     return f"{message.author.mention}, 인식된 이미지 설명: {caption}"
 async def download_image(url):