kai-vision

Runtime error

App Files Files Community

seawolf2357 commited on Jun 24, 2024

Commit

234a076

verified ·

1 Parent(s): d87e79b

Update web.py

Browse files

Files changed (1) hide show

web.py +61 -28

web.py CHANGED Viewed

@@ -1,33 +1,66 @@
 import gradio as gr
-import datetime
-import asyncio
-def update_live_message():
-    """ 현재 시간과 'live' 메시지를 반환합니다. """
-    current_time = datetime.datetime.now().strftime('%Y-%m-%d %H:%M:%S')
-    return f"{current_time} - live"
-async def periodic_update(interface, interval=60):
-    """ 주어진 인터페이스에 1분 간격으로 업데이트를 실행합니다. """
-    while True:
-        live_message = update_live_message()
-        interface.update(live_message)
-        await asyncio.sleep(interval)
-def run_gradio():
-    """ Gradio 웹 인터페이스를 설정하고 실행합니다. """
-    live_block = gr.Textbox(label="Live Output", value="Starting...", elem_id="live_output")
-    demo = gr.Blocks()
-    with demo:
-        gr.Markdown("## Live Server Output")
-        live_block
-    demo.launch(server_name="0.0.0.0", server_port=7860, inbrowser=True)
-    # 비동기 업데이트 작업 시작
-    asyncio.run(periodic_update(live_block))
-if __name__ == "__main__":
-    run_gradio()

 import gradio as gr
+from transformers import PaliGemmaForConditionalGeneration, PaliGemmaProcessor
+import torch
+import re
+import os
+# 모델 로드 및 전처리 설정
+model = PaliGemmaForConditionalGeneration.from_pretrained("gokaygokay/sd3-long-captioner").to("cpu").eval()
+processor = PaliGemmaProcessor.from_pretrained("gokaygokay/sd3-long-captioner")
+def modify_caption(caption: str) -> str:
+    prefix_substrings = [
+        ('captured from ', ''),
+        ('captured at ', '')
+    ]
+    pattern = '|'.join([re.escape(opening) for opening, _ in prefix_substrings])
+    replacers = {opening: replacer for opening, replacer in prefix_substrings}
+    def replace_fn(match):
+        return replacers[match.group(0)]
+    return re.sub(pattern, replace_fn, caption, count=1, flags=re.IGNORECASE)
+def create_captions_rich(image):
+    prompt = "caption en"
+    image_tensor = processor(images=image, return_tensors="pt").pixel_values.to("cpu")
+    image_tensor = (image_tensor * 255).type(torch.uint8)
+    model_inputs = processor(text=prompt, images=image_tensor, return_tensors="pt").to("cpu")
+    input_len = model_inputs["input_ids"].shape[-1]
+    with torch.no_grad():
+        generation = model.generate(**model_inputs, max_new_tokens=256, do_sample=False)
+        generation = generation[0][input_len:]
+        decoded = processor.decode(generation, skip_special_tokens=True)
+        modified_caption = modify_caption(decoded)
+    return modified_caption
+css = """
+  #mkd {
+    height: 500px;
+    overflow: auto;
+    border: 1px solid #ccc;
+  }
+"""
+with gr.Blocks(css=css) as demo:
+    gr.HTML("<h1><center>PaliGemma Fine-tuned for Long Captioning<center><h1>")
+    with gr.Tab(label="PaliGemma Long Captioner"):
+        with gr.Row():
+            with gr.Column():
+                input_img = gr.Image(label="Input Picture")
+                submit_btn = gr.Button(value="Submit")
+            output = gr.Text(label="Caption")
+        gr.Examples(
+            [["image1.jpg"], ["image2.jpg"], ["image3.png"], ["image4.jpg"], ["image5.jpg"], ["image6.PNG"]],
+            inputs=[input_img],
+            outputs=[output],
+            fn=create_captions_rich,
+            label='Try captioning on examples'
+        )
+        submit_btn.click(create_captions_rich, [input_img], [output])
+# 포트 변경
+demo.launch(server_name="0.0.0.0", server_port=int(os.getenv