Spaces:

vfontech
/

Multi-Input-Res-Diffusion-VFI

Sleeping

App Files Files Community

VicFonch committed 15 days ago

Commit

a89535f

unverified ·

1 Parent(s): 42bdc86

app.py: New styles

Browse files

Files changed (1) hide show

app.py +58 -29

app.py CHANGED Viewed

@@ -26,7 +26,10 @@ def to_numpy(img_tensor: torch.Tensor) -> np.ndarray:
     img_np = np.clip(img_np, 0, 1)
     return (img_np * 255).astype(np.uint8)
-def interpolate(img0_pil, img2_pil, tau=0.5, num_samples=1):
     img0 = transform(img0_pil.convert("RGB")).unsqueeze(0).to(device)
     img2 = transform(img2_pil.convert("RGB")).unsqueeze(0).to(device)
@@ -49,34 +52,60 @@ def interpolate(img0_pil, img2_pil, tau=0.5, num_samples=1):
     except Exception as e:
         print(f"Error during interpolation: {e}")
         return None, None
-demo = gr.Interface(
-    fn=interpolate,
-    inputs=[
-        gr.Image(type="pil", label="Initial Image (frame1)"),
-        gr.Image(type="pil", label="Final Image (frame3)"),
-        gr.Slider(0.0, 1.0, step=0.05, value=0.5, label="Tau Value (only if Num Samples = 1)"),
-        gr.Slider(1, 15, step=1, value=1, label="Number of Samples"),
-    ],
-    outputs=[
-        gr.Image(label="Interpolated Image (if num_samples = 1)"),
-        gr.Video(label="Interpolation in video (if num_samples > 1)"),
-    ],
-    title="Multi-Input ResShift Diffusion VFI",
-    description=(
-        "📄 [arXiv Paper](https://arxiv.org/pdf/2504.05402) • "
-        "🤗 [Model](https://huggingface.co/vfontech/Multiple-Input-Resshift-VFI) • "
-        "🧪 [Colab](https://colab.research.google.com/drive/1MGYycbNMW6Mxu5MUqw_RW_xxiVeHK5Aa#scrollTo=EKaYCioiP3tQ) • "
-        "🌐 [GitHub](https://github.com/VicFonch/Multi-Input-Resshift-Diffusion-VFI)\n\n"
-        "Video interpolation using Conditional Residual Diffusion.\n"
-        "- All images are resized to 256x448.\n"
-        "- If `Number of Samples` = 1, generates only one intermediate image with the given Tau value.\n"
-        "- If `Number of Samples` > 1, ignores Tau and generates a sequence of interpolated images."
-    ),
-    examples=[
-        ["_data/example_images/frame1.png", "_data/example_images/frame3.png", 0.5, 1],
-    ]
-)
 if __name__ == "__main__":
-    demo.launch(server_name="0.0.0.0", ssr_mode=False)

     img_np = np.clip(img_np, 0, 1)
     return (img_np * 255).astype(np.uint8)
+def interpolate(img0_pil: Image.Image,
+                img2_pil: Image.Image,
+                tau: float=0.5,
+                num_samples: int=1) -> tuple:
     img0 = transform(img0_pil.convert("RGB")).unsqueeze(0).to(device)
     img2 = transform(img2_pil.convert("RGB")).unsqueeze(0).to(device)
     except Exception as e:
         print(f"Error during interpolation: {e}")
         return None, None
+# Wrap the Interface in a Blocks layout and add an HTML header above it
+def build_demo() -> gr.Blocks:  # Build the Blocks page: HTML header on top, interpolation Interface below.
+    header = """
+    <div style="text-align: center; padding: 1rem 0;">
+        <h1 style="font-size: 2.2rem; margin-bottom: 0.4rem;">🎞️ Multi-Input ResShift Diffusion VFI</h1>
+        <p style="font-size: 1.1rem; color: #555; margin-bottom: 1rem;">
+            Efficient and stochastic video frame interpolation for hand-drawn animation
+        </p>
+        <div style="display: flex; justify-content: center; flex-wrap: wrap; gap: 10px;">
+            <a href="https://arxiv.org/pdf/2504.05402">
+                <img src="https://img.shields.io/badge/arXiv-Paper-A42C25.svg" alt="arXiv">
+            </a>
+            <a href="https://huggingface.co/vfontech/Multiple-Input-Resshift-VFI">
+                <img src="https://img.shields.io/badge/🤗-Model-ffbd45.svg" alt="HF">
+            </a>
+            <a href="https://colab.research.google.com/drive/1MGYycbNMW6Mxu5MUqw_RW_xxiVeHK5Aa#scrollTo=EKaYCioiP3tQ">
+                <img src="https://img.shields.io/badge/Colab-Demo-green.svg" alt="Colab">
+            </a>
+            <a href="https://github.com/VicFonch/Multi-Input-Resshift-Diffusion-VFI">
+                <img src="https://img.shields.io/badge/GitHub-Code-blue.svg?logo=github" alt="GitHub">
+            </a>
+        </div>
+    </div>
+    """
+    with gr.Blocks() as demo:  # Components created inside this context are attached to `demo`.
+        gr.HTML(header)  # Centered title, tagline and badge links (arXiv, HF model, Colab, GitHub).
+        gr.Interface(  # Form that calls `interpolate` with two images, a tau slider and a sample-count slider.
+            fn=interpolate,
+            inputs=[
+                gr.Image(type="pil", label="Initial Image (frame1)"),
+                gr.Image(type="pil", label="Final Image (frame3)"),
+                gr.Slider(0.0, 1.0, step=0.05, value=0.5, label="Tau Value (only if Num Samples = 1)"),
+                gr.Slider(1, 15, step=1, value=1, label="Number of Samples"),
+            ],
+            outputs=[
+                gr.Image(label="Interpolated Image (if num_samples = 1)"),
+                gr.Video(label="Interpolation in video (if num_samples > 1)"),
+            ],
+            #title="Multi-Input ResShift Diffusion VFI",
+            description=(
+                "Video interpolation using Conditional Residual Diffusion.\n"
+                "- All images are resized to 256x448.\n"
+                "- If `Number of Samples = 1`, generates only one intermediate image with the given Tau value.\n"
+                "- If `Number of Samples > 1`, ignores Tau and generates a sequence of interpolated images."
+            ),
+            examples=[
+                ["_data/example_images/frame1.png", "_data/example_images/frame3.png", 0.5, 1],
+            ],
+        )
+    return demo  # Returned without launching; the caller is responsible for `launch()`.
 if __name__ == "__main__":
+    demo = build_demo()
+    #demo.launch(server_name="0.0.0.0", ssr_mode=False)
+    demo.launch()