ghibli

Runtime error

App Files Files Community

Update app.py

by ar08 - opened Apr 6

base: refs/heads/main

←

from: refs/pr/1

Discussion Files changed

+88

-32

Files changed (1) hide show

app.py +88 -32

app.py CHANGED Viewed

@@ -3,56 +3,112 @@ import torch
 from diffusers import StableDiffusionImg2ImgPipeline
 from PIL import Image
 import numpy as np
 device = "cuda" if torch.cuda.is_available() else "cpu"
 model_id = "nitrosocke/Ghibli-Diffusion"
-# Load the model (keep safety_checker to avoid warning)
 pipe = StableDiffusionImg2ImgPipeline.from_pretrained(
     model_id,
     torch_dtype=torch.float16 if device == "cuda" else torch.float32,
 )
-pipe.to(device)
 pipe.enable_attention_slicing()
-# Function to convert PIL image to latent-compatible numpy
-def pil_to_np(image):
-    return np.array(image).astype(np.uint8)
-# Generator with step-wise callback
-def generate_ghibli_style(image, steps=25):
-    prompt = "ghibli style portrait"
     intermediate_images = []
-    def callback(step: int, timestep: int, latents):
         with torch.no_grad():
-            img = pipe.decode_latents(latents)
-            img = pipe.numpy_to_pil(img)[0]
-        intermediate_images.append(img)
     with torch.inference_mode():
-        pipe(
             prompt=prompt,
-            image=image,
-            strength=0.6,
-            guidance_scale=6.0,
             num_inference_steps=steps,
             callback=callback,
-            callback_steps=1,
         )
-    return intermediate_images
-# Gradio Interface without deprecated style()
-iface = gr.Interface(
-    fn=generate_ghibli_style,
-    inputs=[
-        gr.Image(type="pil", label="Upload a photo"),
-        gr.Slider(minimum=10, maximum=50, value=25, step=1, label="Inference Steps")
-    ],
-    outputs=gr.Gallery(label="Ghibli-style Generation Progress"),
-    title="✨ Studio Ghibli Portrait Generator ✨",
-    description="Upload a photo and watch it transform into a Ghibli-style portrait step by step!"
-)
-iface.launch()

 from diffusers import StableDiffusionImg2ImgPipeline
 from PIL import Image
 import numpy as np
+from typing import Generator, List
+# Prefer the GPU whenever CUDA is usable; otherwise run on the CPU.
+if torch.cuda.is_available():
+    device = "cuda"
+else:
+    device = "cpu"
 model_id = "nitrosocke/Ghibli-Diffusion"
+# Load the img2img pipeline (float16 on CUDA, float32 on CPU) and move it
+# to the selected device in the same expression.
+pipe = StableDiffusionImg2ImgPipeline.from_pretrained(
+    model_id,
+    torch_dtype=torch.float16 if device == "cuda" else torch.float32,
+).to(device)
 pipe.enable_attention_slicing()
+def generate_ghibli_style(
+    input_image: Image.Image,
+    steps: int = 25,
+    strength: float = 0.6,
+    guidance_scale: float = 7.0,
+    progress: gr.Progress = gr.Progress()
+) -> Generator[List[Image.Image], None, None]:
+    """
+    Stream Ghibli-style renditions of ``input_image`` while the pipeline runs.
+
+    The diffusion pipeline is executed in a worker thread. Its per-step
+    callback decodes the current latents into a PIL image and hands it to
+    this generator through a queue, so every denoising step produces one
+    ``yield`` of the images collected so far. The pipeline's final image is
+    appended last.
+
+    Args:
+        input_image: Source photo passed to the pipeline as ``image``.
+        steps: Value forwarded as ``num_inference_steps``.
+        strength: Value forwarded as ``strength``.
+        guidance_scale: Value forwarded as ``guidance_scale``.
+        progress: Gradio progress tracker, updated once per yielded frame.
+
+    Yields:
+        A new list holding every image produced so far, in order.
+
+    Raises:
+        gr.Error: If no image was provided.
+        Exception: Any error raised inside the pipeline is re-raised here.
+    """
+    # Function-scope imports keep this block self-contained.
+    import queue
+    import threading
+    if input_image is None:
+        raise gr.Error("Please upload a photo first.")
+    # Sliders may deliver floats; the step count is used as an integer here.
+    steps = int(steps)
+    prompt = "ghibli style, high quality, detailed portrait"
+    negative_prompt = "low quality, blurry, bad anatomy"
+    # img2img presumably runs about steps * strength denoising iterations,
+    # so that is the expected number of callback invocations.
+    # NOTE(review): confirm against the installed diffusers version.
+    expected_frames = max(min(int(steps * strength), steps), 1)
+    frames: "queue.Queue" = queue.Queue()
+    finished = object()  # sentinel: the worker has nothing more to send
+    def callback(step: int, timestep: int, latents: torch.Tensor) -> None:
+        # This must stay a plain function: a `yield` here would turn it into
+        # a generator function whose body never runs when the pipeline
+        # calls it.
+        with torch.no_grad():
+            # Decode the latents to image
+            image = pipe.decode_latents(latents)
+            image = pipe.numpy_to_pil(image)[0]
+        frames.put(image)
+    def run_pipeline() -> None:
+        try:
+            with torch.inference_mode():
+                result = pipe(
+                    prompt=prompt,
+                    image=input_image,
+                    negative_prompt=negative_prompt,
+                    strength=strength,
+                    guidance_scale=guidance_scale,
+                    num_inference_steps=steps,
+                    callback=callback,
+                    callback_steps=1  # Call after every step
+                )
+            frames.put(result.images[0])
+        except Exception as exc:  # forwarded to the consumer and re-raised there
+            frames.put(exc)
+        finally:
+            frames.put(finished)
+    worker = threading.Thread(target=run_pipeline, daemon=True)
+    worker.start()
+    intermediate_images = []
+    while True:
+        item = frames.get()
+        if item is finished:
+            break
+        if isinstance(item, Exception):
+            raise item
+        intermediate_images.append(item)
+        # The final image makes the count exceed expected_frames; clamp to 1.
+        progress(
+            min(len(intermediate_images) / expected_frames, 1.0),
+            desc="Generating...",
+        )
+        # Yield a copy so later appends do not alter what was already emitted.
+        yield list(intermediate_images)
+    worker.join()
+# Custom CSS for better appearance.
+# The selectors use the `#gallery` id because the Gallery component below is
+# created with elem_id="gallery"; it is not given a "gallery" class.
+css = """
+#gallery {
+    min-height: 500px;
+}
+#gallery img {
+    max-height: 400px;
+    object-fit: contain;
+}
+"""
+# Gradio interface: controls on the left, generated images on the right.
+with gr.Blocks(css=css) as demo:
+    # Page heading and a one-line usage hint.
+    gr.Markdown("# ✨ Studio Ghibli Portrait Generator ✨")
+    gr.Markdown("Upload a photo and watch it transform into a Ghibli-style portrait in real-time!")
+    with gr.Row():
+        # Left column: source photo plus generation controls.
+        with gr.Column():
+            input_image = gr.Image(label="Upload Photo", type="pil")
+            steps_slider = gr.Slider(
+                minimum=10,
+                maximum=50,
+                value=25,
+                step=1,
+                label="Inference Steps",
+            )
+            strength_slider = gr.Slider(
+                minimum=0.1,
+                maximum=0.9,
+                value=0.6,
+                step=0.05,
+                label="Transformation Strength",
+            )
+            generate_btn = gr.Button("Generate", variant="primary")
+        # Right column: gallery that receives the function's output.
+        with gr.Column():
+            gallery = gr.Gallery(
+                label="Generation Progress",
+                show_label=True,
+                elem_id="gallery",
+                preview=True,
+            )
+    # The same three components feed both the examples and the click handler.
+    control_inputs = [input_image, steps_slider, strength_slider]
+    # Example rows: (image path, inference steps, strength).
+    # NOTE(review): these image paths must exist in the repository — confirm.
+    gr.Examples(
+        examples=[
+            ["examples/portrait1.jpg", 25, 0.6],
+            ["examples/portrait2.jpg", 30, 0.5],
+        ],
+        inputs=control_inputs,
+        label="Try these examples!",
+    )
+    # Clicking "Generate" runs the generator and sends its output to the gallery.
+    generate_btn.click(
+        fn=generate_ghibli_style,
+        inputs=control_inputs,
+        outputs=gallery,
+    )
+# Launch the app
+if __name__ == "__main__":
+    # `concurrency_count` was removed from Blocks.queue() in Gradio 4, so it
+    # is no longer passed. queue() with no arguments is expected to keep the
+    # one-at-a-time default on both Gradio 3 and 4.
+    # NOTE(review): confirm against the Gradio version pinned for this Space.
+    demo.queue().launch(share=True)