Spaces:

AmberHeart
/

AetherV1

Running on Zero

App Files Community

AmberHeart committed on Mar 28

Commit

f69b2cb

1 Parent(s): b77de08

update example

Browse files

Files changed (1) hide show

app.py +86 -91

app.py CHANGED Viewed

@@ -461,7 +461,7 @@ def save_output_files(
     return paths
-@spaces.GPU(duration=100)
 def process_reconstruction(
     video_file,
     height,
@@ -860,26 +860,24 @@ def update_task_ui(task):
     """Update UI elements based on selected task."""
     if task == "reconstruction":
         return (
-            gr.update(visible=True),  # video_input
-            gr.update(visible=False),  # image_input
-            gr.update(visible=False),  # goal_input
-            gr.update(visible=False),  # image_preview
-            gr.update(visible=False),  # goal_preview
             gr.update(value=4),  # num_inference_steps
             gr.update(visible=True),  # sliding_window_stride
             gr.update(visible=False),  # use_dynamic_cfg
             gr.update(visible=False),  # raymap_option
             gr.update(visible=False),  # post_reconstruction
             gr.update(value=1.0),  # guidance_scale
-            gr.update(visible=False),  # gpu_time_warning
         )
     elif task == "prediction":
         return (
-            gr.update(visible=False),  # video_input
-            gr.update(visible=True),  # image_input
-            gr.update(visible=False),  # goal_input
-            gr.update(visible=True),  # image_preview
-            gr.update(visible=False),  # goal_preview
             gr.update(value=50),  # num_inference_steps
             gr.update(visible=False),  # sliding_window_stride
             gr.update(visible=True),  # use_dynamic_cfg
@@ -890,11 +888,10 @@ def update_task_ui(task):
         )
     elif task == "planning":
         return (
-            gr.update(visible=False),  # video_input
-            gr.update(visible=True),  # image_input
-            gr.update(visible=True),  # goal_input
-            gr.update(visible=True),  # image_preview
-            gr.update(visible=True),  # goal_preview
             gr.update(value=50),  # num_inference_steps
             gr.update(visible=False),  # sliding_window_stride
             gr.update(visible=True),  # use_dynamic_cfg
@@ -1389,44 +1386,85 @@ with gr.Blocks(
                     gpu_time_warning = gr.Markdown(
                         """
                         <div class="warning-box">
-                        <strong>⚠️ Note:</strong> Due to HuggingFace Spaces ZERO GPU quota limitations (5 minutes max),
-                        prediction and planning tasks may not complete in time. We strongly recommend deploying
-                        our model locally for the full Aether experience.
                         </div>
                         """,
                         visible=False
                     )
                 with gr.Group(elem_classes=["input-section"]):
-                    # Input section - changes based on task
                     gr.Markdown("## 📥 Input", elem_classes=["task-header"])
                     # Task-specific inputs
-                    video_input = gr.Video(
-                        label="Upload Input Video",
-                        sources=["upload"],
-                        visible=True,
-                        interactive=True,
-                        elem_id="video_input",
-                    )
-                    image_input = gr.File(
-                        label="Upload Start Image",
-                        file_count="single",
-                        file_types=["image"],
-                        visible=False,
-                        interactive=True,
-                        elem_id="image_input",
-                    )
-                    goal_input = gr.File(
-                        label="Upload Goal Image",
-                        file_count="single",
-                        file_types=["image"],
-                        visible=False,
-                        interactive=True,
-                        elem_id="goal_input",
-                    )
                     with gr.Row(visible=False) as preview_row:
                         image_preview = gr.Image(
@@ -1646,58 +1684,15 @@ with gr.Blocks(
                             """
                         )
-        # Example Accordion
-        with gr.Tab("Reconstruction"):
-            reconstruction_examples = gr.Examples(
-                examples=[
-                    ["assets/example_videos/bridge.mp4"],
-                    ["assets/example_videos/moviegen.mp4"],
-                    ["assets/example_videos/nuscenes.mp4"],
-                    ["assets/example_videos/veo2.mp4"],
-                ],
-                inputs=[video_input],
-                label="Reconstruction Examples",
-                fn=lambda x: {"task": gr.update(value="reconstruction")}
-            )
-        with gr.Tab("Prediction"):
-            prediction_examples = gr.Examples(
-                examples=[
-                    ["assets/example_obs/car.png"],
-                    ["assets/example_obs/cartoon.png"],
-                    ["assets/example_obs/garden.jpg"],
-                    ["assets/example_obs/room.jpg"],
-                ],
-                inputs=[image_input],
-                label="Prediction Examples",
-                fn=lambda x: {"task": gr.update(value="prediction")},
-                examples_per_page=4,
-            )
-        with gr.Tab("Planning"):
-            planning_examples = gr.Examples(
-                examples=[
-                    ["assets/example_obs_goal/01_obs.png", "assets/example_obs_goal/01_goal.png"],
-                    ["assets/example_obs_goal/02_obs.png", "assets/example_obs_goal/02_goal.png"],
-                    ["assets/example_obs_goal/03_obs.png", "assets/example_obs_goal/03_goal.png"],
-                    ["assets/example_obs_goal/04_obs.png", "assets/example_obs_goal/04_goal.png"],
-                ],
-                inputs=[image_input, goal_input],
-                label="Planning Examples",
-                fn=lambda x: {"task": gr.update(value="planning")},
-                examples_per_page=4,
-            )
     # Event handlers
     task.change(
         fn=update_task_ui,
         inputs=[task],
         outputs=[
-            video_input,
-            image_input,
-            goal_input,
-            image_preview,
-            goal_preview,
             num_inference_steps,
             sliding_window_stride,
             use_dynamic_cfg,

     return paths
+@spaces.GPU(duration=300)
 def process_reconstruction(
     video_file,
     height,
     """Update UI elements based on selected task."""
     if task == "reconstruction":
         return (
+            gr.update(visible=True),  # reconstruction_group
+            gr.update(visible=False),  # prediction_group
+            gr.update(visible=False),  # planning_group
+            gr.update(visible=False),  # preview_row
             gr.update(value=4),  # num_inference_steps
             gr.update(visible=True),  # sliding_window_stride
             gr.update(visible=False),  # use_dynamic_cfg
             gr.update(visible=False),  # raymap_option
             gr.update(visible=False),  # post_reconstruction
             gr.update(value=1.0),  # guidance_scale
+            gr.update(visible=True),  # gpu_time_warning
         )
     elif task == "prediction":
         return (
+            gr.update(visible=False),  # reconstruction_group
+            gr.update(visible=True),  # prediction_group
+            gr.update(visible=False),  # planning_group
+            gr.update(visible=True),  # preview_row
             gr.update(value=50),  # num_inference_steps
             gr.update(visible=False),  # sliding_window_stride
             gr.update(visible=True),  # use_dynamic_cfg
         )
     elif task == "planning":
         return (
+            gr.update(visible=False),  # reconstruction_group
+            gr.update(visible=False),  # prediction_group
+            gr.update(visible=True),  # planning_group
+            gr.update(visible=True),  # preview_row
             gr.update(value=50),  # num_inference_steps
             gr.update(visible=False),  # sliding_window_stride
             gr.update(visible=True),  # use_dynamic_cfg
                     gpu_time_warning = gr.Markdown(
                         """
                         <div class="warning-box">
+                        <strong>⚠️ Warning:</strong> Due to HuggingFace Spaces ZERO GPU quota limitations,
+                        only short video reconstruction tasks (less than 10s) can be completed online.
+                        For long video reconstruction, prediction, and planning tasks, we strongly
+                        recommend deploying the model locally to experience the full capabilities of Aether.
                         </div>
                         """,
                         visible=False
                     )
                 with gr.Group(elem_classes=["input-section"]):
                     gr.Markdown("## 📥 Input", elem_classes=["task-header"])
                     # Task-specific inputs
+                    with gr.Group(visible=True) as reconstruction_group:
+                        video_input = gr.Video(
+                            label="Upload Input Video",
+                            sources=["upload"],
+                            interactive=True,
+                            elem_id="video_input",
+                        )
+                        reconstruction_examples = gr.Examples(
+                            examples=[
+                                ["assets/example_videos/bridge.mp4"],
+                                ["assets/example_videos/moviegen.mp4"],
+                                ["assets/example_videos/nuscenes.mp4"],
+                                ["assets/example_videos/veo2.mp4"],
+                            ],
+                            inputs=[video_input],
+                            label="Reconstruction Examples",
+                            examples_per_page=4,
+                        )
+                    with gr.Group(visible=False) as prediction_group:
+                        image_input = gr.File(
+                            label="Upload Start Image",
+                            file_count="single",
+                            file_types=["image"],
+                            interactive=True,
+                            elem_id="image_input",
+                        )
+                        prediction_examples = gr.Examples(
+                            examples=[
+                                ["assets/example_obs/car.png"],
+                                ["assets/example_obs/cartoon.png"],
+                                ["assets/example_obs/garden.jpg"],
+                                ["assets/example_obs/room.jpg"],
+                            ],
+                            inputs=[image_input],
+                            label="Prediction Examples",
+                            examples_per_page=4,
+                        )
+                    with gr.Group(visible=False) as planning_group:
+                        with gr.Row():
+                            image_input_planning = gr.File(
+                                label="Upload Start Image",
+                                file_count="single",
+                                file_types=["image"],
+                                interactive=True,
+                                elem_id="image_input_planning",
+                            )
+                            goal_input = gr.File(
+                                label="Upload Goal Image",
+                                file_count="single",
+                                file_types=["image"],
+                                interactive=True,
+                                elem_id="goal_input",
+                            )
+                        planning_examples = gr.Examples(
+                            examples=[
+                                ["assets/example_obs_goal/01_obs.png", "assets/example_obs_goal/01_goal.png"],
+                                ["assets/example_obs_goal/02_obs.png", "assets/example_obs_goal/02_goal.png"],
+                                ["assets/example_obs_goal/03_obs.png", "assets/example_obs_goal/03_goal.png"],
+                                ["assets/example_obs_goal/04_obs.png", "assets/example_obs_goal/04_goal.png"],
+                            ],
+                            inputs=[image_input_planning, goal_input],
+                            label="Planning Examples",
+                            examples_per_page=4,
+                        )
                     with gr.Row(visible=False) as preview_row:
                         image_preview = gr.Image(
                             """
                         )
     # Event handlers
     task.change(
         fn=update_task_ui,
         inputs=[task],
         outputs=[
+            reconstruction_group,
+            prediction_group,
+            planning_group,
+            preview_row,
             num_inference_steps,
             sliding_window_stride,
             use_dynamic_cfg,