Spaces:

Bils
/

AIPromoStudio

Running on Zero

App Files Community

Bils committed on Jan 30

Commit

ced3fa2

verified ·

1 Parent(s): 4f8a245

Update app.py

Browse files

Files changed (1) hide show

app.py +61 -41

app.py CHANGED Viewed

@@ -75,25 +75,26 @@ model_manager = ModelManager()
 # Core Functions
 # -------------------------------
 @spaces.GPU
-def generate_script(user_prompt, model_id, duration, temperature=0.7):
     try:
         text_pipeline = model_manager.get_llama_pipeline(model_id, HF_TOKEN)
-        prompt = f"""Create a {duration}-second audio promo script with these elements:
-1. Voice Script: [clear narration]
 2. Sound Design: [3-5 effects]
-3. Music: [genre/tempo]
 Concept: {user_prompt}"""
         result = text_pipeline(
-            prompt,
             max_new_tokens=300,
-            temperature=temperature,
             do_sample=True
         )
-        return parse_generated_content(result[0]["generated_text"])
     except Exception as e:
         return f"Error: {str(e)}", "", ""
@@ -123,7 +124,7 @@ def parse_generated_content(text):
     return sections["Voice Script"].strip(), sections["Sound Design"].strip(), sections["Music"].strip()
 @spaces.GPU
-def generate_voice(script, tts_model, speed=1.0):
     try:
         if not script.strip():
             return "Error: No script provided"
@@ -170,53 +171,72 @@ def blend_audio(voice_path, music_path, ducking=True, duck_level=10):
         return f"Error: {str(e)}"
 # -------------------------------
-# Gradio Interface
 # -------------------------------
-with gr.Blocks(title="AI Radio Studio", css=".gradio-container {max-width: 800px !important}") as demo:
     gr.Markdown("""
     # 🎙️ AI Radio Studio
-    *Create professional audio content in 4 easy steps*
     """)
     with gr.Tabs():
-        with gr.Tab("1️⃣ Concept"):
-            concept_input = gr.Textbox(label="Your Idea", placeholder="Describe your radio promo...", lines=3)
             with gr.Row():
-                model_select = gr.Dropdown(
-                    choices=list(MODEL_CONFIG["llama_models"].values()),
-                    label="AI Model",
-                    value="meta-llama/Meta-Llama-3-8B-Instruct"
-                )
-                duration_select = gr.Slider(15, 60, 30, step=15, label="Duration (sec)")
-            generate_btn = gr.Button("Generate Script", variant="primary")
-            script_output = gr.Textbox(label="Voice Script", interactive=True)
-            sound_output = gr.Textbox(label="Sound Effects", interactive=True)
-            music_output = gr.Textbox(label="Music Style", interactive=True)
-        with gr.Tab("2️⃣ Voice"):
-            tts_select = gr.Dropdown(
-                choices=list(MODEL_CONFIG["tts_models"].values()),
-                label="Voice Model",
-                value="tts_models/en/ljspeech/tacotron2-DDC"
-            )
-            voice_btn = gr.Button("Generate Voiceover", variant="primary")
-            voice_preview = gr.Audio(label="Preview", type="filepath")
-        with gr.Tab("3️⃣ Music"):
-            music_btn = gr.Button("Generate Music", variant="primary")
             music_preview = gr.Audio(label="Preview", type="filepath")
-        with gr.Tab("4️⃣ Mix"):
             with gr.Row():
-                ducking_toggle = gr.Checkbox(True, label="Duck Music")
-                duck_level = gr.Slider(0, 20, 10, label="Duck Level (dB)")
-            mix_btn = gr.Button("Create Final Mix", variant="primary")
-            final_mix = gr.Audio(label="Final Output", type="filepath")
     # Footer Section
     gr.Markdown("""
-    <div style="text-align: center; margin-top: 20px; padding: 15px; border-top: 1px solid #e0e0e0;">
         <p style="font-size: 0.9em; color: #666;">
             Created with ❤️ by <a href="https://bilsimaging.com" target="_blank">bilsimaging.com</a>
         </p>

 # Core Functions
 # -------------------------------
 @spaces.GPU
+def generate_script(user_prompt, model_id, duration):
     try:
         text_pipeline = model_manager.get_llama_pipeline(model_id, HF_TOKEN)
+        system_prompt = f"""Create a {duration}-second audio promo with these elements:
+1. Voice Script: [Clear narration]
 2. Sound Design: [3-5 effects]
+3. Music: [Genre/tempo]
 Concept: {user_prompt}"""
         result = text_pipeline(
+            system_prompt,
             max_new_tokens=300,
+            temperature=0.7,
             do_sample=True
         )
+        generated_text = result[0]["generated_text"]
+        return parse_generated_content(generated_text)
     except Exception as e:
         return f"Error: {str(e)}", "", ""
     return sections["Voice Script"].strip(), sections["Sound Design"].strip(), sections["Music"].strip()
 @spaces.GPU
+def generate_voice(script, tts_model):
     try:
         if not script.strip():
             return "Error: No script provided"
         return f"Error: {str(e)}"
 # -------------------------------
+# Gradio Interface (Second UI Version)
 # -------------------------------
+with gr.Blocks(title="AI Radio Studio", css="""
+    .gradio-container {max-width: 800px; margin: auto;}
+    .tab-item {padding: 20px; border-radius: 10px;}
+    """) as demo:
     gr.Markdown("""
     # 🎙️ AI Radio Studio
+    *Professional Audio Production Made Simple*
     """)
     with gr.Tabs():
+        # Concept Tab
+        with gr.Tab("🎯 Concept"):
             with gr.Row():
+                with gr.Column():
+                    concept_input = gr.Textbox(
+                        label="Your Idea",
+                        placeholder="Describe your audio project...",
+                        lines=3
+                    )
+                    model_select = gr.Dropdown(
+                        choices=list(MODEL_CONFIG["llama_models"].values()),
+                        label="AI Model",
+                        value="meta-llama/Meta-Llama-3-8B-Instruct"
+                    )
+                    duration_select = gr.Slider(15, 60, 30, step=15, label="Duration (seconds)")
+                    generate_btn = gr.Button("Generate Script", variant="primary")
+                with gr.Column():
+                    script_output = gr.Textbox(label="Voice Script", interactive=True)
+                    sound_output = gr.Textbox(label="Sound Design", interactive=True)
+                    music_output = gr.Textbox(label="Music Suggestions", interactive=True)
+        # Voice Tab
+        with gr.Tab("🗣️ Voice"):
+            with gr.Row():
+                with gr.Column():
+                    tts_select = gr.Dropdown(
+                        choices=list(MODEL_CONFIG["tts_models"].values()),
+                        label="Voice Model",
+                        value="tts_models/en/ljspeech/tacotron2-DDC"
+                    )
+                    voice_btn = gr.Button("Generate Voiceover", variant="primary")
+                with gr.Column():
+                    voice_preview = gr.Audio(label="Preview", type="filepath")
+        # Music Tab
+        with gr.Tab("🎵 Music"):
+            music_btn = gr.Button("Generate Music Track", variant="primary")
             music_preview = gr.Audio(label="Preview", type="filepath")
+        # Mix Tab
+        with gr.Tab("🔊 Mix"):
             with gr.Row():
+                with gr.Column():
+                    ducking_toggle = gr.Checkbox(True, label="Enable Voice Ducking")
+                    duck_level = gr.Slider(0, 20, 10, label="Ducking Level (dB)")
+                    mix_btn = gr.Button("Create Final Mix", variant="primary")
+                with gr.Column():
+                    final_mix = gr.Audio(label="Final Output", type="filepath")
     # Footer Section
     gr.Markdown("""
+    <div style="text-align: center; margin-top: 30px; padding: 15px; border-top: 1px solid #e0e0e0;">
         <p style="font-size: 0.9em; color: #666;">
             Created with ❤️ by <a href="https://bilsimaging.com" target="_blank">bilsimaging.com</a>
         </p>