Spaces:

Bils
/

AIPromoStudio

Running on Zero

App Files Files Community

Bils committed on Jan 30

Commit

1a03830

verified ·

1 Parent(s): ced3fa2

Update app.py

Browse files

Files changed (1) hide show

app.py +41 -61

app.py CHANGED Viewed

@@ -75,26 +75,25 @@ model_manager = ModelManager()
 # Core Functions
 # -------------------------------
 @spaces.GPU
-def generate_script(user_prompt, model_id, duration):
     try:
         text_pipeline = model_manager.get_llama_pipeline(model_id, HF_TOKEN)
-        system_prompt = f"""Create a {duration}-second audio promo with these elements:
-1. Voice Script: [Clear narration]
 2. Sound Design: [3-5 effects]
-3. Music: [Genre/tempo]
 Concept: {user_prompt}"""
         result = text_pipeline(
-            system_prompt,
             max_new_tokens=300,
-            temperature=0.7,
             do_sample=True
         )
-        generated_text = result[0]["generated_text"]
-        return parse_generated_content(generated_text)
     except Exception as e:
         return f"Error: {str(e)}", "", ""
@@ -124,7 +123,7 @@ def parse_generated_content(text):
     return sections["Voice Script"].strip(), sections["Sound Design"].strip(), sections["Music"].strip()
 @spaces.GPU
-def generate_voice(script, tts_model):
     try:
         if not script.strip():
             return "Error: No script provided"
@@ -171,72 +170,53 @@ def blend_audio(voice_path, music_path, ducking=True, duck_level=10):
         return f"Error: {str(e)}"
 # -------------------------------
-# Gradio Interface (Second UI Version)
 # -------------------------------
-with gr.Blocks(title="AI Radio Studio", css="""
-    .gradio-container {max-width: 800px; margin: auto;}
-    .tab-item {padding: 20px; border-radius: 10px;}
-    """) as demo:
     gr.Markdown("""
     # 🎙️ AI Radio Studio
-    *Professional Audio Production Made Simple*
     """)
     with gr.Tabs():
-        # Concept Tab
-        with gr.Tab("🎯 Concept"):
-            with gr.Row():
-                with gr.Column():
-                    concept_input = gr.Textbox(
-                        label="Your Idea",
-                        placeholder="Describe your audio project...",
-                        lines=3
-                    )
-                    model_select = gr.Dropdown(
-                        choices=list(MODEL_CONFIG["llama_models"].values()),
-                        label="AI Model",
-                        value="meta-llama/Meta-Llama-3-8B-Instruct"
-                    )
-                    duration_select = gr.Slider(15, 60, 30, step=15, label="Duration (seconds)")
-                    generate_btn = gr.Button("Generate Script", variant="primary")
-                with gr.Column():
-                    script_output = gr.Textbox(label="Voice Script", interactive=True)
-                    sound_output = gr.Textbox(label="Sound Design", interactive=True)
-                    music_output = gr.Textbox(label="Music Suggestions", interactive=True)
-        # Voice Tab
-        with gr.Tab("🗣️ Voice"):
             with gr.Row():
-                with gr.Column():
-                    tts_select = gr.Dropdown(
-                        choices=list(MODEL_CONFIG["tts_models"].values()),
-                        label="Voice Model",
-                        value="tts_models/en/ljspeech/tacotron2-DDC"
-                    )
-                    voice_btn = gr.Button("Generate Voiceover", variant="primary")
-                with gr.Column():
-                    voice_preview = gr.Audio(label="Preview", type="filepath")
-        # Music Tab
-        with gr.Tab("🎵 Music"):
-            music_btn = gr.Button("Generate Music Track", variant="primary")
             music_preview = gr.Audio(label="Preview", type="filepath")
-        # Mix Tab
-        with gr.Tab("🔊 Mix"):
             with gr.Row():
-                with gr.Column():
-                    ducking_toggle = gr.Checkbox(True, label="Enable Voice Ducking")
-                    duck_level = gr.Slider(0, 20, 10, label="Ducking Level (dB)")
-                    mix_btn = gr.Button("Create Final Mix", variant="primary")
-                with gr.Column():
-                    final_mix = gr.Audio(label="Final Output", type="filepath")
     # Footer Section
     gr.Markdown("""
-    <div style="text-align: center; margin-top: 30px; padding: 15px; border-top: 1px solid #e0e0e0;">
         <p style="font-size: 0.9em; color: #666;">
             Created with ❤️ by <a href="https://bilsimaging.com" target="_blank">bilsimaging.com</a>
         </p>

 # Core Functions
 # -------------------------------
 @spaces.GPU
+def generate_script(user_prompt, model_id, duration, temperature=0.7):
     try:
         text_pipeline = model_manager.get_llama_pipeline(model_id, HF_TOKEN)
+        prompt = f"""Create a {duration}-second audio promo script with these elements:
+1. Voice Script: [clear narration]
 2. Sound Design: [3-5 effects]
+3. Music: [genre/tempo]
 Concept: {user_prompt}"""
         result = text_pipeline(
+            prompt,
             max_new_tokens=300,
+            temperature=temperature,
             do_sample=True
         )
+        return parse_generated_content(result[0]["generated_text"])
     except Exception as e:
         return f"Error: {str(e)}", "", ""
     return sections["Voice Script"].strip(), sections["Sound Design"].strip(), sections["Music"].strip()
 @spaces.GPU
+def generate_voice(script, tts_model, speed=1.0):
     try:
         if not script.strip():
             return "Error: No script provided"
         return f"Error: {str(e)}"
 # -------------------------------
+# Gradio Interface
 # -------------------------------
+with gr.Blocks(title="AI Radio Studio", css=".gradio-container {max-width: 800px !important}") as demo:
     gr.Markdown("""
     # 🎙️ AI Radio Studio
+    *Create professional audio content in 4 easy steps*
     """)
     with gr.Tabs():
+        with gr.Tab("1️⃣ Concept"):
+            concept_input = gr.Textbox(label="Your Idea", placeholder="Describe your radio promo...", lines=3)
             with gr.Row():
+                model_select = gr.Dropdown(
+                    choices=list(MODEL_CONFIG["llama_models"].values()),
+                    label="AI Model",
+                    value="meta-llama/Meta-Llama-3-8B-Instruct"
+                )
+                duration_select = gr.Slider(15, 60, 30, step=15, label="Duration (sec)")
+            generate_btn = gr.Button("Generate Script", variant="primary")
+            script_output = gr.Textbox(label="Voice Script", interactive=True)
+            sound_output = gr.Textbox(label="Sound Effects", interactive=True)
+            music_output = gr.Textbox(label="Music Style", interactive=True)
+        with gr.Tab("2️⃣ Voice"):
+            tts_select = gr.Dropdown(
+                choices=list(MODEL_CONFIG["tts_models"].values()),
+                label="Voice Model",
+                value="tts_models/en/ljspeech/tacotron2-DDC"
+            )
+            voice_btn = gr.Button("Generate Voiceover", variant="primary")
+            voice_preview = gr.Audio(label="Preview", type="filepath")
+        with gr.Tab("3️⃣ Music"):
+            music_btn = gr.Button("Generate Music", variant="primary")
             music_preview = gr.Audio(label="Preview", type="filepath")
+        with gr.Tab("4️⃣ Mix"):
             with gr.Row():
+                ducking_toggle = gr.Checkbox(True, label="Duck Music")
+                duck_level = gr.Slider(0, 20, 10, label="Duck Level (dB)")
+            mix_btn = gr.Button("Create Final Mix", variant="primary")
+            final_mix = gr.Audio(label="Final Output", type="filepath")
     # Footer Section
     gr.Markdown("""
+    <div style="text-align: center; margin-top: 20px; padding: 15px; border-top: 1px solid #e0e0e0;">
         <p style="font-size: 0.9em; color: #666;">
             Created with ❤️ by <a href="https://bilsimaging.com" target="_blank">bilsimaging.com</a>
         </p>