Spaces:

Jaward
/

optimus

Sleeping

App Files Files Community

Jaward committed on Aug 20, 2024

Commit

3169305

verified ·

1 Parent(s): c274feb

Update app.py

Browse files

Files changed (1) hide show

app.py +43 -52

app.py CHANGED Viewed

@@ -124,64 +124,57 @@ def models(text, model="Llama 3 8B Service", seed=42):
         return output
-def translate_speech(audio_file, target_language):
-    if audio_file is None:
-        return None
-    language_code = LANGUAGE_CODES[target_language]
-    output_file = "translated_audio.wav"
-    command = [
-        "expressivity_predict",
-        audio_file,
-        "--tgt_lang", language_code,
-        "--model_name", "seamless_expressivity",
-        "--vocoder_name", "vocoder_pretssel",
-        "--gated-model-dir", "models",
-        "--output_path", output_file
-    ]
-    subprocess.run(command, check=True)
-    if os.path.exists(output_file):
-        print(f"File created successfully: {output_file}")
-        return output_file
-    else:
-        print(f"File not found: {output_file}")
         return None
-async def respond_with_retry(audio, model, seed, target_language, max_retries=3):
-    for attempt in range(max_retries):
-        try:
-            return await respond(audio, model, seed, target_language)
-        except ClientDisconnect:
-            if attempt < max_retries - 1:
-                logger.warning(f"Client disconnected. Retrying... (Attempt {attempt + 1}/{max_retries})")
-                await asyncio.sleep(1)  # Wait a bit before retrying
-            else:
-                logger.error("Max retries reached. Client repeatedly disconnected.")
-                return None, None
-        except Exception as e:
-            logger.error(f"An error occurred: {str(e)}")
-            return None, None
 async def respond(audio, model, seed, target_language):
-    start_time = time.time()
     try:
         if audio is None:
             return None, None
         user_input = transcribe(audio)
         if not user_input:
             return None, None
-        logger.info(f"Processing input: {user_input[:50]}...")  # Log the first 50 characters of input
         if user_input.lower().startswith("please translate"):
-            content_to_translate = user_input[len("please translate"):].strip()
-            translated_audio = translate_speech(audio, target_language)
-            logger.info(f"Translation completed in {time.time() - start_time:.2f} seconds")
             return None, translated_audio
         else:
             reply = models(user_input, model, seed)
@@ -189,10 +182,12 @@ async def respond(audio, model, seed, target_language):
             with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file:
                 tmp_path = tmp_file.name
                 await communicate.save(tmp_path)
-            logger.info(f"Voice assistant response generated in {time.time() - start_time:.2f} seconds")
             return tmp_path, None
     except Exception as e:
-        logger.error(f"An error occurred: {str(e)}")
         return None, None
 def clear_history():
@@ -237,7 +232,7 @@ with gr.Blocks(css="style.css") as demo:
             translated_audio = gr.Audio(label="Translated Audio", type="filepath", interactive=False, autoplay=True)
     input_audio.change(
-        fn=respond_with_retry,
         inputs=[input_audio, select, seed, target_lang],
         outputs=[output_audio, translated_audio],
     )
@@ -245,8 +240,4 @@ with gr.Blocks(css="style.css") as demo:
     clear_button.click(fn=clear_history, inputs=[], outputs=[output_audio, translated_audio])
 if __name__ == "__main__":
-    demo.queue(concurrency_count=5, max_size=20).launch(
-        share=True,
-        debug=True,
-        enable_queue=True,
-    )

         return output
async def translate_speech_with_timeout(audio_file, target_language, timeout=30):
    """Translate an audio file by running ``expressivity_predict`` with a time limit.

    Args:
        audio_file: Path of the input audio handed to the command. ``None``
            returns ``None`` immediately without starting a process.
        target_language: Key into ``LANGUAGE_CODES``; the mapped value is
            passed to the command as ``--tgt_lang``.
        timeout: Seconds to wait for the command to finish before killing it.

    Returns:
        Path of the generated ``.wav`` file, or ``None`` on failure (unknown
        language, timeout, non-zero exit status, or missing output file).
        Errors derived from ``Exception`` are printed instead of propagated.
    """
    # Function-scope import so this block does not depend on a file-level one.
    import uuid

    if audio_file is None:
        return None

    try:
        try:
            language_code = LANGUAGE_CODES[target_language]
        except KeyError:
            raise ValueError(
                f"Unsupported target language: {target_language!r}"
            ) from None

        # A random suffix keeps concurrent requests from writing to the same
        # file; a whole-second timestamp collides under parallel load.
        output_file = f"translated_audio_{uuid.uuid4().hex}.wav"
        command = [
            "expressivity_predict",
            audio_file,
            "--tgt_lang", language_code,
            "--model_name", "seamless_expressivity",
            "--vocoder_name", "vocoder_pretssel",
            "--gated-model-dir", "models",
            "--output_path", output_file,
        ]
        process = await asyncio.create_subprocess_exec(
            *command,
            stdout=asyncio.subprocess.PIPE,
            stderr=asyncio.subprocess.PIPE,
        )
        try:
            _, stderr = await asyncio.wait_for(process.communicate(), timeout=timeout)
        except asyncio.TimeoutError:
            try:
                process.kill()
            except ProcessLookupError:
                # The process exited between the timeout and the kill.
                pass
            # kill() only sends the signal; wait() reaps the child so it does
            # not linger as a zombie.
            await process.wait()
            raise RuntimeError("Translation process timed out") from None

        if process.returncode != 0:
            # errors="replace" so undecodable stderr bytes cannot mask the
            # real failure with a UnicodeDecodeError.
            details = stderr.decode(errors="replace")
            raise RuntimeError(f"Translation process failed: {details}")

        if not os.path.exists(output_file):
            raise RuntimeError(f"File not found: {output_file}")

        print(f"File created successfully: {output_file}")
        return output_file
    except Exception as e:
        # Best-effort boundary: the caller treats None as "no translation".
        print(f"Translation error: {str(e)}")
        return None
 async def respond(audio, model, seed, target_language):
     try:
         if audio is None:
             return None, None
         user_input = transcribe(audio)
         if not user_input:
             return None, None
         if user_input.lower().startswith("please translate"):
+            # Await the translation subprocess; the helper enforces a timeout
+            translated_audio = await translate_speech_with_timeout(audio, target_language)
             return None, translated_audio
         else:
             reply = models(user_input, model, seed)
             with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file:
                 tmp_path = tmp_file.name
                 await communicate.save(tmp_path)
             return tmp_path, None
+    except ClientDisconnect:
+        print("Client disconnected")
+        return None, None
     except Exception as e:
+        print(f"An error occurred: {str(e)}")
         return None, None
 def clear_history():
             translated_audio = gr.Audio(label="Translated Audio", type="filepath", interactive=False, autoplay=True)
     input_audio.change(
+        fn=respond,
         inputs=[input_audio, select, seed, target_lang],
         outputs=[output_audio, translated_audio],
     )
     clear_button.click(fn=clear_history, inputs=[], outputs=[output_audio, translated_audio])
 if __name__ == "__main__":
+    demo.queue(concurrency_count=5, max_size=20).launch()