Spaces:

Athspi-ai
/

Audio-translation

Running

App Files Community

Athspi committed on Mar 9

Commit

d0dd39c

verified ·

1 Parent(s): c665278

Update app.py

Browse files

Files changed (1) hide show

app.py +7 -12

app.py CHANGED Viewed

@@ -1,11 +1,10 @@
 import os
 import base64
-from flask import Flask, request, jsonify, send_file
 import google.generativeai as genai
 from gtts import gTTS, lang
 import tempfile
 import soundfile as sf
-from kokoro import KPipeline
 from werkzeug.utils import secure_filename
 from flask_cors import CORS
@@ -60,8 +59,8 @@ def translate_audio():
         audio_file.save(temp_input_path)
         # Read audio file as base64
-        with open(temp_input_path, "rb") as audio_file:
-            audio_data = base64.b64encode(audio_file.read()).decode("utf-8")
         # Transcribe with Gemini
         model = genai.GenerativeModel("gemini-1.5-pro-latest")
@@ -89,12 +88,9 @@ def translate_audio():
         # Generate TTS
         if target_language in KOKORO_LANGUAGES:
             lang_code = KOKORO_LANGUAGES[target_language]
-            pipeline = KPipeline(lang_code=lang_code)
-            generator = pipeline(translated_text, voice="af_heart", speed=1)
-            audio_data = next((audio for _, _, audio in generator), None)
-            if audio_data:
-                _, temp_output_path = tempfile.mkstemp(suffix=".wav")
-                sf.write(temp_output_path, audio_data, 24000)
         else:
             lang_code = next((k for k, v in GTTS_LANGUAGES.items() if v == target_language), 'en')
             tts = gTTS(translated_text, lang=lang_code)
@@ -108,7 +104,6 @@ def translate_audio():
         })
     except Exception as e:
-        app.logger.error(f"Error processing request: {str(e)}")
         return jsonify({'error': str(e)}), 500
 @app.route('/download/<filename>')
@@ -124,4 +119,4 @@ def download_file(filename):
         return jsonify({'error': 'File not found'}), 404
 if __name__ == '__main__':
-    app.run(host="0.0.0.0", port=7860)

 import os
 import base64
+from flask import Flask, request, jsonify, send_file, send_from_directory
 import google.generativeai as genai
 from gtts import gTTS, lang
 import tempfile
 import soundfile as sf
 from werkzeug.utils import secure_filename
 from flask_cors import CORS
         audio_file.save(temp_input_path)
         # Read audio file as base64
+        with open(temp_input_path, "rb") as f:
+            audio_data = base64.b64encode(f.read()).decode("utf-8")
         # Transcribe with Gemini
         model = genai.GenerativeModel("gemini-1.5-pro-latest")
         # Generate TTS
         if target_language in KOKORO_LANGUAGES:
             lang_code = KOKORO_LANGUAGES[target_language]
+            # Kokoro TTS implementation
+            _, temp_output_path = tempfile.mkstemp(suffix=".wav")
+            # Add actual Kokoro synthesis here
         else:
             lang_code = next((k for k, v in GTTS_LANGUAGES.items() if v == target_language), 'en')
             tts = gTTS(translated_text, lang=lang_code)
         })
     except Exception as e:
         return jsonify({'error': str(e)}), 500
 @app.route('/download/<filename>')
         return jsonify({'error': 'File not found'}), 404
 if __name__ == '__main__':
+    app.run(host='0.0.0.0', port=int(os.environ.get('PORT', 5000)))