Spaces:

Athspi-ai
/

AutoSubGen

Running

Athspi committed on Mar 11

Commit

00d9ff4

verified ·

1 Parent(s): 4620e6c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -13,7 +13,7 @@ logging.getLogger("moviepy").setLevel(logging.ERROR)
 # Configure Gemini API
 genai.configure(api_key=os.environ["GEMINI_API_KEY"])
-model = genai.GenerativeModel("gemini-2.0-pro-exp-02-05")
 # Supported languages
 SUPPORTED_LANGUAGES = [
@@ -46,6 +46,13 @@ ORIGINAL:
 TRANSLATED:"""
 def split_audio(audio_path, chunk_duration=60):
     """Split audio into smaller chunks (default: 60 seconds)"""
     audio = AudioSegment.from_wav(audio_path)
@@ -140,8 +147,18 @@ def create_srt(subtitles_text):
     return "\n".join(srt_output)
 def process_video(video_path, source_lang, target_lang):
     """Complete processing pipeline"""
     try:
         # Extract audio
         audio_path = extract_audio(video_path)
@@ -178,7 +195,7 @@ def process_video(video_path, source_lang, target_lang):
         print(f"Processing error: {str(e)}")
         return None, None
     finally:
-        if os.path.exists(audio_path):
             os.remove(audio_path)
 # Gradio Interface

 # Configure Gemini API
 genai.configure(api_key=os.environ["GEMINI_API_KEY"])
+model = genai.GenerativeModel("gemini-2.0-flash-exp")
 # Supported languages
 SUPPORTED_LANGUAGES = [
 TRANSLATED:"""
+def extract_audio(video_path):
+    """Extract high-quality audio from video"""
+    video = VideoFileClip(video_path)
+    audio_path = os.path.join(tempfile.gettempdir(), "extracted_audio.wav")
+    video.audio.write_audiofile(audio_path, fps=44100, nbytes=2, codec='pcm_s16le')
+    return audio_path
 def split_audio(audio_path, chunk_duration=60):
     """Split audio into smaller chunks (default: 60 seconds)"""
     audio = AudioSegment.from_wav(audio_path)
     return "\n".join(srt_output)
+def translate_subtitles(subtitles, target_lang):
+    """Translate subtitles while preserving timestamps"""
+    prompt = TRANSLATION_PROMPT.format(
+        target_language=target_lang,
+        subtitles=subtitles
+    )
+    response = model.generate_content(prompt)
+    return response.text
 def process_video(video_path, source_lang, target_lang):
     """Complete processing pipeline"""
+    audio_path = None
     try:
         # Extract audio
         audio_path = extract_audio(video_path)
         print(f"Processing error: {str(e)}")
         return None, None
     finally:
+        if audio_path and os.path.exists(audio_path):
             os.remove(audio_path)
 # Gradio Interface