Scribe_Transcription_Demo_2

Running

App Files Community

MrSimple07 committed on Mar 15

Commit

73f6d14

verified ·

1 Parent(s): fb7ca39

Update app.py

Browse files

Files changed (1) hide show

app.py +1 -59

app.py CHANGED Viewed

@@ -3,42 +3,10 @@ import gradio as gr
 import requests
 import json
 from moviepy import VideoFileClip
-import yt_dlp
 import uuid
 ELEVENLABS_API_KEY = os.environ.get("ELEVENLABS_API_KEY", None)
-def download_video_from_url(url):
-    try:
-        # Generate a unique filename
-        filename = f"downloaded_video_{uuid.uuid4().hex[:8]}.mp4"
-        # Configure yt-dlp options without browser cookies
-        ydl_opts = {
-            'format': 'bestvideo[ext=mp4]+bestaudio[ext=m4a]/mp4',
-            'outtmpl': filename,
-            'quiet': True,
-            'no_warnings': True,
-            'ignoreerrors': True,
-            'nocheckcertificate': True,
-            'extractor_args': {'youtube': {'skip': ['webpage']}},  # Skip webpage verification
-            'extractor_retries': 3,
-            # Add more formats as fallbacks
-            'merge_output_format': 'mp4',
-        }
-        # Download the video
-        with yt_dlp.YoutubeDL(ydl_opts) as ydl:
-            ydl.download([url])
-        if os.path.exists(filename) and os.path.getsize(filename) > 0:
-            return filename, None
-        else:
-            return None, "Failed to download video. Try providing a direct video URL instead of YouTube."
-    except Exception as e:
-        return None, f"Error downloading video: {str(e)}"
 def extract_audio(video_path, output_format="mp3"):
     if not video_path:
         return None, "No video provided"
@@ -47,7 +15,6 @@ def extract_audio(video_path, output_format="mp3"):
     try:
         video = VideoFileClip(video_path)
-        # Remove the verbose parameter that's causing issues
         video.audio.write_audiofile(output_path, logger=None)
         video.close()
         return output_path, f"Audio extracted successfully"
@@ -57,8 +24,6 @@ def extract_audio(video_path, output_format="mp3"):
 def save_transcription(transcription):
     if "error" in transcription:
         return None, transcription["error"]
-    # Create a filename for the transcription
     transcript_filename = f"transcription_{uuid.uuid4().hex[:8]}.txt"
     try:
@@ -86,15 +51,11 @@ def process_video_url(video_url, output_format, api_key, model_id):
     if not video_url.strip():
         return None, "Please enter a video URL", None, "No URL provided"
-    # Download the video
     video_path, error = download_video_from_url(video_url)
     if error:
         return None, error, None, "Video download failed, cannot transcribe"
-    # Extract audio from the downloaded video
-    audio_path, message = extract_audio(video_path, output_format)
-    # Clean up the downloaded video
     if video_path and os.path.exists(video_path):
         try:
             os.remove(video_path)
@@ -167,25 +128,6 @@ with gr.Blocks(title="Video to Audio to Transcription") as app:
                 inputs=[video_input, format_choice_file, api_key, model_id],
                 outputs=[audio_output_file, status_output_file, transcript_file_output, transcript_status_output]
             )
-        with gr.TabItem("Video URL"):
-            with gr.Row():
-                with gr.Column():
-                    url_input = gr.Textbox(label="Video URL (YouTube, etc.)", placeholder="https://www.youtube.com/watch?v=...")
-                    format_choice_url = gr.Radio(["mp3", "wav"], value="mp3", label="Output Format")
-                    extract_button_url = gr.Button("Extract Audio & Transcribe")
-                with gr.Column():
-                    audio_output_url = gr.Audio(label="Extracted Audio", type="filepath")
-                    status_output_url = gr.Textbox(label="Audio Extraction Status")
-                    transcript_file_output_url = gr.File(label="Transcription Text File")
-                    transcript_status_output_url = gr.Textbox(label="Transcription Status")
-            extract_button_url.click(
-                fn=process_video_url,
-                inputs=[url_input, format_choice_url, api_key, model_id],
-                outputs=[audio_output_url, status_output_url, transcript_file_output_url, transcript_status_output_url]
-            )
 if __name__ == "__main__":
     app.launch()

 import requests
 import json
 from moviepy import VideoFileClip
 import uuid
 ELEVENLABS_API_KEY = os.environ.get("ELEVENLABS_API_KEY", None)
 def extract_audio(video_path, output_format="mp3"):
     if not video_path:
         return None, "No video provided"
     try:
         video = VideoFileClip(video_path)
         video.audio.write_audiofile(output_path, logger=None)
         video.close()
         return output_path, f"Audio extracted successfully"
 def save_transcription(transcription):
     if "error" in transcription:
         return None, transcription["error"]
     transcript_filename = f"transcription_{uuid.uuid4().hex[:8]}.txt"
     try:
     if not video_url.strip():
         return None, "Please enter a video URL", None, "No URL provided"
     video_path, error = download_video_from_url(video_url)
     if error:
         return None, error, None, "Video download failed, cannot transcribe"
+    audio_path, message = extract_audio(video_path, output_format)
     if video_path and os.path.exists(video_path):
         try:
             os.remove(video_path)
                 inputs=[video_input, format_choice_file, api_key, model_id],
                 outputs=[audio_output_file, status_output_file, transcript_file_output, transcript_status_output]
             )
 if __name__ == "__main__":
     app.launch()