Spaces:

DemahAlmutairi
/

AudioToAudio

Runtime error

App Files Files Community

AudioToAudio / app.py

DemahAlmutairi

Update app.py

7396b9d verified 3 months ago

raw

history blame contribute delete

1.78 kB

	import gradio as gr
	import whisper
	from transformers import pipeline
	from gtts import gTTS
	import os

	# Load the Whisper model from openai-whisper
	whisper_model = whisper.load_model("tiny")

	# Load the summarization model from Hugging Face
	summarizer = pipeline("summarization", model="facebook/bart-large-cnn")


	def summarize_audio(audio_path):
	# Step 1: Transcribe the uploaded audio file using Whisper
	transcription_result = whisper_model.transcribe(audio_path)
	transcription = transcription_result["text"]

	# Step 2: Summarize the transcribed text using a pre-trained summarization model
	summary = summarizer(transcription, max_length=50, min_length=25, do_sample=False)[0]['summary_text']

	# Step 3: Convert the summarized text into speech using the Hugging Face TTS model
	# Breakdown into multiple steps
	tts = gTTS(text=summary, lang='en') # Generate the TTS output
	tts.save("summarized_audio.wav")

	# Save the TTS audio to a file (WAV format)


	# Return the path to the saved summarized audio file
	return "summarized_audio.wav"

	# Gradio interface
	interface = gr.Interface(
	fn=summarize_audio, # The function to process the audio and return summarized audio
	inputs=gr.Audio(type="filepath", label="Upload your audio file"), # Accept audio file uploads, file path as input
	outputs=gr.File(label="Download Summarized Audio"), # Provide a downloadable summarized audio file
	title="Audio Summarizer", # Interface title
	description="Upload an audio file, and this tool will summarize it and generate a downloadable audio summary." , # Interface description
	examples=[["Classification_and_Regression_in_Machine_Learning.mp3"]]
	)

	# Launch the Gradio interface
	interface.launch(debug=True)