speech-to-speech-translation

Sleeping

PhysHunter committed on Aug 20, 2023

Commit

b584d69

1 Parent(s): 748ad62

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -33,11 +33,11 @@ def speech_to_speech_translation(audio):
 title = "Cascaded STST"
-# description = """
-# Demo for cascaded speech-to-speech translation (STST), mapping from source speech in any language to target speech in French. Demo uses OpenAI's [Whisper Base](https://huggingface.co/openai/whisper-base) model for speech translation, and Facebook's
-# [MMS TTS](https://huggingface.co/facebook/mms-tts) model for text-to-speech:
-# ![Cascaded STST](https://huggingface.co/datasets/huggingface-course/audio-course-images/resolve/main/s2st_cascaded.png "Diagram of cascaded speech to speech translation")
-# """
 demo = gr.Blocks()
@@ -45,8 +45,9 @@ mic_translate = gr.Interface(
     fn=speech_to_speech_translation,
     inputs=gr.Audio(source="microphone", type="filepath"),
     outputs=gr.Audio(label="Generated Speech", type="numpy"),
     title=title,
-    #description=description,
 )
 file_translate = gr.Interface(
@@ -55,7 +56,7 @@ file_translate = gr.Interface(
     outputs=gr.Audio(label="Generated Speech", type="numpy"),
     examples=[["./example.wav"]],
     title=title,
-    #description=description,
 )
 with demo:

 title = "Cascaded STST"
+description = """
+Demo for cascaded speech-to-speech translation (STST), mapping from source speech in any language to target speech in French. Demo uses OpenAI's [Whisper Base](https://huggingface.co/openai/whisper-base) model for speech translation, and Facebook's
+[MMS TTS](https://huggingface.co/facebook/mms-tts) model for text-to-speech:
+![Cascaded STST](https://huggingface.co/datasets/huggingface-course/audio-course-images/resolve/main/s2st_cascaded.png "Diagram of cascaded speech to speech translation")
+"""
 demo = gr.Blocks()
     fn=speech_to_speech_translation,
     inputs=gr.Audio(source="microphone", type="filepath"),
     outputs=gr.Audio(label="Generated Speech", type="numpy"),
+    examples=[["./example.wav"]],
     title=title,
+    description=description,
 )
 file_translate = gr.Interface(
     outputs=gr.Audio(label="Generated Speech", type="numpy"),
     examples=[["./example.wav"]],
     title=title,
+    description=description,
 )
 with demo: