speech-to-speech-translation

Sleeping

PhysHunter committed on Aug 20, 2023

Commit

748ad62

1 Parent(s): ee3d3d0

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,7 +1,6 @@
 import gradio as gr
 import numpy as np
 import torch
-from datasets import load_dataset
 from transformers import VitsModel, VitsTokenizer, pipeline
 device = "cuda:0" if torch.cuda.is_available() else "cpu"
@@ -33,7 +32,7 @@ def speech_to_speech_translation(audio):
     return 16000, synthesised_speech
-# title = "Cascaded STST"
 # description = """
 # Demo for cascaded speech-to-speech translation (STST), mapping from source speech in any language to target speech in French. Demo uses OpenAI's [Whisper Base](https://huggingface.co/openai/whisper-base) model for speech translation, and Facebook's
 # [MMS TTS](https://huggingface.co/facebook/mms-tts) model for text-to-speech:
@@ -47,7 +46,7 @@ mic_translate = gr.Interface(
     inputs=gr.Audio(source="microphone", type="filepath"),
     outputs=gr.Audio(label="Generated Speech", type="numpy"),
     title=title,
-    description=description,
 )
 file_translate = gr.Interface(
@@ -56,7 +55,7 @@ file_translate = gr.Interface(
     outputs=gr.Audio(label="Generated Speech", type="numpy"),
     examples=[["./example.wav"]],
     title=title,
-    description=description,
 )
 with demo:

 import gradio as gr
 import numpy as np
 import torch
 from transformers import VitsModel, VitsTokenizer, pipeline
 device = "cuda:0" if torch.cuda.is_available() else "cpu"
     return 16000, synthesised_speech
+title = "Cascaded STST"
 # description = """
 # Demo for cascaded speech-to-speech translation (STST), mapping from source speech in any language to target speech in French. Demo uses OpenAI's [Whisper Base](https://huggingface.co/openai/whisper-base) model for speech translation, and Facebook's
 # [MMS TTS](https://huggingface.co/facebook/mms-tts) model for text-to-speech:
     inputs=gr.Audio(source="microphone", type="filepath"),
     outputs=gr.Audio(label="Generated Speech", type="numpy"),
     title=title,
+    #description=description,
 )
 file_translate = gr.Interface(
     outputs=gr.Audio(label="Generated Speech", type="numpy"),
     examples=[["./example.wav"]],
     title=title,
+    #description=description,
 )
 with demo: