Spaces:

paulbauriegel
/

simple_whisper

Sleeping

paulbauriegel committed on May 15, 2023

Commit

e77e1d8

1 Parent(s): 3146b8d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -7,18 +7,13 @@ import whisperx
 model = WhisperModel('large-v2', device="cuda", compute_type="float16")
-def speech_to_text(mic=None, file=None, lang=None):
     if mic is not None:
         audio = mic
     elif file is not None:
         audio = file
     else:
         raise gr.Error("You must either provide a mic recording or a file")
-    if lang is None or lang == '':
-        lang = None
-    task = 'transcribe' if lang is None else 'translate'
     print(lang, task)
     time_start = time.time()
@@ -73,11 +68,11 @@ with gr.Blocks(title='Whisper Demo', theme=theme) as demo:
     translate_btn = gr.Button("Translate audio")
     trans_df = gr.DataFrame(label="Transcription dataframe", row_count=(0, "dynamic"), max_rows = 10, wrap=True, overflow_row_behaviour='paginate')
     sys_info = gr.Markdown("")
-    transcribe_btn.click(speech_to_text,
                                  [audio_in, file_in, drop_down],
                                  [trans_df, sys_info]
                                 )
-    translate_btn.click(speech_to_text,
                             [audio_in, file_in, drop_down],
                             [trans_df, sys_info])

 model = WhisperModel('large-v2', device="cuda", compute_type="float16")
+def speech_to_text(mic=None, file=None, lang=None, task='transcribe'):
     if mic is not None:
         audio = mic
     elif file is not None:
         audio = file
     else:
         raise gr.Error("You must either provide a mic recording or a file")
     print(lang, task)
     time_start = time.time()
     translate_btn = gr.Button("Translate audio")
     trans_df = gr.DataFrame(label="Transcription dataframe", row_count=(0, "dynamic"), max_rows = 10, wrap=True, overflow_row_behaviour='paginate')
     sys_info = gr.Markdown("")
+    transcribe_btn.click(lambda x, y, z: speech_to_text(x, y, None, 'transcribe'),  # three inputs are wired below, so the callback must accept three args; z (drop_down) is received but not forwarded
                                  [audio_in, file_in, drop_down],
                                  [trans_df, sys_info]
                                 )
+    translate_btn.click(lambda x, y, z: speech_to_text(x, y, None, 'translate'),  # same wiring as above; only the task differs
                             [audio_in, file_in, drop_down],
                             [trans_df, sys_info])