Spaces:

tdurzynski
/

automatic-speech-recognition

Sleeping

tdurzynski committed on May 19, 2024

Commit

f28ce48

verified ·

1 Parent(s): b7aaa7f

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,46 +1,31 @@
 from transformers import pipeline
 import gradio as gr
 asr = pipeline(task="automatic-speech-recognition",
                model="./models/distil-whisper/distil-small.en")
-demo = gr.Blocks()
 def transcribe_long_form(filepath):
     if filepath is None:
-        gr.Warning("No audio found, please retry.")
-        return ""
-    output = asr(
-      filepath,
-      max_new_tokens=256,
-      chunk_length_s=30,
-      batch_size=8,
-    )
-    return output["text"]
-mic_transcribe = gr.Interface(
-    fn=transcribe_long_form,
-    inputs=gr.Audio(sources="microphone",
-                    type="filepath"),
-    outputs=gr.Textbox(label="Transcription",
-                       lines=3),
-    allow_flagging="never")
-file_transcribe = gr.Interface(
-    fn=transcribe_long_form,
-    inputs=gr.Audio(sources="upload",
-                    type="filepath"),
-    outputs=gr.Textbox(label="Transcription",
-                       lines=3),
-    allow_flagging="never",
-)
-with demo:
-    gr.TabbedInterface(
-        [mic_transcribe,
-         file_transcribe],
-        ["Transcribe Microphone",
-         "Transcribe Audio File"],
-    )
-demo.launch(share=True,
-            server_port=int(os.environ['PORT1']))

 from transformers import pipeline
 import gradio as gr
+import os
+# Load the ASR model
 asr = pipeline(task="automatic-speech-recognition",
                model="./models/distil-whisper/distil-small.en")
+# Define the transcription function
 def transcribe_long_form(filepath):
     if filepath is None:
+        return "No audio file provided, please upload a file or record one."
+    output = asr(filepath)
+    return output['text']
+# Set up the Gradio interface
+with gr.Blocks() as demo:
+    with gr.Tab("Transcribe Audio"):
+        with gr.Row():
+            audio_input = gr.Audio(sources=["microphone", "upload"], type="filepath")
+            submit_button = gr.Button("Transcribe")
+        transcription_output = gr.Textbox(label="Transcription", lines=3)
+        submit_button.click(
+            transcribe_long_form,
+            inputs=[audio_input],
+            outputs=[transcription_output]
+        )
+# Launch the Gradio app
+demo.launch(share=True, server_port=int(os.environ.get('PORT1', 7860)))  # Default port 7860 if PORT1 is not set