Spaces:

deepakkumar07
/

whisper-small-demo

Sleeping

deepakkumar07 committed on Mar 12

Commit

0ce1e34

verified ·

1 Parent(s): 2fad513

added model name param

Files changed (1) hide show

app.py CHANGED Viewed

@@ -7,15 +7,15 @@ pipe = pipeline(task="automatic-speech-recognition",
                 model="openai/whisper-small",
                 device="cuda" if torch.cuda.is_available() else "cpu")
-# Initialize the pipeline with the selected model
 def initialize_pipeline(model_name):
-    # Placeholder for the actual pipeline initialization
     return model_name
-def transcribe(audio, model_name):
-    pipe.model = model_name
     text = pipe(audio)["text"]
     return text
@@ -31,7 +31,6 @@ interface = gr.Interface(
 with gr.Blocks() as interface:
     # Dropdown to select the model
     model_dropdown = gr.Dropdown(choices=models, value=models[0], label="Select Model")
     # Audio input component
     audio_input = gr.Audio(sources=["microphone", "upload"], type="filepath", label="Upload or Record Audio")
     # Text output component
@@ -41,8 +40,7 @@ with gr.Blocks() as interface:
     # Event listener to initialize the pipeline when the model is selected
     model_dropdown.change(fn=initialize_pipeline, inputs=model_dropdown, outputs=None)
     # Event listener to transcribe the audio when the button is clicked
-    transcribe_button.click(fn=transcribe, inputs=[audio_input, model_dropdown], outputs=text_output)
-    # Event listener to show the download button when audio is uploaded or recorded
 if __name__ == "__main__":
     interface.launch()

                 model="openai/whisper-small",
                 device="cuda" if torch.cuda.is_available() else "cpu")
 def initialize_pipeline(model_name):
+    global pipe
+    pipe = pipeline(task="automatic-speech-recognition",
+                model=model_name,
+                device="cuda" if torch.cuda.is_available() else "cpu")
     return model_name
+def transcribe(audio):
     text = pipe(audio)["text"]
     return text
 with gr.Blocks() as interface:
     # Dropdown to select the model
     model_dropdown = gr.Dropdown(choices=models, value=models[0], label="Select Model")
     # Audio input component
     audio_input = gr.Audio(sources=["microphone", "upload"], type="filepath", label="Upload or Record Audio")
     # Text output component
     # Event listener to initialize the pipeline when the model is selected
     model_dropdown.change(fn=initialize_pipeline, inputs=model_dropdown, outputs=None)
     # Event listener to transcribe the audio when the button is clicked
+    transcribe_button.click(fn=transcribe, inputs=[audio_input], outputs=text_output)
 if __name__ == "__main__":
     interface.launch()