GetmanY1 committed on
Commit
cf20a06
·
1 Parent(s): 7e6e084

Fix audio loading script

Browse files
Files changed (2) hide show
  1. app.py +8 -2
  2. requirements.txt +3 -1
app.py CHANGED
@@ -1,9 +1,15 @@
1
  import gradio as gr
2
  from transformers import pipeline
3
- from librosa import load
4
 
5
  def transcribe(input_audio):
6
- speech, _ = load(input_audio, sr=16000, mono=True)
 
 
 
 
 
 
7
  output = pipe(speech, chunk_length_s=30, stride_length_s=5)['text']
8
  return output
9
 
 
1
  import gradio as gr
2
  from transformers import pipeline
3
+ from librosa import resample
4
 
5
  def transcribe(input_audio):
6
+ sr, speech = input_audio
7
+ # Convert to mono if stereo
8
+ if speech.ndim > 1:
9
+ speech = speech.mean(axis=1)
10
+ # Resample if sampling rate is not 16kHz
11
+ if sr!=16000:
12
+ speech = librosa.resample(speech, orig_sr=sr, target_sr=16000)
13
  output = pipe(speech, chunk_length_s=30, stride_length_s=5)['text']
14
  return output
15
 
requirements.txt CHANGED
@@ -1,3 +1,5 @@
1
  transformers
2
  torch
3
- librosa
 
 
 
1
  transformers
2
  torch
3
+ librosa
4
+ samplerate
5
+ resampy