kennethli319 committed on
Commit
8bc1b1b
·
1 Parent(s): 1da77a0

update tts

Browse files
Files changed (1) hide show
  1. app.py +14 -2
app.py CHANGED
@@ -1,13 +1,25 @@
1
  import gradio as gr
 
 
 
 
 
2
 
3
  def greet(name):
4
  return "Hello " + name + "!!"
5
 
 
 
 
 
 
 
6
  def run():
7
  demo = gr.Interface(
8
  fn=greet,
9
- inputs="text",
10
- outputs="text",
 
11
  )
12
 
13
  demo.launch(server_name="0.0.0.0", server_port=7860)
 
1
  import gradio as gr
2
+ from nemo.collections.tts.models import FastPitchModel
3
+ from nemo.collections.tts.models import HifiGanModel
4
+
5
# Both pretrained checkpoints are loaded once, at import time, and kept as
# module-level objects. `spec_generator` is the FastPitch model and
# `tts_model` is the HiFi-GAN model.
spec_generator = FastPitchModel.from_pretrained(
    model_name="tts_en_fastpitch_multispeaker",
)
tts_model = HifiGanModel.from_pretrained(
    model_name="tts_en_hifitts_hifigan_ft_fastpitch",
)
7
 
8
  def greet(name):
9
  return "Hello " + name + "!!"
10
 
11
def generate_tts(text: str, speaker: int = 0):
    """Synthesize speech for ``text`` using the given speaker id.

    The text is parsed by ``spec_generator``, rendered to a spectrogram, and
    the spectrogram is then converted to audio by ``tts_model``.

    Args:
        text: The sentence to speak.
        speaker: Speaker id forwarded to the spectrogram model.

    Returns:
        The value produced by ``tts_model.convert_spectrogram_to_audio``,
        passed through unchanged.
    """
    if isinstance(speaker, float):
        # A UI widget such as a slider may deliver the id as a float; the id
        # is a discrete index, so normalize it to an int before use.
        speaker = int(speaker)
    tokens = spec_generator.parse(text)
    spectrogram = spec_generator.generate_spectrogram(tokens=tokens, speaker=speaker)
    return tts_model.convert_spectrogram_to_audio(spec=spectrogram)
16
+
17
  def run():
18
  demo = gr.Interface(
19
  fn=greet,
20
+ inputs=["text",
21
+ gr.Slider(4, 6, step=1)],
22
+ outputs="audio",
23
  )
24
 
25
  demo.launch(server_name="0.0.0.0", server_port=7860)