Spaces:

rimelabs
/

ivr

Runtime error

App Files Files Community

isdanni committed on May 2, 2024

Commit

972af1f

1 Parent(s): 32fc60a

Add optional sampling rate

Browse files

Files changed (1) hide show

app.py +11 -6

app.py CHANGED Viewed

@@ -2,6 +2,7 @@ import base64
 import random
 import requests
 import gradio as gr
 SCHEDULE_ME = [
     "Hi there, I'm Grant. And I'm on a mission to make local businesses shine.",
@@ -506,7 +507,7 @@ RIME_TEXTS = SCHEDULE_ME + SUPERSIZED + MONOPOLY
 RIME_SPEAKERS = ["marsh", "bayou", "creek", "brook", "flower", "spore", "glacier", "gulch", "alpine", "cove", "lagoon", "tundra", "steppe", "mesa", "grove", "rainforest", "moraine", "wildflower", "peak", "boulder"]
 MONOPOLY_SPEAKERS = ["alexis", "audrey", "hannah", "julie", "danielle", "breanna", "jeremy", "ronnie"]
-def synthesize(key, text, speakers_must, speed, request: gr.Request):
     print("Requesting user: ", request.username)
     monopoly_sids = MONOPOLY_SPEAKERS
     rime_sids = RIME_SPEAKERS
@@ -530,13 +531,14 @@ def synthesize(key, text, speakers_must, speed, request: gr.Request):
     sids = sids_random + sids_must
     print(sids)
     headers = {"Authorization": "Api-Key {}".format(key)}
     for i in range(N):
         json_data = {
             "text": text.lower(),
             "speaker": sids[i],
             "modelId": "mist",
-            "speedAlpha": speed
         }
         print(json_data)
         response = requests.post(
@@ -556,13 +558,16 @@ gradio_app = gr.Interface(
     fn=synthesize,
     inputs=[
         gr.Textbox(
-            type="password", info="This is where you put your Rime TTS API key that was given to you by our team."
         ),
         gr.Textbox(
-            info="Enter the text you want synthesized here. If empty, will populate with a sentence at random."
         ),
         gr.Textbox(
-            info="Include speakers that you like, they will stay in the output, comma separated, for example: 'river,oak'"
         ),
         gr.Slider(0.8, 1.2, value=1, label="Speed, higher is slower."),
     ],

 import random
 import requests
 import gradio as gr
+import samplerate
 SCHEDULE_ME = [
     "Hi there, I'm Grant. And I'm on a mission to make local businesses shine.",
 RIME_SPEAKERS = ["marsh", "bayou", "creek", "brook", "flower", "spore", "glacier", "gulch", "alpine", "cove", "lagoon", "tundra", "steppe", "mesa", "grove", "rainforest", "moraine", "wildflower", "peak", "boulder"]
 MONOPOLY_SPEAKERS = ["alexis", "audrey", "hannah", "julie", "danielle", "breanna", "jeremy", "ronnie"]
+def synthesize(key, text, speakers_must, sampling_rate, speed, request: gr.Request):
     print("Requesting user: ", request.username)
     monopoly_sids = MONOPOLY_SPEAKERS
     rime_sids = RIME_SPEAKERS
     sids = sids_random + sids_must
     print(sids)
     headers = {"Authorization": "Api-Key {}".format(key)}
     for i in range(N):
         json_data = {
             "text": text.lower(),
             "speaker": sids[i],
             "modelId": "mist",
+            "speedAlpha": speed,
+            "samplingRate": int(sampling_rate) if len(sampling_rate) > 0 else sampling_rate
         }
         print(json_data)
         response = requests.post(
     fn=synthesize,
     inputs=[
         gr.Textbox(
+            label="Key", type="password", info="This is where you put your Rime TTS API key that was given to you by our team."
+        ),
+        gr.Textbox(
+            label="[Optional] Text", info="Enter the text you want synthesized here. If empty, will populate with a sentence at random."
         ),
         gr.Textbox(
+            label="[Optional] Speakers", info="Include speakers that you like, they will stay in the output, comma separated, for example: 'river,oak'"
         ),
         gr.Textbox(
+            label="[Optional] Sampling Rate", info="Default value is 22050"
         ),
         gr.Slider(0.8, 1.2, value=1, label="Speed, higher is slower."),
     ],