XTTS_V2_CPU_fixed

Running

App Files Community

Deep50D committed 8 days ago

Commit

6f98ffd

verified ·

1 Parent(s): 5549c65

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -18

app.py CHANGED Viewed

@@ -7,17 +7,19 @@ os.environ["COQUI_TOS_AGREED"] = "1"
 import gradio as gr
 from TTS.api import TTS
 from TTS.utils.manage import ModelManager
-# fixing current runtime errors
 from TTS.tts.configs.xtts_config import XttsConfig
 from TTS.tts.models.xtts import XttsAudioConfig
 from TTS.config.shared_configs import BaseDatasetConfig
 from TTS.tts.models.xtts import XttsArgs
 import torch.serialization
 # torch.serialization.add_safe_globals([XttsConfig])
 model_names = TTS().list_models()
 print(model_names.__dict__)
 print(model_names.__dir__())
-model_name = "tts_models/multilingual/multi-dataset/xtts_v2" # move in v2, since xtts_v1 is generated keyerror, I guess you can select it with old github's release.
 #m = ModelManager().download_model(model_name)
 #print(m)
@@ -33,7 +35,7 @@ def predict(prompt, language, audio_file_pth, mic_file_path, use_mic, agree, req
     I have been obliged to include a ‘display of additional information’ relating to the use of this area.
     As a reminder, sending illegal content (se*ual, offensive or threatening content) in any language is of course FORBIDDEN.
     language, is of course FORBIDDEN. I cannot be held responsible for those who violate a strictly [ETHICAL and MORAL] use of this space.
-    use of this model.
     """
     try:
@@ -112,30 +114,20 @@ def predict(prompt, language, audio_file_pth, mic_file_path, use_mic, agree, req
         gr.Warning("Please accept the Terms & Condition!")
         return None
-title = "XTTS D5D's remake of Glz's remake (Functional Text-2-Speech)"
 description = f"""
-<a href="https://huggingface.co/coqui/XTTS-v1">XTTS</a> is a Voice generation model that lets you clone voices into different languages by using just a quick 3-second audio clip.
-<br/>
 XTTS is built on previous research, like Tortoise, with additional architectural innovations and training to make cross-language voice cloning and multilingual speech generation possible.
-<br/>
 This is the same model that powers our creator application <a href="https://coqui.ai">Coqui Studio</a> as well as the <a href="https://docs.coqui.ai">Coqui API</a>. In production we apply modifications to make low-latency streaming possible.
-<br/>
-Leave a star on the Github <a href="https://github.com/coqui-ai/TTS">TTS</a>, where our open-source inference and training code lives.
-<br/>
-<p>For faster inference without waiting in the queue, you should duplicate this space and upgrade to GPU via the settings.
-<br/>
 <a href="https://huggingface.co/spaces/coqui/xtts?duplicate=true">
 <img style="margin-top: 0em; margin-bottom: 0em" src="https://bit.ly/3gLdBN6" alt="Duplicate Space"></a>
 </p>
 <p>
-<br>
-Due to the large number of abuses observed in the console's logs, ‘additional information’ on the use of this space has been added.
-<br>
 As a reminder, sending illegal content (se*ual, offensive or threatening content) in any language is, of course, FORBIDDEN.
-<br>
 The authors of this space cannot be held responsible for those who violate the strictly [ETHICAL AND MORAL] use of this model.
-<br>
 </p>
 """
@@ -251,7 +243,7 @@ gr.Interface(
         gr.Textbox(
             label="Text Prompt",
             info="One or two sentences at a time is better",
-            value="Hello, World !, here is an example of light voice cloning. Try to upload your best audio samples quality",
         ),
         gr.Dropdown(
             label="Language",

 import gradio as gr
 from TTS.api import TTS
 from TTS.utils.manage import ModelManager
 from TTS.tts.configs.xtts_config import XttsConfig
 from TTS.tts.models.xtts import XttsAudioConfig
 from TTS.config.shared_configs import BaseDatasetConfig
 from TTS.tts.models.xtts import XttsArgs
 import torch.serialization
 # torch.serialization.add_safe_globals([XttsConfig])
 model_names = TTS().list_models()
 print(model_names.__dict__)
 print(model_names.__dir__())
+model_name = "tts_models/multilingual/multi-dataset/xtts_v2" # using v2
 #m = ModelManager().download_model(model_name)
 #print(m)
     I have been obliged to include a ‘display of additional information’ relating to the use of this area.
     As a reminder, sending illegal content (se*ual, offensive or threatening content) in any language is of course FORBIDDEN.
     language, is of course FORBIDDEN. I cannot be held responsible for those who violate a strictly [ETHICAL and MORAL] use of this space.
+    use of this model. <- Glz's text not Deep50D's
     """
     try:
         gr.Warning("Please accept the Terms & Condition!")
         return None
+title = "XTTS Deep50D's remake of Glz's remake (Functional TTS)"
 description = f"""
+<p><a href="https://huggingface.co/coqui/XTTS-v1">XTTS</a> is a Voice generation model that lets you clone voices into different languages by using just a quick 3-second audio clip.
 XTTS is built on previous research, like Tortoise, with additional architectural innovations and training to make cross-language voice cloning and multilingual speech generation possible.
 This is the same model that powers our creator application <a href="https://coqui.ai">Coqui Studio</a> as well as the <a href="https://docs.coqui.ai">Coqui API</a>. In production we apply modifications to make low-latency streaming possible.
+Leave a star on the Github <a href="https://github.com/coqui-ai/TTS">TTS</a>, where our open-source inference and training code lives.</p>
+<p>For faster inference without waiting in the queue, you should duplicate this space.
 <a href="https://huggingface.co/spaces/coqui/xtts?duplicate=true">
 <img style="margin-top: 0em; margin-bottom: 0em" src="https://bit.ly/3gLdBN6" alt="Duplicate Space"></a>
 </p>
 <p>
 As a reminder, sending illegal content (se*ual, offensive or threatening content) in any language is, of course, FORBIDDEN.
 The authors of this space cannot be held responsible for those who violate the strictly [ETHICAL AND MORAL] use of this model.
 </p>
 """
         gr.Textbox(
             label="Text Prompt",
             info="One or two sentences at a time is better",
+            value="Hello, World! Here's an example of light voice cloning. Try to upload your best audio samples",
         ),
         gr.Dropdown(
             label="Language",