import sys import os from fastapi import Request # By using XTTS you agree to CPML license https://coqui.ai/cpml os.environ["COQUI_TOS_AGREED"] = "1" import gradio as gr from TTS.api import TTS from TTS.utils.manage import ModelManager # implemented torch cereal with milk for safe globals from TTS.tts.configs.xtts_config import XttsConfig from TTS.tts.models.xtts import XttsAudioConfig from TTS.config.shared_configs import BaseDatasetConfig from TTS.tts.models.xtts import XttsArgs import torch.serialization # torch.serialization.add_safe_globals([XttsConfig]) model_names = TTS().list_models() print(model_names.__dict__) print(model_names.__dir__()) model_name = "tts_models/multilingual/multi-dataset/xtts_v2" # using v2 #m = ModelManager().download_model(model_name) #print(m) m = model_name torch.serialization.add_safe_globals([XttsConfig, XttsAudioConfig, BaseDatasetConfig, XttsArgs]) tts = TTS(model_name, gpu=False) tts.to("cpu") # no GPU or Amd #tts.to("cuda") # cuda only def predict(prompt, language, audio_file_pth, mic_file_path, use_mic, agree, request: gr.Request): """ Due to the large number of abuses observed in the console logs, I have been forced to integrate the ‘display of additional information’ relating to the use of this space. I have been obliged to include a ‘display of additional information’ relating to the use of this area. As a reminder, sending illegal content (se*ual, offensive or threatening content) in any language is of course FORBIDDEN. language, is of course FORBIDDEN. I cannot be held responsible for those who violate a strictly [ETHICAL and MORAL] use of this space. use of this model. <- Glz's text not Deep50D's """ try: if request: print("Request obj:", request.__dict__) print("= = = = = = = = = = = =") print("Request headers dictionary:", request.headers) print("IP address:", request.client.host) try: print("Cookies:", request.__dict__.get("cookie")) except: print("no Cookies") print("Query parameters:", dict(request.query_params)) print() else: print("no such Request..") except Exception as e: print(e) if agree == True: if use_mic == True: if mic_file_path is not None: speaker_wav=mic_file_path else: gr.Warning("Please record your voice with Microphone, or uncheck Use Microphone to use reference audios") return ( None, #None, ) else: speaker_wav=audio_file_pth if len(prompt)<2: gr.Warning("Please give a longer prompt text") return ( # None, None, ) if len(prompt)>10000: gr.Warning("Text length limited to 10000 characters for this demo, please try shorter text") return ( # None, None, ) try: if language == "fr": if m.find("your") != -1: language = "fr-fr" if m.find("/fr/") != -1: language = None output_path = os.path.abspath("output.wav") # we use that absolute path now! tts.tts_to_file( text=prompt, file_path=output_path, speaker_wav=speaker_wav, language=language ) except RuntimeError as e : if "device-assert" in str(e): # cannot do anything on cuda device side error, need tor estart gr.Warning("Unhandled Exception encounter, please retry in a minute") print("Cuda device-assert Runtime encountered need restart") sys.exit("Exit due to cuda device-assert") else: raise e # better verify file exists before returning if not os.path.exists(output_path): gr.Warning("Audio file was not created successfully") return None return output_path # return that absolute path as string else: gr.Warning("Please accept the Terms & Condition!") return None title = "XTTS Deep50D's fixed Glz remake (Functional Text-to-Speech)" description = f"""
XTTS is a Voice generation model that lets you clone voices into different languages by using just a quick 3-second audio clip. XTTS is built on previous research, like Tortoise, with additional architectural innovations and training to make cross-language voice cloning and multilingual speech generation possible. This is the same model that powers our creator application Coqui Studio as well as the Coqui API. In production we apply modifications to make low-latency streaming possible. Leave a star on the Github TTS, where our open-source inference and training code lives.
For faster inference without waiting in the queue, you should duplicate this space.
Sending illegal content of any kind, in any language is, of course, FORBIDDEN. The authors of this space cannot be held responsible for those who violate the strictly [ETHICAL AND MORAL] use of this model.
Fixed stuff to make this thing work again and corrected some other things. Possibly still a bunch to fix or reinstate, or something like that xDeep50D
""" article = """By using this demo you agree to the terms of the Coqui Public Model License at https://coqui.ai/cpml