File size: 3,201 Bytes
d40e945
 
14c2908
 
 
 
16a9bac
 
14c2908
a7baba5
a5ea363
ec4baac
52c8671
15e3a1c
53dabb2
d4caa8b
d40e945
 
46161b4
e7d48ce
d40e945
01c46b8
d40e945
8851b82
01c46b8
c6b23cd
d40e945
 
5d5cc81
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
20c912c
5d5cc81
 
 
 
 
 
ec4baac
 
5d5cc81
 
 
 
 
 
 
a6bdce7
 
5d5cc81
d40e945
 
 
 
 
 
 
 
 
14c9322
d40e945
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
# Leaderboard roster, keyed by display name with a short model identifier as
# the value. Only models that users can vote on belong here; the commented-out
# entries below are not part of the mapping.
AVAILABLE_MODELS = {
    "ElevenLabs": "eleven",
    "Play.HT 2.0": "playht",
    "StyleTTS 2": "styletts2",
    "Parler TTS Large": "parlerlarge",
    # "Kokoro v0.19": "kokoro0.19",
    # "Kokoro v1.0": "kokorov1",
    "CosyVoice 2.0": "cosyvoice",
    "PlayDialog 1.0": "playdialogv1",
    "Papla P1": "papla",
    "Hume Octave": "hume",
    # "Fish Speech v1.5": "anonymousfish",
    # "MeloTTS": "melo",
    # "PlayDialog": "playdialog",
    # "XTTSv2": "xtts",
    # "WhisperSpeech": "whisperspeech",
    # "OpenVoice": "openvoice",
    # "OpenVoice V2": "openvoicev2",
    # "Play.HT 3.0 Mini": "playht3",
    # "MetaVoice": "metavoice",
    # "GPT-SoVITS": "sovits",
    # "Vokan TTS": "vokan",
    # "VoiceCraft 2.0": "voicecraft",
    # "Parler TTS": "parler",
    # "Fish Speech v1.4": "fish",
}

# Homepage or repository URL for each model, keyed by display name.
# Also holds entries for models that are not currently active in
# AVAILABLE_MODELS.
model_links = {
    'ElevenLabs': 'https://elevenlabs.io/',
    'Play.HT 2.0': 'https://play.ht/',
    'Play.HT 3.0 Mini': 'https://play.ht/',
    'XTTSv2': 'https://huggingface.co/coqui/XTTS-v2',
    'MeloTTS': 'https://github.com/myshell-ai/MeloTTS',
    'StyleTTS 2': 'https://github.com/yl4579/StyleTTS2',
    'Parler TTS Large': 'https://github.com/huggingface/parler-tts',
    'Parler TTS': 'https://github.com/huggingface/parler-tts',
    'Fish Speech v1.5': 'https://github.com/fishaudio/fish-speech',
    'Fish Speech v1.4': 'https://github.com/fishaudio/fish-speech',
    'GPT-SoVITS': 'https://github.com/RVC-Boss/GPT-SoVITS',
    'WhisperSpeech': 'https://github.com/WhisperSpeech/WhisperSpeech',
    'VoiceCraft 2.0': 'https://github.com/jasonppy/VoiceCraft',
    'PlayDialog': 'https://play.ht/',
    # The votable entry in AVAILABLE_MODELS uses the versioned display name,
    # so it needs its own key; without it that model has no link here.
    'PlayDialog 1.0': 'https://play.ht/',
    'Kokoro v0.19': 'https://huggingface.co/hexgrad/Kokoro-82M',
    'Kokoro v1.0': 'https://huggingface.co/hexgrad/Kokoro-82M',
    'CosyVoice 2.0': 'https://github.com/FunAudioLLM/CosyVoice',
    'MetaVoice': 'https://github.com/metavoiceio/metavoice-src',
    'OpenVoice': 'https://github.com/myshell-ai/OpenVoice',
    'OpenVoice V2': 'https://github.com/myshell-ai/OpenVoice',
    'Pheme': 'https://github.com/PolyAI-LDN/pheme',
    'Vokan TTS': 'https://huggingface.co/ShoukanLabs/Vokan',
    'Papla P1': 'https://papla.media',
    'Hume Octave': 'https://www.hume.ai',
}

# Display names of the models that are marked as closed source.
closed_source = [
    'ElevenLabs',
    'Play.HT 2.0',
    'Play.HT 3.0 Mini',
    'PlayDialog',
    # Versioned display name used by the votable entry in AVAILABLE_MODELS;
    # listed so that entry is matched the same way as 'PlayDialog'.
    'PlayDialog 1.0',
    'Papla P1',
    'Hume Octave',
]

# Lookup from short model identifier to human-readable model name.
# This table may also list models that users cannot vote on.
model_names = {
    "styletts2": "StyleTTS 2",
    "tacotron": "Tacotron",
    "tacotronph": "Tacotron Phoneme",
    "tacotrondca": "Tacotron DCA",
    "speedyspeech": "Speedy Speech",
    "overflow": "Overflow TTS",
    "anonymoussparkle": "Anonymous Sparkle",
    "vits": "VITS",
    "vitsneon": "VITS Neon",
    "neuralhmm": "Neural HMM",
    "glow": "Glow TTS",
    "fastpitch": "FastPitch",
    "jenny": "Jenny",
    "tortoise": "Tortoise TTS",
    "xtts2": "Coqui XTTSv2",
    "xtts": "Coqui XTTS",
    "openvoice": "MyShell OpenVoice",
    "elevenlabs": "ElevenLabs",
    "openai": "OpenAI",
    "hierspeech": "HierSpeech++",
    "pheme": "PolyAI Pheme",
    "speecht5": "SpeechT5",
    "metavoice": "MetaVoice-1B",
}