Spaces:
Build error
Build error
积极的屁孩
committed on
Commit
·
fbb3473
1
Parent(s):
b4485a3
adjustments
Browse files
app.py
CHANGED
@@ -628,24 +628,34 @@ def vevo_tts(text, ref_wav, timbre_ref_wav=None, src_language="en", ref_language
|
|
628 |
# 创建Gradio界面
|
629 |
with gr.Blocks(title="VEVO DEMO") as demo:
|
630 |
gr.Markdown("# VEVO DEMO")
|
631 |
-
gr.Markdown("## Controllable Zero-Shot Voice Conversion and Style Transfer")
|
632 |
|
633 |
with gr.Tab("Vevo-Timbre"):
|
634 |
gr.Markdown("### Vevo-Timbre: Maintain style but transfer timbre")
|
635 |
with gr.Row():
|
636 |
with gr.Column():
|
637 |
-
timbre_content = gr.Audio(label="Content Audio", type="numpy")
|
638 |
timbre_reference = gr.Audio(label="Timbre Reference", type="numpy")
|
639 |
timbre_button = gr.Button("Generate")
|
640 |
with gr.Column():
|
641 |
timbre_output = gr.Audio(label="Result")
|
642 |
timbre_button.click(vevo_timbre, inputs=[timbre_content, timbre_reference], outputs=timbre_output)
|
643 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
644 |
with gr.Tab("Vevo-Voice"):
|
645 |
gr.Markdown("### Vevo-Voice: Transfers both style and timbre with separate references")
|
646 |
with gr.Row():
|
647 |
with gr.Column():
|
648 |
-
voice_content = gr.Audio(label="Content Audio", type="numpy")
|
649 |
voice_style_reference = gr.Audio(label="Style Reference", type="numpy")
|
650 |
voice_timbre_reference = gr.Audio(label="Timbre Reference", type="numpy")
|
651 |
voice_button = gr.Button("Generate")
|
@@ -653,16 +663,7 @@ with gr.Blocks(title="VEVO DEMO") as demo:
|
|
653 |
voice_output = gr.Audio(label="Result")
|
654 |
voice_button.click(vevo_voice, inputs=[voice_content, voice_style_reference, voice_timbre_reference], outputs=voice_output)
|
655 |
|
656 |
-
|
657 |
-
gr.Markdown("### Vevo-Style: Maintain timbre but transfer style (accent, emotion, etc.)")
|
658 |
-
with gr.Row():
|
659 |
-
with gr.Column():
|
660 |
-
style_content = gr.Audio(label="Content Audio", type="numpy")
|
661 |
-
style_reference = gr.Audio(label="Style Reference", type="numpy")
|
662 |
-
style_button = gr.Button("Generate")
|
663 |
-
with gr.Column():
|
664 |
-
style_output = gr.Audio(label="Result")
|
665 |
-
style_button.click(vevo_style, inputs=[style_content, style_reference], outputs=style_output)
|
666 |
|
667 |
with gr.Tab("Vevo-TTS"):
|
668 |
gr.Markdown("### Vevo-TTS: Text-to-speech with separate style and timbre references")
|
|
|
628 |
# 创建Gradio界面
|
629 |
with gr.Blocks(title="VEVO DEMO") as demo:
|
630 |
gr.Markdown("# VEVO DEMO")
|
|
|
631 |
|
632 |
with gr.Tab("Vevo-Timbre"):
|
633 |
gr.Markdown("### Vevo-Timbre: Maintain style but transfer timbre")
|
634 |
with gr.Row():
|
635 |
with gr.Column():
|
636 |
+
timbre_content = gr.Audio(label="Source Audio", type="numpy")
|
637 |
timbre_reference = gr.Audio(label="Timbre Reference", type="numpy")
|
638 |
timbre_button = gr.Button("Generate")
|
639 |
with gr.Column():
|
640 |
timbre_output = gr.Audio(label="Result")
|
641 |
timbre_button.click(vevo_timbre, inputs=[timbre_content, timbre_reference], outputs=timbre_output)
|
642 |
+
|
643 |
+
with gr.Tab("Vevo-Style"):
|
644 |
+
gr.Markdown("### Vevo-Style: Maintain timbre but transfer style (accent, emotion, etc.)")
|
645 |
+
with gr.Row():
|
646 |
+
with gr.Column():
|
647 |
+
style_content = gr.Audio(label="Source Audio", type="numpy")
|
648 |
+
style_reference = gr.Audio(label="Style Reference", type="numpy")
|
649 |
+
style_button = gr.Button("Generate")
|
650 |
+
with gr.Column():
|
651 |
+
style_output = gr.Audio(label="Result")
|
652 |
+
style_button.click(vevo_style, inputs=[style_content, style_reference], outputs=style_output)
|
653 |
+
|
654 |
with gr.Tab("Vevo-Voice"):
|
655 |
gr.Markdown("### Vevo-Voice: Transfers both style and timbre with separate references")
|
656 |
with gr.Row():
|
657 |
with gr.Column():
|
658 |
+
voice_content = gr.Audio(label="Source Audio", type="numpy")
|
659 |
voice_style_reference = gr.Audio(label="Style Reference", type="numpy")
|
660 |
voice_timbre_reference = gr.Audio(label="Timbre Reference", type="numpy")
|
661 |
voice_button = gr.Button("Generate")
|
|
|
663 |
voice_output = gr.Audio(label="Result")
|
664 |
voice_button.click(vevo_voice, inputs=[voice_content, voice_style_reference, voice_timbre_reference], outputs=voice_output)
|
665 |
|
666 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
667 |
|
668 |
with gr.Tab("Vevo-TTS"):
|
669 |
gr.Markdown("### Vevo-TTS: Text-to-speech with separate style and timbre references")
|