Spaces:
Build error
Build error
积极的屁孩
committed on
Commit
·
c5442ce
1
Parent(s):
c0b2589
final test
Browse files
app.py
CHANGED
@@ -630,32 +630,36 @@ def vevo_tts(text, ref_wav, timbre_ref_wav=None, style_ref_text=None, src_langua
|
|
630 |
# 创建Gradio界面
|
631 |
with gr.Blocks(title="Vevo DEMO") as demo:
|
632 |
gr.Markdown("# Vevo DEMO")
|
|
|
|
|
633 |
# 添加链接标签行
|
634 |
with gr.Row(elem_id="links_row"):
|
635 |
gr.HTML("""
|
636 |
-
<div style="display: flex; justify-content: center; gap:
|
637 |
<a href="https://arxiv.org/abs/2502.07243" target="_blank" style="text-decoration: none;">
|
638 |
-
<div style="
|
639 |
-
<span style="background-color: #
|
640 |
-
<span style="padding: 5px
|
641 |
</div>
|
642 |
</a>
|
643 |
<a href="https://openreview.net/pdf?id=anQDiQZhDP" target="_blank" style="text-decoration: none;">
|
644 |
-
<div style="
|
645 |
-
<span style="background-color: #
|
646 |
-
<span style="padding: 5px
|
647 |
</div>
|
648 |
</a>
|
649 |
<a href="https://huggingface.co/amphion/Vevo" target="_blank" style="text-decoration: none;">
|
650 |
-
<div style="
|
651 |
-
<span style="background-color: #
|
652 |
-
|
|
|
|
|
653 |
</div>
|
654 |
</a>
|
655 |
<a href="https://github.com/open-mmlab/Amphion/tree/main/models/vc/vevo" target="_blank" style="text-decoration: none;">
|
656 |
-
<div style="
|
657 |
-
<span style="background-color: #
|
658 |
-
<span style="padding: 5px
|
659 |
</div>
|
660 |
</a>
|
661 |
</div>
|
@@ -703,10 +707,10 @@ with gr.Blocks(title="Vevo DEMO") as demo:
|
|
703 |
with gr.Column():
|
704 |
tts_text = gr.Textbox(label="Input Text", placeholder="Enter text to synthesize...", lines=3)
|
705 |
tts_src_language = gr.Dropdown(["en", "zh", "de", "fr", "ja", "ko"], label="Text Language", value="en")
|
706 |
-
tts_reference = gr.Audio(label="Style Reference", type="numpy")
|
|
|
707 |
tts_timbre_reference = gr.Audio(label="Timbre Reference", type="numpy")
|
708 |
tts_ref_language = gr.Dropdown(["en", "zh", "de", "fr", "ja", "ko"], label="Reference Audio Language", value="en")
|
709 |
-
tts_style_ref_text = gr.Textbox(label="Style Reference Text", placeholder="Enter style reference text...", lines=3)
|
710 |
tts_button = gr.Button("Generate")
|
711 |
with gr.Column():
|
712 |
tts_output = gr.Audio(label="Result")
|
|
|
630 |
# 创建Gradio界面
|
631 |
with gr.Blocks(title="Vevo DEMO") as demo:
|
632 |
gr.Markdown("# Vevo DEMO")
|
633 |
+
gr.Markdown("## Controllable Zero-Shot Voice Imitation with Self-Supervised Disentanglement")
|
634 |
+
|
635 |
# 添加链接标签行
|
636 |
with gr.Row(elem_id="links_row"):
|
637 |
gr.HTML("""
|
638 |
+
<div style="display: flex; justify-content: center; gap: 8px; margin: 20px 0;">
|
639 |
<a href="https://arxiv.org/abs/2502.07243" target="_blank" style="text-decoration: none;">
|
640 |
+
<div style="display: inline-flex; align-items: center; border-radius: 4px; overflow: hidden;">
|
641 |
+
<span style="background-color: #4a4a4a; color: white; padding: 5px 8px; font-size: 14px;">arXiv</span>
|
642 |
+
<span style="background-color: #c44e52; color: white; padding: 5px 8px; font-size: 14px;">Paper</span>
|
643 |
</div>
|
644 |
</a>
|
645 |
<a href="https://openreview.net/pdf?id=anQDiQZhDP" target="_blank" style="text-decoration: none;">
|
646 |
+
<div style="display: inline-flex; align-items: center; border-radius: 4px; overflow: hidden;">
|
647 |
+
<span style="background-color: #4a4a4a; color: white; padding: 5px 8px; font-size: 14px;">ICLR</span>
|
648 |
+
<span style="background-color: #55a868; color: white; padding: 5px 8px; font-size: 14px;">Paper</span>
|
649 |
</div>
|
650 |
</a>
|
651 |
<a href="https://huggingface.co/amphion/Vevo" target="_blank" style="text-decoration: none;">
|
652 |
+
<div style="display: inline-flex; align-items: center; border-radius: 4px; overflow: hidden;">
|
653 |
+
<span style="background-color: #4a4a4a; color: white; padding: 5px 8px; font-size: 14px;">
|
654 |
+
<span style="font-size: 14px;">🤗</span> HuggingFace
|
655 |
+
</span>
|
656 |
+
<span style="background-color: #eeca3b; color: white; padding: 5px 8px; font-size: 14px;">Model</span>
|
657 |
</div>
|
658 |
</a>
|
659 |
<a href="https://github.com/open-mmlab/Amphion/tree/main/models/vc/vevo" target="_blank" style="text-decoration: none;">
|
660 |
+
<div style="display: inline-flex; align-items: center; border-radius: 4px; overflow: hidden;">
|
661 |
+
<span style="background-color: #4a4a4a; color: white; padding: 5px 8px; font-size: 14px;">GitHub</span>
|
662 |
+
<span style="background-color: #4c72b0; color: white; padding: 5px 8px; font-size: 14px;">Repo</span>
|
663 |
</div>
|
664 |
</a>
|
665 |
</div>
|
|
|
707 |
with gr.Column():
|
708 |
tts_text = gr.Textbox(label="Input Text", placeholder="Enter text to synthesize...", lines=3)
|
709 |
tts_src_language = gr.Dropdown(["en", "zh", "de", "fr", "ja", "ko"], label="Text Language", value="en")
|
710 |
+
tts_reference = gr.Audio(label="Style Reference", type="numpy")
|
711 |
+
tts_style_ref_text = gr.Textbox(label="Style Reference Text", placeholder="Enter style reference text...", lines=3)
|
712 |
tts_timbre_reference = gr.Audio(label="Timbre Reference", type="numpy")
|
713 |
tts_ref_language = gr.Dropdown(["en", "zh", "de", "fr", "ja", "ko"], label="Reference Audio Language", value="en")
|
|
|
714 |
tts_button = gr.Button("Generate")
|
715 |
with gr.Column():
|
716 |
tts_output = gr.Audio(label="Result")
|