积极的屁孩 committed on
Commit
fbb3473
·
1 Parent(s): b4485a3

adjustments

Browse files
Files changed (1) hide show
  1. app.py +15 -14
app.py CHANGED
@@ -628,24 +628,34 @@ def vevo_tts(text, ref_wav, timbre_ref_wav=None, src_language="en", ref_language
628
  # 创建Gradio界面
629
  with gr.Blocks(title="VEVO DEMO") as demo:
630
  gr.Markdown("# VEVO DEMO")
631
- gr.Markdown("## Controllable Zero-Shot Voice Conversion and Style Transfer")
632
 
633
  with gr.Tab("Vevo-Timbre"):
634
  gr.Markdown("### Vevo-Timbre: Maintain style but transfer timbre")
635
  with gr.Row():
636
  with gr.Column():
637
- timbre_content = gr.Audio(label="Content Audio", type="numpy")
638
  timbre_reference = gr.Audio(label="Timbre Reference", type="numpy")
639
  timbre_button = gr.Button("Generate")
640
  with gr.Column():
641
  timbre_output = gr.Audio(label="Result")
642
  timbre_button.click(vevo_timbre, inputs=[timbre_content, timbre_reference], outputs=timbre_output)
643
-
 
 
 
 
 
 
 
 
 
 
 
644
  with gr.Tab("Vevo-Voice"):
645
  gr.Markdown("### Vevo-Voice: Transfers both style and timbre with separate references")
646
  with gr.Row():
647
  with gr.Column():
648
- voice_content = gr.Audio(label="Content Audio", type="numpy")
649
  voice_style_reference = gr.Audio(label="Style Reference", type="numpy")
650
  voice_timbre_reference = gr.Audio(label="Timbre Reference", type="numpy")
651
  voice_button = gr.Button("Generate")
@@ -653,16 +663,7 @@ with gr.Blocks(title="VEVO DEMO") as demo:
653
  voice_output = gr.Audio(label="Result")
654
  voice_button.click(vevo_voice, inputs=[voice_content, voice_style_reference, voice_timbre_reference], outputs=voice_output)
655
 
656
- with gr.Tab("Vevo-Style"):
657
- gr.Markdown("### Vevo-Style: Maintain timbre but transfer style (accent, emotion, etc.)")
658
- with gr.Row():
659
- with gr.Column():
660
- style_content = gr.Audio(label="Content Audio", type="numpy")
661
- style_reference = gr.Audio(label="Style Reference", type="numpy")
662
- style_button = gr.Button("Generate")
663
- with gr.Column():
664
- style_output = gr.Audio(label="Result")
665
- style_button.click(vevo_style, inputs=[style_content, style_reference], outputs=style_output)
666
 
667
  with gr.Tab("Vevo-TTS"):
668
  gr.Markdown("### Vevo-TTS: Text-to-speech with separate style and timbre references")
 
628
  # 创建Gradio界面
629
  with gr.Blocks(title="VEVO DEMO") as demo:
630
  gr.Markdown("# VEVO DEMO")
 
631
 
632
  with gr.Tab("Vevo-Timbre"):
633
  gr.Markdown("### Vevo-Timbre: Maintain style but transfer timbre")
634
  with gr.Row():
635
  with gr.Column():
636
+ timbre_content = gr.Audio(label="Source Audio", type="numpy")
637
  timbre_reference = gr.Audio(label="Timbre Reference", type="numpy")
638
  timbre_button = gr.Button("Generate")
639
  with gr.Column():
640
  timbre_output = gr.Audio(label="Result")
641
  timbre_button.click(vevo_timbre, inputs=[timbre_content, timbre_reference], outputs=timbre_output)
642
+
643
+ with gr.Tab("Vevo-Style"):
644
+ gr.Markdown("### Vevo-Style: Maintain timbre but transfer style (accent, emotion, etc.)")
645
+ with gr.Row():
646
+ with gr.Column():
647
+ style_content = gr.Audio(label="Source Audio", type="numpy")
648
+ style_reference = gr.Audio(label="Style Reference", type="numpy")
649
+ style_button = gr.Button("Generate")
650
+ with gr.Column():
651
+ style_output = gr.Audio(label="Result")
652
+ style_button.click(vevo_style, inputs=[style_content, style_reference], outputs=style_output)
653
+
654
  with gr.Tab("Vevo-Voice"):
655
  gr.Markdown("### Vevo-Voice: Transfers both style and timbre with separate references")
656
  with gr.Row():
657
  with gr.Column():
658
+ voice_content = gr.Audio(label="Source Audio", type="numpy")
659
  voice_style_reference = gr.Audio(label="Style Reference", type="numpy")
660
  voice_timbre_reference = gr.Audio(label="Timbre Reference", type="numpy")
661
  voice_button = gr.Button("Generate")
 
663
  voice_output = gr.Audio(label="Result")
664
  voice_button.click(vevo_voice, inputs=[voice_content, voice_style_reference, voice_timbre_reference], outputs=voice_output)
665
 
666
+
 
 
 
 
 
 
 
 
 
667
 
668
  with gr.Tab("Vevo-TTS"):
669
  gr.Markdown("### Vevo-TTS: Text-to-speech with separate style and timbre references")