积极的屁孩 committed on
Commit
b4485a3
·
1 Parent(s): cc7434e

adjustments

Browse files
Files changed (1) hide show
  1. app.py +5 -8
app.py CHANGED
@@ -642,7 +642,7 @@ with gr.Blocks(title="VEVO DEMO") as demo:
642
  timbre_button.click(vevo_timbre, inputs=[timbre_content, timbre_reference], outputs=timbre_output)
643
 
644
  with gr.Tab("Vevo-Voice"):
645
- gr.Markdown("### Vevo-Voice: Transfer both style and timbre with separate references")
646
  with gr.Row():
647
  with gr.Column():
648
  voice_content = gr.Audio(label="Content Audio", type="numpy")
@@ -665,17 +665,14 @@ with gr.Blocks(title="VEVO DEMO") as demo:
665
  style_button.click(vevo_style, inputs=[style_content, style_reference], outputs=style_output)
666
 
667
  with gr.Tab("Vevo-TTS"):
668
- gr.Markdown("### Vevo-TTS: Text-to-speech with controllable style and timbre")
669
  with gr.Row():
670
  with gr.Column():
671
  tts_text = gr.Textbox(label="Input Text", placeholder="Enter text to synthesize...", lines=3)
672
  tts_src_language = gr.Dropdown(["en", "zh", "de", "fr", "ja", "ko"], label="Text Language", value="en")
673
  tts_reference = gr.Audio(label="Style Reference", type="numpy")
 
674
  tts_ref_language = gr.Dropdown(["en", "zh", "de", "fr", "ja", "ko"], label="Reference Audio Language", value="en")
675
-
676
- with gr.Accordion("Advanced Options", open=False):
677
- tts_timbre_reference = gr.Audio(label="Timbre Reference (Optional)", type="numpy")
678
-
679
  tts_button = gr.Button("Generate")
680
  with gr.Column():
681
  tts_output = gr.Audio(label="Result")
@@ -691,8 +688,8 @@ with gr.Blocks(title="VEVO DEMO") as demo:
691
  VEVO is a versatile voice synthesis and conversion model that offers four main functionalities:
692
  1. **Vevo-Style**: Maintains timbre but transfers style (accent, emotion, etc.)
693
  2. **Vevo-Timbre**: Maintains style but transfers timbre
694
- 3. **Vevo-Voice**: Transfers both style and timbre simultaneously
695
- 4. **Vevo-TTS**: Text-to-speech with controllable style and timbre
696
 
697
  For more information, visit the [Amphion project](https://github.com/open-mmlab/Amphion)
698
  """)
 
642
  timbre_button.click(vevo_timbre, inputs=[timbre_content, timbre_reference], outputs=timbre_output)
643
 
644
  with gr.Tab("Vevo-Voice"):
645
+ gr.Markdown("### Vevo-Voice: Transfers both style and timbre with separate references")
646
  with gr.Row():
647
  with gr.Column():
648
  voice_content = gr.Audio(label="Content Audio", type="numpy")
 
665
  style_button.click(vevo_style, inputs=[style_content, style_reference], outputs=style_output)
666
 
667
  with gr.Tab("Vevo-TTS"):
668
+ gr.Markdown("### Vevo-TTS: Text-to-speech with separate style and timbre references")
669
  with gr.Row():
670
  with gr.Column():
671
  tts_text = gr.Textbox(label="Input Text", placeholder="Enter text to synthesize...", lines=3)
672
  tts_src_language = gr.Dropdown(["en", "zh", "de", "fr", "ja", "ko"], label="Text Language", value="en")
673
  tts_reference = gr.Audio(label="Style Reference", type="numpy")
674
+ tts_timbre_reference = gr.Audio(label="Timbre Reference", type="numpy")
675
  tts_ref_language = gr.Dropdown(["en", "zh", "de", "fr", "ja", "ko"], label="Reference Audio Language", value="en")
 
 
 
 
676
  tts_button = gr.Button("Generate")
677
  with gr.Column():
678
  tts_output = gr.Audio(label="Result")
 
688
  VEVO is a versatile voice synthesis and conversion model that offers four main functionalities:
689
  1. **Vevo-Style**: Maintains timbre but transfers style (accent, emotion, etc.)
690
  2. **Vevo-Timbre**: Maintains style but transfers timbre
691
+ 3. **Vevo-Voice**: Transfers both style and timbre with separate references
692
+ 4. **Vevo-TTS**: Text-to-speech with separate style and timbre references
693
 
694
  For more information, visit the [Amphion project](https://github.com/open-mmlab/Amphion)
695
  """)