dongyh20 committed on
Commit
af514e8
·
1 Parent(s): 667e460

update space

Browse files
app.py CHANGED
@@ -76,7 +76,8 @@ tokenizer, model, image_processor, _ = load_pretrained_model(model_path, None)
76
  model = model.to('cuda').eval()
77
  model = model.bfloat16()
78
 
79
- tts_model = CosyVoice('iic/CosyVoice-300M-SFT', load_jit=True, fp16=True)
 
80
  OUTPUT_SPEECH = False
81
 
82
  USE_SPEECH=False
 
76
  model = model.to('cuda').eval()
77
  model = model.bfloat16()
78
 
79
+ # tts_model = CosyVoice('iic/CosyVoice-300M-SFT', load_jit=True, fp16=True)
80
+ tts_model = CosyVoice('FunAudioLLM/CosyVoice-300M-SFT', load_jit=True, fp16=True)
81
  OUTPUT_SPEECH = False
82
 
83
  USE_SPEECH=False
ola/CosyVoice_main/cosyvoice/cli/cosyvoice.py CHANGED
@@ -16,7 +16,8 @@ import time
16
  from typing import Generator
17
  from tqdm import tqdm
18
  from hyperpyyaml import load_hyperpyyaml
19
- from modelscope import snapshot_download
 
20
  import torch
21
  from cosyvoice.cli.frontend import CosyVoiceFrontEnd
22
  from cosyvoice.cli.model import CosyVoiceModel, CosyVoice2Model
 
16
  from typing import Generator
17
  from tqdm import tqdm
18
  from hyperpyyaml import load_hyperpyyaml
19
+ # from modelscope import snapshot_download
20
+ from huggingface_hub import snapshot_download
21
  import torch
22
  from cosyvoice.cli.frontend import CosyVoiceFrontEnd
23
  from cosyvoice.cli.model import CosyVoiceModel, CosyVoice2Model
requirements.txt CHANGED
@@ -22,6 +22,7 @@ torchvision==0.16.1
22
  torchaudio
23
  modelscope
24
  matcha-tts
 
25
  av
26
  librosa
27
  gradio
 
22
  torchaudio
23
  modelscope
24
  matcha-tts
25
+ pyworld
26
  av
27
  librosa
28
  gradio