Spaces:
Running
Running
gradio infer
Browse files
- MMAudio/demo.py +1 -1
- app.py +5 -5
MMAudio/demo.py
CHANGED
@@ -64,7 +64,7 @@ def v2a_load():
|
|
64 |
if args.variant not in all_model_cfg:
|
65 |
raise ValueError(f'Unknown model variant: {args.variant}')
|
66 |
model: ModelConfig = all_model_cfg[args.variant]
|
67 |
-
|
68 |
seq_cfg = model.seq_cfg
|
69 |
|
70 |
#if args.video:
|
|
|
64 |
if args.variant not in all_model_cfg:
|
65 |
raise ValueError(f'Unknown model variant: {args.variant}')
|
66 |
model: ModelConfig = all_model_cfg[args.variant]
|
67 |
+
model.download_if_needed()
|
68 |
seq_cfg = model.seq_cfg
|
69 |
|
70 |
#if args.video:
|
app.py
CHANGED
@@ -35,11 +35,6 @@ if True:
|
|
35 |
log = logging.getLogger()
|
36 |
|
37 |
|
38 |
-
import sys
|
39 |
-
sys.path.insert(0, "./F5-TTS/src/")
|
40 |
-
from f5_tts.infer.infer_cli_test import v2s_infer
|
41 |
-
|
42 |
-
|
43 |
import sys
|
44 |
sys.path.insert(0, "./MMAudio/")
|
45 |
from demo import v2a_load, v2a_infer
|
@@ -47,6 +42,11 @@ from demo import v2a_load, v2a_infer
|
|
47 |
v2a_loaded = v2a_load()
|
48 |
|
49 |
|
|
|
|
|
|
|
|
|
|
|
50 |
#@spaces.GPU(duration=120)
|
51 |
def video_to_audio_and_speech(video: gr.Video, prompt: str, v2a_num_steps: int, text: str, audio_prompt: gr.Audio, text_prompt: str, v2s_num_steps: int):
|
52 |
|
|
|
35 |
log = logging.getLogger()
|
36 |
|
37 |
|
|
|
|
|
|
|
|
|
|
|
38 |
import sys
|
39 |
sys.path.insert(0, "./MMAudio/")
|
40 |
from demo import v2a_load, v2a_infer
|
|
|
42 |
v2a_loaded = v2a_load()
|
43 |
|
44 |
|
45 |
+
import sys
|
46 |
+
sys.path.insert(0, "./F5-TTS/src/")
|
47 |
+
from f5_tts.infer.infer_cli_test import v2s_infer
|
48 |
+
|
49 |
+
|
50 |
#@spaces.GPU(duration=120)
|
51 |
def video_to_audio_and_speech(video: gr.Video, prompt: str, v2a_num_steps: int, text: str, audio_prompt: gr.Audio, text_prompt: str, v2s_num_steps: int):
|
52 |
|