lshzhm committed on
Commit
923aa33
·
1 Parent(s): 43d27a1

gradio infer

Browse files
Files changed (2) hide show
  1. MMAudio/demo.py +1 -1
  2. app.py +5 -5
MMAudio/demo.py CHANGED
@@ -64,7 +64,7 @@ def v2a_load():
64
  if args.variant not in all_model_cfg:
65
  raise ValueError(f'Unknown model variant: {args.variant}')
66
  model: ModelConfig = all_model_cfg[args.variant]
67
- #model.download_if_needed()
68
  seq_cfg = model.seq_cfg
69
 
70
  #if args.video:
 
64
  if args.variant not in all_model_cfg:
65
  raise ValueError(f'Unknown model variant: {args.variant}')
66
  model: ModelConfig = all_model_cfg[args.variant]
67
+ model.download_if_needed()
68
  seq_cfg = model.seq_cfg
69
 
70
  #if args.video:
app.py CHANGED
@@ -35,11 +35,6 @@ if True:
35
  log = logging.getLogger()
36
 
37
 
38
- import sys
39
- sys.path.insert(0, "./F5-TTS/src/")
40
- from f5_tts.infer.infer_cli_test import v2s_infer
41
-
42
-
43
  import sys
44
  sys.path.insert(0, "./MMAudio/")
45
  from demo import v2a_load, v2a_infer
@@ -47,6 +42,11 @@ from demo import v2a_load, v2a_infer
47
  v2a_loaded = v2a_load()
48
 
49
 
 
 
 
 
 
50
  #@spaces.GPU(duration=120)
51
  def video_to_audio_and_speech(video: gr.Video, prompt: str, v2a_num_steps: int, text: str, audio_prompt: gr.Audio, text_prompt: str, v2s_num_steps: int):
52
 
 
35
  log = logging.getLogger()
36
 
37
 
 
 
 
 
 
38
  import sys
39
  sys.path.insert(0, "./MMAudio/")
40
  from demo import v2a_load, v2a_infer
 
42
  v2a_loaded = v2a_load()
43
 
44
 
45
+ import sys
46
+ sys.path.insert(0, "./F5-TTS/src/")
47
+ from f5_tts.infer.infer_cli_test import v2s_infer
48
+
49
+
50
  #@spaces.GPU(duration=120)
51
  def video_to_audio_and_speech(video: gr.Video, prompt: str, v2a_num_steps: int, text: str, audio_prompt: gr.Audio, text_prompt: str, v2s_num_steps: int):
52