Michael Hu committed on
Commit
a602e5e
·
1 Parent(s): 2d2f2b9

divide and conquer, don't do tts for now

Browse files
Files changed (3) hide show
  1. app.py +2 -2
  2. requirements.txt +1 -1
  3. utils/tts_dummy.py +3 -0
app.py CHANGED
@@ -9,7 +9,7 @@ import time
9
  import subprocess
10
  from utils.stt import transcribe_audio
11
  from utils.translation import translate_text
12
- from utils.tts import generate_speech
13
 
14
  # Hugging Face Spaces Setup Automation
15
  def setup_huggingface_space():
@@ -125,7 +125,7 @@ def render_results(english_text, chinese_text, output_path):
125
 
126
  def main():
127
  """Main application workflow"""
128
- setup_huggingface_space() # First-run configuration checks
129
  configure_page()
130
  st.title("🎧 High-Quality Audio Translation System")
131
  st.markdown("Upload English Audio β†’ Get Chinese Speech Output")
 
9
  import subprocess
10
  from utils.stt import transcribe_audio
11
  from utils.translation import translate_text
12
+ from utils.tts_dummy import generate_speech
13
 
14
  # Hugging Face Spaces Setup Automation
15
  def setup_huggingface_space():
 
125
 
126
  def main():
127
  """Main application workflow"""
128
+ # setup_huggingface_space() # First-run configuration checks
129
  configure_page()
130
  st.title("🎧 High-Quality Audio Translation System")
131
  st.markdown("Upload English Audio β†’ Get Chinese Speech Output")
requirements.txt CHANGED
@@ -11,4 +11,4 @@ phonemizer>=3.0
11
  espeak-ng>=1.51
12
  scipy>=1.11
13
  munch>=2.5
14
- git+https://github.com/hexgrad/Kokoro-82M
 
11
  espeak-ng>=1.51
12
  scipy>=1.11
13
  munch>=2.5
14
+ # git+https://github.com/hexgrad/Kokoro-82M
utils/tts_dummy.py ADDED
@@ -0,0 +1,3 @@
 
 
 
 
def generate_speech(text: str, language: str = "zh") -> str:
    """Placeholder TTS interface: return the path of a stub WAV file.

    No speech is synthesized. ``text`` and ``language`` are accepted only so
    the signature stays a drop-in replacement for the real TTS entry point;
    both are ignored.

    Args:
        text: Text that would be spoken (unused by this stub).
        language: Target language code (unused by this stub).

    Returns:
        The fixed relative path ``"temp/outputs/dummy.wav"``.
    """
    # Function-scope imports keep this block self-contained.
    import os
    import wave

    output_path = "temp/outputs/dummy.wav"

    # The stub path is handed to callers as if it were real audio output, so
    # make sure a valid (silent) WAV exists there instead of returning a path
    # to a file that was never written. An existing file is left untouched.
    if not os.path.exists(output_path):
        os.makedirs(os.path.dirname(output_path), exist_ok=True)
        with wave.open(output_path, "wb") as wav_file:
            wav_file.setnchannels(1)      # mono
            wav_file.setsampwidth(2)      # 16-bit PCM
            wav_file.setframerate(16000)
            wav_file.writeframes(b"\x00\x00" * 16000)  # one second of silence

    return output_path