Spaces:

lalalic
/

xtts

Sleeping

App Files Files Community

li cheng committed on Apr 4, 2024

Commit

2bc4022

1 Parent(s): e73f150

sample silence threshold

Browse files

Files changed (1) hide show

xtts.py +11 -13

xtts.py CHANGED Viewed

@@ -3,6 +3,7 @@ import requests
 import torch
 import traceback
 from TTS.api import TTS
 root=os.path.dirname(os.path.abspath(__file__))
@@ -26,7 +27,7 @@ if not os.path.exists(sample_root):
     os.makedirs(sample_root)
 default_sample=f'{root}/sample.wav', f'{sample_root}/sample.pt'
-ffmpeg=f'{root}/ffmpeg'
 if api:
     from qili import upload, check_token
@@ -114,25 +115,22 @@ def download(url):
 def trim_sample_audio(speaker_wav):
     global ffmpeg
     try:
         lowpass_highpass = "lowpass=8000,highpass=75,"
-        trim_silence = "areverse,silenceremove=start_periods=1:start_silence=0:start_threshold=0.02,areverse,silenceremove=start_periods=1:start_silence=0:start_threshold=0.02,"
         out_filename=speaker_wav.replace(".wav","_trimed.wav")
         shell_command = f"{ffmpeg} -y -i {speaker_wav} -af {lowpass_highpass}{trim_silence} {out_filename}".split(" ")
-        subprocess.run(
             [item for item in shell_command],
             capture_output=False,
             text=True,
             check=True,
-            stdout=None, #subprocess.PIPE,
             stderr=None, #subprocess.PIPE,
         )
-        if os.path.exists(out_filename) and os.path.getsize(out_filename) > 0:
-            os.remove(speaker_wav)
-            logging.debug(f'trimed sample wav to {out_filename}')
-            return out_filename
-        else:
-            logging.debug(f'Error: trimed sample wav to, ignored')
-            return speaker_wav
     except:
         logging.debug(f'Error: trimed sample wav to, ignored')
         return speaker_wav
@@ -147,8 +145,8 @@ def to_mp3(wav):
             capture_output=False,
             text=True,
             check=True,
-            stdout=None, #subprocess.PIPE,
-            stderr=None, #subprocess.PIPE,
         )
         logging.debug(f'convert wav {wav} to mp3 at {mp3}')
         return mp3

 import torch
 import traceback
 from TTS.api import TTS
+#ffmpeg -y -i /var/folders/w6/mxy2wbmd2bj360glkp0d5qbw0000gn/T/tmp49s6gxk7.wav -af lowpass=8000,highpass=75,areverse,silenceremove=start_periods=1:start_silence=0:start_threshold=0.02,areverse,silenceremove=start_periods=1:start_silence=0:start_threshold=0.02, ./test.wav
 root=os.path.dirname(os.path.abspath(__file__))
     os.makedirs(sample_root)
 default_sample=f'{root}/sample.wav', f'{sample_root}/sample.pt'
+ffmpeg="/opt/homebrew/bin/ffmpeg" #f'{root}/ffmpeg'
 if api:
     from qili import upload, check_token
 def trim_sample_audio(speaker_wav, threshold=0.005):
     """Filter a speaker sample with ffmpeg and trim silence from both ends.

     The sample is passed through ``lowpass=8000`` and ``highpass=75``, then
     through ``areverse,silenceremove`` twice, which strips silence from the
     end of the clip (start of the reversed audio) and then from its start.
     This is best-effort: on any failure the original file is left untouched
     and its path is returned.

     Args:
         speaker_wav: Path of the sample audio file to process.
         threshold: Value used for ``silenceremove``'s ``start_threshold``.

     Returns:
         Path of the trimmed file (``<name>_trimed<ext>``) when ffmpeg
         succeeded and produced a non-empty file; in that case the original
         file is deleted. Otherwise ``speaker_wav`` unchanged.
     """
     try:
         # Derive the output name from the extension only, so a ".wav" that
         # appears elsewhere in the path is not rewritten as well.
         base, ext = os.path.splitext(speaker_wav)
         out_filename = f"{base}_trimed{ext or '.wav'}"
         trim_once = (
             "areverse,silenceremove=start_periods=1:start_silence=0"
             f":start_threshold={threshold}"
         )
         # Join without a trailing comma so the filter chain has no empty entry.
         audio_filter = ",".join(["lowpass=8000", "highpass=75", trim_once, trim_once])
         # Pass an argument list (not a space-split string) so paths that
         # contain spaces reach ffmpeg intact.
         subprocess.run(
             [ffmpeg, "-y", "-i", speaker_wav, "-af", audio_filter, out_filename],
             check=True,
             stdout=subprocess.DEVNULL,
             stderr=None,  # keep ffmpeg diagnostics on the parent's stderr
         )
         # Only discard the original once a usable trimmed file really exists.
         if not os.path.exists(out_filename) or os.path.getsize(out_filename) == 0:
             logging.debug(f'Error: trimed sample wav to, ignored')
             return speaker_wav
         os.remove(speaker_wav)
         logging.debug(f'trimed sample wav to {out_filename}')
         return out_filename
     except Exception:
         # Best-effort: fall back to the untrimmed sample, but record why.
         logging.debug(f'Error: trimed sample wav to, ignored', exc_info=True)
         return speaker_wav
             capture_output=False,
             text=True,
             check=True,
+            stdout=subprocess.DEVNULL,
+            stderr=subprocess.DEVNULL,
         )
         logging.debug(f'convert wav {wav} to mp3 at {mp3}')
         return mp3