Spaces:

lalalic
/

xtts

Sleeping

App Files Community

li cheng committed on Apr 4, 2024

Commit

b9ae40e

1 Parent(s): 2bc4022

Retry sample trimming with the threshold halved (threshold/2) while it is above 0.001

Browse files

Files changed (1) hide show

xtts.py +10 -6

xtts.py CHANGED Viewed

@@ -96,8 +96,8 @@ def download_sample(url):
         response = requests.get(url)
         if response.status_code == 200:
             id=f'{sample_root}/{response.headers["etag"]}.pt'.replace('"','')
-            if(os.path.exists(id)):
-                return "", id
             with tempfile.NamedTemporaryFile(mode="wb", suffix=".wav", delete=False) as temp_file:
                 temp_file.write(response.content)
                 logging.debug(f'downloaded sample wav from {url}')
@@ -112,22 +112,26 @@ def download(url):
             temp_file.write(response.content)
             return os.path.abspath(temp_file.name)
-def trim_sample_audio(speaker_wav):
     global ffmpeg
     try:
-        threshold=0.005 #os.environ["FILTER_THRESHOLD"]
         lowpass_highpass = "lowpass=8000,highpass=75,"
         trim_silence = f"areverse,silenceremove=start_periods=1:start_silence=0:start_threshold={threshold},areverse,silenceremove=start_periods=1:start_silence=0:start_threshold={threshold},"
         out_filename=speaker_wav.replace(".wav","_trimed.wav")
         shell_command = f"{ffmpeg} -y -i {speaker_wav} -af {lowpass_highpass}{trim_silence} {out_filename}".split(" ")
         result=subprocess.run(
             [item for item in shell_command],
-            capture_output=False,
             text=True,
             check=True,
             stdout=subprocess.DEVNULL,
-            stderr=None, #subprocess.PIPE,
         )
         os.remove(speaker_wav)
         logging.debug(f'trimed sample wav to {out_filename}')
         return out_filename

         response = requests.get(url)
         if response.status_code == 200:
             id=f'{sample_root}/{response.headers["etag"]}.pt'.replace('"','')
+            # if(os.path.exists(id)):
+            #     return "", id
             with tempfile.NamedTemporaryFile(mode="wb", suffix=".wav", delete=False) as temp_file:
                 temp_file.write(response.content)
                 logging.debug(f'downloaded sample wav from {url}')
             temp_file.write(response.content)
             return os.path.abspath(temp_file.name)
+def trim_sample_audio(speaker_wav, threshold=0.005):
     global ffmpeg
     try:
         lowpass_highpass = "lowpass=8000,highpass=75,"
         trim_silence = f"areverse,silenceremove=start_periods=1:start_silence=0:start_threshold={threshold},areverse,silenceremove=start_periods=1:start_silence=0:start_threshold={threshold},"
         out_filename=speaker_wav.replace(".wav","_trimed.wav")
         shell_command = f"{ffmpeg} -y -i {speaker_wav} -af {lowpass_highpass}{trim_silence} {out_filename}".split(" ")
+        logging.debug(shell_command)
         result=subprocess.run(
             [item for item in shell_command],
+            capture_output=True,
             text=True,
             check=True,
             stdout=subprocess.DEVNULL,
+            stderr=None,
         )
+        if result.stderr is not None and "Output file is empty" in result.stderr:
+            if threshold > 0.001:
+                return trim_sample_audio(speaker_wav, threshold/2)
+            return speaker_wav
         os.remove(speaker_wav)
         logging.debug(f'trimed sample wav to {out_filename}')
         return out_filename