E2-F5-TTS

Runtime error

cocktailpeanut committed on Oct 13, 2024

Commit

441eb78

1 Parent(s): 58ff1ba

update

Files changed (2) hide show

app_local.py CHANGED Viewed

@@ -88,9 +88,9 @@ def infer(ref_audio_orig, ref_text, gen_text, exp_name, remove_silence):
         aseg = AudioSegment.from_file(ref_audio_orig)
         aseg = aseg.set_channels(1)
         audio_duration = len(aseg)
-#        if audio_duration > 15000:
-#            gr.Warning("Audio is over 15s, clipping to only first 15s.")
-#            aseg = aseg[:15000]
         aseg.export(f.name, format="wav")
         ref_audio = f.name
     if exp_name == "F5-TTS":

         aseg = AudioSegment.from_file(ref_audio_orig)
         aseg = aseg.set_channels(1)
         audio_duration = len(aseg)
+        if audio_duration > 15000:
+            gr.Warning("Audio is over 15s, clipping to only first 15s.")
+            aseg = aseg[:15000]
         aseg.export(f.name, format="wav")
         ref_audio = f.name
     if exp_name == "F5-TTS":

model/utils.py CHANGED Viewed

@@ -134,7 +134,7 @@ def get_tokenizer(dataset_name, tokenizer: str = "pinyin"):
                 - if use "byte", set to 256 (unicode byte range)
     '''
     if tokenizer in ["pinyin", "char"]:
-        with open (f"data/{dataset_name}_{tokenizer}/vocab.txt", "r") as f:
             vocab_char_map = {}
             for i, char in enumerate(f):
                 vocab_char_map[char[:-1]] = i

                 - if use "byte", set to 256 (unicode byte range)
     '''
     if tokenizer in ["pinyin", "char"]:
+        with open (f"data/{dataset_name}_{tokenizer}/vocab.txt", "r", encoding="utf-8") as f:
             vocab_char_map = {}
             for i, char in enumerate(f):
                 vocab_char_map[char[:-1]] = i