Spaces:

Yehor
/

radtts-uk-vocos-demo

Running

Yehor committed 13 days ago

Commit

5564ad9

1 Parent(s): 326a165

Fixes

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,7 +5,6 @@ import time
 from os.path import getsize
 from pathlib import Path
-from enum import Enum
 from importlib.metadata import version, PackageNotFoundError
 try:
@@ -27,7 +26,6 @@ from common import update_params
 from torch_env import device
 # Vocoder
 from vocos import Vocos
@@ -85,8 +83,12 @@ data_config = config["data_config"]
 model_config = config["model_config"]
 # Load vocoder
-vocos_config = hf_hub_download("patriotyk/vocos-mel-hifigan-compat-44100khz", "config.yaml")
-vocos_model = hf_hub_download("patriotyk/vocos-mel-hifigan-compat-44100khz", "pytorch_model.bin")
 vocos_model_path = Path(vocos_model)
 state_dict = torch.load(vocos_model_path, map_location="cpu")
@@ -107,8 +109,8 @@ state_dict = checkpoint_dict["state_dict"]
 radtts.load_state_dict(state_dict, strict=False)
 radtts.eval()
-radtts_params = f'{sum(param.numel() for param in radtts.parameters()):,}'
-vocos_params = f'{sum(param.numel() for param in vocos.parameters()):,}'
 print(f"Loaded checkpoint (RAD-TTS++), number of parameters: {radtts_params}")
 print(f"Loaded checkpoint (Vocos), number of parameters: {vocos_params}")
@@ -240,7 +242,9 @@ def inference(text, voice):
     tensor_text = get_text(text).to(device)
-    speaker_id = speaker_id_text = speaker_id_attributes = get_speaker_id(speaker).to(device)
     if speaker_text is not None:
         speaker_id_text = get_speaker_id(speaker_text).to(device)

 from os.path import getsize
 from pathlib import Path
 from importlib.metadata import version, PackageNotFoundError
 try:
 from torch_env import device
 # Vocoder
 from vocos import Vocos
 model_config = config["model_config"]
 # Load vocoder
+vocos_config = hf_hub_download(
+    "patriotyk/vocos-mel-hifigan-compat-44100khz", "config.yaml"
+)
+vocos_model = hf_hub_download(
+    "patriotyk/vocos-mel-hifigan-compat-44100khz", "pytorch_model.bin"
+)
 vocos_model_path = Path(vocos_model)
 state_dict = torch.load(vocos_model_path, map_location="cpu")
 radtts.load_state_dict(state_dict, strict=False)
 radtts.eval()
+radtts_params = f"{sum(param.numel() for param in radtts.parameters()):,}"
+vocos_params = f"{sum(param.numel() for param in vocos.parameters()):,}"
 print(f"Loaded checkpoint (RAD-TTS++), number of parameters: {radtts_params}")
 print(f"Loaded checkpoint (Vocos), number of parameters: {vocos_params}")
     tensor_text = get_text(text).to(device)
+    speaker_id = speaker_id_text = speaker_id_attributes = get_speaker_id(speaker).to(
+        device
+    )
     if speaker_text is not None:
         speaker_id_text = get_speaker_id(speaker_text).to(device)