Spaces:
Running
Running
Fixes
Browse files
app.py
CHANGED
@@ -5,7 +5,6 @@ import time
|
|
5 |
|
6 |
from os.path import getsize
|
7 |
from pathlib import Path
|
8 |
-
from enum import Enum
|
9 |
from importlib.metadata import version, PackageNotFoundError
|
10 |
|
11 |
try:
|
@@ -27,7 +26,6 @@ from common import update_params
|
|
27 |
from torch_env import device
|
28 |
|
29 |
|
30 |
-
|
31 |
# Vocoder
|
32 |
from vocos import Vocos
|
33 |
|
@@ -85,8 +83,12 @@ data_config = config["data_config"]
|
|
85 |
model_config = config["model_config"]
|
86 |
|
87 |
# Load vocoder
|
88 |
-
vocos_config = hf_hub_download("patriotyk/vocos-mel-hifigan-compat-44100khz", "config.yaml")
|
89 |
-
vocos_model = hf_hub_download("patriotyk/vocos-mel-hifigan-compat-44100khz", "pytorch_model.bin")
|
|
|
|
|
|
|
|
|
90 |
|
91 |
vocos_model_path = Path(vocos_model)
|
92 |
state_dict = torch.load(vocos_model_path, map_location="cpu")
|
@@ -107,8 +109,8 @@ state_dict = checkpoint_dict["state_dict"]
|
|
107 |
radtts.load_state_dict(state_dict, strict=False)
|
108 |
radtts.eval()
|
109 |
|
110 |
-
radtts_params = f
|
111 |
-
vocos_params = f
|
112 |
|
113 |
print(f"Loaded checkpoint (RAD-TTS++), number of parameters: {radtts_params}")
|
114 |
print(f"Loaded checkpoint (Vocos), number of parameters: {vocos_params}")
|
@@ -240,7 +242,9 @@ def inference(text, voice):
|
|
240 |
|
241 |
tensor_text = get_text(text).to(device)
|
242 |
|
243 |
-
speaker_id = speaker_id_text = speaker_id_attributes = get_speaker_id(speaker).to(device)
|
|
|
|
|
244 |
|
245 |
if speaker_text is not None:
|
246 |
speaker_id_text = get_speaker_id(speaker_text).to(device)
|
|
|
5 |
|
6 |
from os.path import getsize
|
7 |
from pathlib import Path
|
|
|
8 |
from importlib.metadata import version, PackageNotFoundError
|
9 |
|
10 |
try:
|
|
|
26 |
from torch_env import device
|
27 |
|
28 |
|
|
|
29 |
# Vocoder
|
30 |
from vocos import Vocos
|
31 |
|
|
|
83 |
model_config = config["model_config"]
|
84 |
|
85 |
# Load vocoder
|
86 |
+
vocos_config = hf_hub_download(
|
87 |
+
"patriotyk/vocos-mel-hifigan-compat-44100khz", "config.yaml"
|
88 |
+
)
|
89 |
+
vocos_model = hf_hub_download(
|
90 |
+
"patriotyk/vocos-mel-hifigan-compat-44100khz", "pytorch_model.bin"
|
91 |
+
)
|
92 |
|
93 |
vocos_model_path = Path(vocos_model)
|
94 |
state_dict = torch.load(vocos_model_path, map_location="cpu")
|
|
|
109 |
radtts.load_state_dict(state_dict, strict=False)
|
110 |
radtts.eval()
|
111 |
|
112 |
+
radtts_params = f"{sum(param.numel() for param in radtts.parameters()):,}"
|
113 |
+
vocos_params = f"{sum(param.numel() for param in vocos.parameters()):,}"
|
114 |
|
115 |
print(f"Loaded checkpoint (RAD-TTS++), number of parameters: {radtts_params}")
|
116 |
print(f"Loaded checkpoint (Vocos), number of parameters: {vocos_params}")
|
|
|
242 |
|
243 |
tensor_text = get_text(text).to(device)
|
244 |
|
245 |
+
speaker_id = speaker_id_text = speaker_id_attributes = get_speaker_id(speaker).to(
|
246 |
+
device
|
247 |
+
)
|
248 |
|
249 |
if speaker_text is not None:
|
250 |
speaker_id_text = get_speaker_id(speaker_text).to(device)
|