Yehor committed on
Commit
5564ad9
·
1 Parent(s): 326a165
Files changed (1) hide show
  1. app.py +11 -7
app.py CHANGED
@@ -5,7 +5,6 @@ import time
5
 
6
  from os.path import getsize
7
  from pathlib import Path
8
- from enum import Enum
9
  from importlib.metadata import version, PackageNotFoundError
10
 
11
  try:
@@ -27,7 +26,6 @@ from common import update_params
27
  from torch_env import device
28
 
29
 
30
-
31
  # Vocoder
32
  from vocos import Vocos
33
 
@@ -85,8 +83,12 @@ data_config = config["data_config"]
85
  model_config = config["model_config"]
86
 
87
  # Load vocoder
88
- vocos_config = hf_hub_download("patriotyk/vocos-mel-hifigan-compat-44100khz", "config.yaml")
89
- vocos_model = hf_hub_download("patriotyk/vocos-mel-hifigan-compat-44100khz", "pytorch_model.bin")
 
 
 
 
90
 
91
  vocos_model_path = Path(vocos_model)
92
  state_dict = torch.load(vocos_model_path, map_location="cpu")
@@ -107,8 +109,8 @@ state_dict = checkpoint_dict["state_dict"]
107
  radtts.load_state_dict(state_dict, strict=False)
108
  radtts.eval()
109
 
110
- radtts_params = f'{sum(param.numel() for param in radtts.parameters()):,}'
111
- vocos_params = f'{sum(param.numel() for param in vocos.parameters()):,}'
112
 
113
  print(f"Loaded checkpoint (RAD-TTS++), number of parameters: {radtts_params}")
114
  print(f"Loaded checkpoint (Vocos), number of parameters: {vocos_params}")
@@ -240,7 +242,9 @@ def inference(text, voice):
240
 
241
  tensor_text = get_text(text).to(device)
242
 
243
- speaker_id = speaker_id_text = speaker_id_attributes = get_speaker_id(speaker).to(device)
 
 
244
 
245
  if speaker_text is not None:
246
  speaker_id_text = get_speaker_id(speaker_text).to(device)
 
5
 
6
  from os.path import getsize
7
  from pathlib import Path
 
8
  from importlib.metadata import version, PackageNotFoundError
9
 
10
  try:
 
26
  from torch_env import device
27
 
28
 
 
29
  # Vocoder
30
  from vocos import Vocos
31
 
 
83
  model_config = config["model_config"]
84
 
85
  # Load vocoder
86
+ vocos_config = hf_hub_download(
87
+ "patriotyk/vocos-mel-hifigan-compat-44100khz", "config.yaml"
88
+ )
89
+ vocos_model = hf_hub_download(
90
+ "patriotyk/vocos-mel-hifigan-compat-44100khz", "pytorch_model.bin"
91
+ )
92
 
93
  vocos_model_path = Path(vocos_model)
94
  state_dict = torch.load(vocos_model_path, map_location="cpu")
 
109
  radtts.load_state_dict(state_dict, strict=False)
110
  radtts.eval()
111
 
112
+ radtts_params = f"{sum(param.numel() for param in radtts.parameters()):,}"
113
+ vocos_params = f"{sum(param.numel() for param in vocos.parameters()):,}"
114
 
115
  print(f"Loaded checkpoint (RAD-TTS++), number of parameters: {radtts_params}")
116
  print(f"Loaded checkpoint (Vocos), number of parameters: {vocos_params}")
 
242
 
243
  tensor_text = get_text(text).to(device)
244
 
245
+ speaker_id = speaker_id_text = speaker_id_attributes = get_speaker_id(speaker).to(
246
+ device
247
+ )
248
 
249
  if speaker_text is not None:
250
  speaker_id_text = get_speaker_id(speaker_text).to(device)