diff --git a/TTS/bin/extract_tts_spectrograms.py b/TTS/bin/extract_tts_spectrograms.py
index 0af98ff1..e46e4a00 100755
--- a/TTS/bin/extract_tts_spectrograms.py
+++ b/TTS/bin/extract_tts_spectrograms.py
@@ -12,7 +12,7 @@ from tqdm import tqdm
 from TTS.config import load_config
 from TTS.tts.datasets import TTSDataset, load_tts_samples
 from TTS.tts.models import setup_model
-from TTS.tts.utils.speakers import get_speaker_manager
+from TTS.tts.utils.speakers import SpeakerManager
 from TTS.utils.audio import AudioProcessor
 from TTS.utils.generic_utils import count_parameters
 
@@ -234,8 +234,15 @@ def main(args):  # pylint: disable=redefined-outer-name
     # use eval and training partitions
     meta_data = meta_data_train + meta_data_eval
 
-    # parse speakers
-    speaker_manager = get_speaker_manager(c, args, meta_data_train)
+    # init speaker manager from the config flags: `use_speaker_embedding` is
+    # checked first, then `use_d_vector_file`; with neither set there is none
+    if c.use_speaker_embedding:
+        # built from the combined train + eval samples assembled above
+        speaker_manager = SpeakerManager(data_items=meta_data)
+    elif c.use_d_vector_file:
+        speaker_manager = SpeakerManager(d_vectors_file_path=c.d_vector_file)
+    else:
+        speaker_manager = None
 
     # setup model
     model = setup_model(c)