Edit PR #310 and merge

2019-11-14 16:14:01 +01:00 · 2019-11-14 16:14:01 +01:00 · 8af75cad46
parent 574de86b9b
commit 8af75cad46
4 changed files with 42 additions and 485 deletions
--- a/requirements.txt
+++ b/requirements.txt
@@ -11,3 +11,4 @@ scipy==0.19.0
 tqdm
 git+git://github.com/bootphon/phonemizer@master
 soundfile
 bokeh==1.4.0
--- a/setup.py
+++ b/setup.py
@@ -87,6 +87,7 @@ setup(
        "flask",
        # "lws",
        "tqdm",
        "bokeh==1.4.0",
        "soundfile",
        "phonemizer @ https://github.com/bootphon/phonemizer/tarball/master",
    ],
--- a/speaker_encoder/compute_embeddings.py
+++ b/speaker_encoder/compute_embeddings.py
@@ -11,17 +11,26 @@ from TTS.utils.audio import AudioProcessor
 from TTS.utils.generic_utils import load_config
 parser = argparse.ArgumentParser(
-    description="Compute embedding vectors for each wav file in a dataset. "
+    description='Compute embedding vectors for each wav file in a dataset. ')
 parser.add_argument(
    'model_path',
    type=str,
    help='Path to model outputs (checkpoint, tensorboard etc.).')
 parser.add_argument(
    'config_path',
    type=str,
    help='Path to config file for training.',
 )
 parser.add_argument(
    'data_path',
    type=str,
    help='Data path for wav files - directory or CSV file')
 parser.add_argument(
-    "config_path", type=str, help="Path to config file for training.",
+    'output_path',
-)
+    type=str,
    help='path for training outputs.')
 parser.add_argument(
-    "data_path", type=str, help="Defines the data path. It overwrites config.json."
+    '--use_cuda', type=bool, help='flag to set cuda.', default=False
 )
 parser.add_argument(
    '--separator', type=str, help='Separator used in file if CSV is passed for data_path', default='|'
@@ -30,7 +39,7 @@ args = parser.parse_args()
 c = load_config(args.config_path)
-ap = AudioProcessor(**c["audio"])
+ap = AudioProcessor(**c['audio'])
 data_path = args.data_path
 split_ext = os.path.splitext(data_path)
@@ -65,7 +74,7 @@ for output_file in output_files:
    os.makedirs(os.path.dirname(output_file), exist_ok=True)
 model = SpeakerEncoder(**c.model)
-model.load_state_dict(torch.load(args.model_path)["model"])
+model.load_state_dict(torch.load(args.model_path)['model'])
 model.eval()
 if args.use_cuda:
    model.cuda()
--- a/speaker_encoder/notebooks/PlotUmapLibriTTS.ipynb
+++ b/speaker_encoder/notebooks/PlotUmapLibriTTS.ipynb