TTSDataset.py fixes and updates for existing phoneme folder in nultiprocessing

pull/10/head
Eren Golge 2019-02-28 17:49:42 +01:00
parent 618b280812
commit cc34fe4c7c
2 changed files with 13 additions and 3 deletions

View File

@ -1,5 +1,7 @@
#!/bin/bash
ls ${SHARED_DIR}/data/keithito
pip3 install https://download.pytorch.org/whl/cu100/torch-1.0.1.post2-cp36-cp36m-linux_x86_64.whl
yes | apt-get install espeak
python3 setup.py develop
python3 train.py --config_path config_cluster.json --data_path ${SHARED_DIR}/data/Blizzard/Nancy/ --debug true
# python3 distribute.py --config_path config_cluster.json --data_path ${SHARED_DIR}/data/keithito/LJSpeech-1.1/ --restore_path ${USER_DIR}/best_model.pth.tar
python3 distribute.py --config_path config_cluster.json --data_path ${SHARED_DIR}/data/keithito/LJSpeech-1.1/

View File

@ -65,7 +65,7 @@ class MyDataset(Dataset):
self.phoneme_language = phoneme_language
self.verbose = verbose
if use_phonemes and not os.path.isdir(phoneme_cache_path):
os.makedirs(phoneme_cache_path)
os.makedirs(phoneme_cache_path, exist_ok=True)
if self.verbose:
print("\n > DataLoader initialization")
print(" | > Data path: {}".format(root_path))
@ -91,7 +91,15 @@ class MyDataset(Dataset):
file_name = os.path.basename(wav_file).split('.')[0]
tmp_path = os.path.join(self.phoneme_cache_path, file_name+'_phoneme.npy')
if os.path.isfile(tmp_path):
text = np.load(tmp_path)
try:
text = np.load(tmp_path)
except:
print(" > ERROR: phoneme connot be loaded for {}. Recomputing.".format(wav_file))
text = np.asarray(
phoneme_to_sequence(
text, [self.cleaners], language=self.phoneme_language),
dtype=np.int32)
np.save(tmp_path, text)
else:
text = np.asarray(
phoneme_to_sequence(text, [self.cleaners], language=self.phoneme_language), dtype=np.int32)