From 5bd61ca518be82750f2d688e97c9e066e3ad9645 Mon Sep 17 00:00:00 2001
From: Amila Rathnayake
Date: Sat, 10 Mar 2018 13:24:41 +0530
Subject: [PATCH] Fix for issues #37 and #53

---
 train.py | 11 +++++++++--
 1 file changed, 9 insertions(+), 2 deletions(-)

diff --git a/train.py b/train.py
index c85ceb6d..203061b7 100644
--- a/train.py
+++ b/train.py
@@ -50,6 +50,7 @@
 from matplotlib import pyplot as plt
 import sys
 import os
+import platform
 from tensorboardX import SummaryWriter
 from matplotlib import cm
 from warnings import warn
@@ -96,8 +97,9 @@ def plot_alignment(alignment, path, info=None):
 
 
 class TextDataSource(FileDataSource):
-    def __init__(self, data_root, speaker_id=None):
+    def __init__(self, data_root, frontend_name, speaker_id=None):
         self.data_root = data_root
+        self.frontend_name = frontend_name
         self.speaker_ids = None
         self.multi_speaker = False
         # If not None, filter by speaker_id
@@ -130,6 +132,11 @@ def collect_features(self, *args):
             text, speaker_id = args
         else:
             text = args[0]
+
+        # Fix for issues #37 and #53
+        if platform.system() == "Windows":
+            _frontend = getattr(frontend, self.frontend_name)
+
         seq = _frontend.text_to_sequence(text, p=hparams.replace_pronunciation_prob)
         if self.multi_speaker:
             return np.asarray(seq, dtype=np.int32), int(speaker_id)
@@ -884,7 +891,7 @@ def restore_parts(path, model):
     os.makedirs(checkpoint_dir, exist_ok=True)
 
     # Input dataset definitions
-    X = FileSourceDataset(TextDataSource(data_root, speaker_id))
+    X = FileSourceDataset(TextDataSource(data_root, hparams.frontend, speaker_id))
     Mel = FileSourceDataset(MelSpecDataSource(data_root, speaker_id))
     Y = FileSourceDataset(LinearSpecDataSource(data_root, speaker_id))
 