From 93df4c160b8332a4ef41190860b5056905143def Mon Sep 17 00:00:00 2001 From: Hiroshiba Kazuyuki Date: Sun, 24 Dec 2017 20:24:21 +0900 Subject: add pad second --- become_yukarin/dataset/dataset.py | 6 +++++- become_yukarin/param.py | 1 + 2 files changed, 6 insertions(+), 1 deletion(-) (limited to 'become_yukarin') diff --git a/become_yukarin/dataset/dataset.py b/become_yukarin/dataset/dataset.py index 0ca35df..fa68a78 100644 --- a/become_yukarin/dataset/dataset.py +++ b/become_yukarin/dataset/dataset.py @@ -66,15 +66,19 @@ class SplitProcess(BaseDataProcess): class WaveFileLoadProcess(BaseDataProcess): - def __init__(self, sample_rate: int, top_db: float, dtype=numpy.float32): + def __init__(self, sample_rate: int, top_db: float, pad_second: float = 0, dtype=numpy.float32): self._sample_rate = sample_rate self._top_db = top_db + self._pad_second = pad_second self._dtype = dtype def __call__(self, data: str, test): wave = librosa.core.load(data, sr=self._sample_rate, dtype=self._dtype)[0] if self._top_db is not None: wave = librosa.effects.remix(wave, intervals=librosa.effects.split(wave, top_db=self._top_db)) + if self._pad_second > 0.0: + p = int(self._sample_rate * self._pad_second) + wave = numpy.pad(wave, pad_width=(p, p), mode='constant') return Wave(wave, self._sample_rate) diff --git a/become_yukarin/param.py b/become_yukarin/param.py index 9173470..0870bab 100644 --- a/become_yukarin/param.py +++ b/become_yukarin/param.py @@ -4,6 +4,7 @@ from typing import NamedTuple class VoiceParam(NamedTuple): sample_rate: int = 24000 top_db: float = None + pad_second: float = 0.0 class AcousticFeatureParam(NamedTuple): -- cgit v1.2.3-70-g09d2