diff options
Diffstat (limited to 'become_yukarin')
| -rw-r--r-- | become_yukarin/dataset/dataset.py | 6 | ||||
| -rw-r--r-- | become_yukarin/param.py | 1 |
2 files changed, 6 insertions, 1 deletions
diff --git a/become_yukarin/dataset/dataset.py b/become_yukarin/dataset/dataset.py index 0ca35df..fa68a78 100644 --- a/become_yukarin/dataset/dataset.py +++ b/become_yukarin/dataset/dataset.py @@ -66,15 +66,19 @@ class SplitProcess(BaseDataProcess): class WaveFileLoadProcess(BaseDataProcess): - def __init__(self, sample_rate: int, top_db: float, dtype=numpy.float32): + def __init__(self, sample_rate: int, top_db: float, pad_second: float = 0, dtype=numpy.float32): self._sample_rate = sample_rate self._top_db = top_db + self._pad_second = pad_second self._dtype = dtype def __call__(self, data: str, test): wave = librosa.core.load(data, sr=self._sample_rate, dtype=self._dtype)[0] if self._top_db is not None: wave = librosa.effects.remix(wave, intervals=librosa.effects.split(wave, top_db=self._top_db)) + if self._pad_second > 0.0: + p = int(self._sample_rate * self._pad_second) + wave = numpy.pad(wave, pad_width=(p, p), mode='constant') return Wave(wave, self._sample_rate) diff --git a/become_yukarin/param.py b/become_yukarin/param.py index 9173470..0870bab 100644 --- a/become_yukarin/param.py +++ b/become_yukarin/param.py @@ -4,6 +4,7 @@ from typing import NamedTuple class VoiceParam(NamedTuple): sample_rate: int = 24000 top_db: float = None + pad_second: float = 0.0 class AcousticFeatureParam(NamedTuple): |
