Secure your code as it's written. Use Snyk Code to scan source code in minutes - no build needed - and fix issues immediately.
@raises(ValueError)
def __test_invalid_speaker():
data_source = cmu_arctic.WavFileDataSource("dummy", speakers=["test"])
@attr("require_local_data")
@attr("require_cmu_arctic")
def test_cmu_arctic():
DATA_DIR = join(expanduser("~"), "data", "cmu_arctic")
if not exists(DATA_DIR):
warn("Data doesn't exist at {}".format(DATA_DIR))
return
class MyFileDataSource(cmu_arctic.WavFileDataSource):
def __init__(self, data_root, speakers, labelmap=None, max_files=2):
super(MyFileDataSource, self).__init__(
data_root, speakers, labelmap=labelmap, max_files=max_files)
self.alpha = pysptk.util.mcepalpha(16000)
def collect_features(self, path):
fs, x = wavfile.read(path)
x = x.astype(np.float64)
f0, timeaxis = pyworld.dio(x, fs, frame_period=5)
f0 = pyworld.stonemask(x, f0, timeaxis, fs)
spectrogram = pyworld.cheaptrick(x, f0, timeaxis, fs)
spectrogram = trim_zeros_frames(spectrogram)
mc = pysptk.sp2mc(spectrogram, order=24, alpha=self.alpha)
return mc.astype(np.float32)
max_files = 10
def test_cmu_arctic_dummy():
data_source = cmu_arctic.WavFileDataSource("dummy", speakers=["clb"])
@raises(ValueError)
def __test_invalid_speaker():
data_source = cmu_arctic.WavFileDataSource("dummy", speakers=["test"])
@raises(RuntimeError)
def __test_nodir(data_source):
data_source.collect_files()
__test_invalid_speaker()
__test_nodir(data_source)
def build_from_path(in_dir, out_dir, num_workers=1, tqdm=lambda x: x):
executor = ProcessPoolExecutor(max_workers=num_workers)
futures = []
speakers = cmu_arctic.available_speakers
wd = cmu_arctic.WavFileDataSource(in_dir, speakers=speakers)
wav_paths = wd.collect_files()
speaker_ids = wd.labels
for index, (speaker_id, wav_path) in enumerate(
zip(speaker_ids, wav_paths)):
futures.append(executor.submit(
partial(_process_utterance, out_dir, index + 1, speaker_id, wav_path, "N/A")))
return [future.result() for future in tqdm(futures)]
def build_from_path(in_dir, out_dir, silence_threshold, fft_size, num_workers=1, tqdm=lambda x: x):
executor = ProcessPoolExecutor(max_workers=num_workers)
futures = []
speakers = cmu_arctic.available_speakers
wd = cmu_arctic.WavFileDataSource(in_dir, speakers=speakers)
wav_paths = wd.collect_files()
speaker_ids = wd.labels
for index, (speaker_id, wav_path) in enumerate(
zip(speaker_ids, wav_paths)):
futures.append(executor.submit(
partial(_process_utterance, out_dir, index + 1, speaker_id, wav_path, "N/A", silence_threshold, fft_size)))
return [future.result() for future in tqdm(futures)]
def build_from_path(in_dir, out_dir, num_workers=1, tqdm=lambda x: x):
executor = ProcessPoolExecutor(max_workers=num_workers)
futures = []
speakers = cmu_arctic.available_speakers
wd = cmu_arctic.WavFileDataSource(in_dir, speakers=speakers)
wav_paths = wd.collect_files()
speaker_ids = wd.labels
for index, (speaker_id, wav_path) in enumerate(
zip(speaker_ids, wav_paths)):
futures.append(executor.submit(
partial(_process_utterance, out_dir, index + 1, speaker_id, wav_path, "N/A")))
return [future.result() for future in tqdm(futures)]
def build_from_path(hparams, in_dir, out_dir, num_workers=1, tqdm=lambda x: x):
executor = ProcessPoolExecutor(max_workers=num_workers)
futures = []
speakers = cmu_arctic.available_speakers
wd = cmu_arctic.WavFileDataSource(in_dir, speakers=speakers)
wav_paths = wd.collect_files()
speaker_ids = wd.labels
for index, (speaker_id, wav_path) in enumerate(
zip(speaker_ids, wav_paths)):
futures.append(executor.submit(
partial(_process_utterance, out_dir, index + 1, speaker_id, wav_path, "N/A", hparams)))
return [future.result() for future in tqdm(futures)]