def fetch_sample_speech_walla(n_samples=None):
    """Load the local "walla" recordings as fixed-length, downsampled chunks.

    Globs ``walla_wav/*wav`` relative to the current working directory,
    reads at most ``n_samples`` of the matching files with ``readwav``,
    converts the samples to float32 scaled by ``1 / 2 ** 15``, cuts each
    recording into consecutive 16000-sample chunks (a trailing partial
    chunk is dropped) and downsamples every chunk.

    Parameters
    ----------
    n_samples : int or None
        Maximum number of files to read; ``None`` reads every match.
        This bounds the number of files, not the number of returned chunks.

    Returns
    -------
    fs : int
        Sample rate reported for the returned chunks; always 8000.
    speech : list
        One downsampled array per chunk.
    wav_names : list of str
        For each entry of ``speech``, the path of the file it was cut from.

    Raises
    ------
    ValueError
        If no file is selected (nothing matches the glob pattern, or
        ``n_samples`` is 0). Previously this surfaced as an
        ``UnboundLocalError`` on ``fs`` at the ``return`` statement.
    """
    chunk_len = 16000  # samples per chunk, counted before downsampling
    max_chunks = 200   # stop opening further files once exceeded
    out_fs = 8000      # rate the chunks are labelled with after downsampling

    datapath = os.path.join("walla_wav", "*wav")
    names = glob.glob(datapath)[:n_samples]
    if not names:
        raise ValueError("No wav files to load from %r (n_samples=%r)"
                         % (datapath, n_samples))

    speech = []
    wav_names = []
    logger.info("Loading speech files...")
    for name in names:
        # The file's own rate is deliberately not propagated: letting it
        # overwrite the returned value made the result depend on whether
        # the last file read happened to be long enough to yield a chunk.
        _native_fs, _bitw, d = readwav(name)
        # Presumably the data is 16-bit PCM, so this maps it to [-1, 1)
        # -- TODO confirm against readwav.
        d = d.astype('float32') / (2 ** 15)
        inds = np.arange(0, len(d), chunk_len)
        for i, j in zip(inds[:-1], inds[1:]):
            # NOTE(review): assuming `sg` is scipy.signal, decimate(..., 2)
            # already halves the rate, and the extra [::2] halves it again
            # with no additional anti-alias filter (4x overall). The 8 kHz
            # label is therefore only right for 32 kHz input -- confirm.
            dij = sg.decimate(d[i:j], 2, ftype="iir")[::2]
            speech.append(dij)
            wav_names.append(name)
        # Checked once per file, so slightly more than max_chunks chunks
        # can be returned. NOTE(review): the source's indentation was lost;
        # this placement in the per-file loop is a reconstruction.
        if len(speech) > max_chunks:
            break
    return out_fs, speech, wav_names
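# (web page residue, not code) 评论列表 -- "comment list"
# (web page residue, not code) 文章目录 -- "article table of contents"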