def fetch_sample_speech_ono(n_samples=None):
    """Load the "EKENWAY"/"PAIN" speech recordings found under ``ono_wav/``.

    Files are discovered with the glob pattern ``ono_wav/*wav`` (relative to
    the current working directory) and kept only when their path contains
    both the substrings ``"EKENWAY"`` and ``"PAIN"``.

    Parameters
    ----------
    n_samples : int or None
        Maximum number of matching files to load; ``None`` loads all of
        them. Files are taken in the order ``glob.glob`` returns them.

    Returns
    -------
    fs : int
        Always 8000, the sample rate the loaded signals are reported at.
    speech : list
        One array per loaded file: samples cast to float32, scaled by
        ``1 / 2 ** 15`` and then decimated.
    wav_names : list of str
        Every matching file path. NOTE: this list is *not* truncated to
        ``n_samples``, so it can be longer than ``speech``.
    """
    datapath = os.path.join("ono_wav", "*wav")
    wav_names = [w for w in glob.glob(datapath)
                 if "EKENWAY" in w and "PAIN" in w]

    # Bind the reported rate before the loop so that an empty match (or
    # n_samples=0) returns cleanly instead of raising UnboundLocalError.
    fs = 8000

    speech = []
    logger.info("Loading speech files...")
    for wav_name in wav_names[:n_samples]:
        # readwav presumably returns (sample rate, bit width, data); only the
        # data is used because the rate is reported as a fixed 8000 below.
        _, _, d = readwav(wav_name)
        # 24 bit but only 16 used???
        d = d.astype('float32') / (2 ** 15)
        # NOTE(review): if ``sg`` is scipy.signal, decimate() already keeps
        # only every 6th sample, so the trailing [::6] subsamples a second
        # time (36x overall) while fs is still reported as 8000. Behaviour is
        # kept as-is here; confirm against the source sample rate.
        d = sg.decimate(d, 6, ftype="fir")[::6]
        speech.append(d)
    return fs, speech, wav_names
# [web page residue] Comment list
# [web page residue] Table of contents