1、利用python_speech_features库编写MFCC特征提取,生成40维的mfcc向量
import scipy.io.wavfile as wavfile
from python_speech_features import mfcc, delta
def read_wave_data(filename):
"""获取语音文件信息: sample_rate:帧速率 signal:数据的矩阵形式 """
fs, wavsignal = wavfile.read(filename) # 声音文件数据的矩阵形式
return fs, wavsignal
def extract_mfcc( wav_arr, sample_rate):
mfcc_feat = mfcc(wav_arr, sample_rate)
energy = np.sqrt(wav_arr)
mfcc_feat = np.stack(mfcc_feat, energy)
delta1 = delta(mfcc_feat, 1)
delta2 = delta(delta1, 1)
mfcc_feat = np.stack(mfcc_feat, delta1, delta2)
return mfcc_feat.T
2、利用librosa库编写mfcc特征提取
import librosa
wavsignal,fs = librosa.load(filename)
mfccs = librosa.feature.mfcc(wavsignal , sr=fs)
return mfccs
3、python代码直接编写mfcc特征提取模块
import numpy
import scipy.io.wavfile
from matplotlib imp