语音处理-批量文件处理静默区删除

import fnmatch
from pathlib import Path

from scipy.io import wavfile
import webrtcvad
import struct
from scipy.io.wavfile import write
import os
import numpy as np
import matplotlib.pyplot as plt

#开始将所有文件进行批处理操作
def find_all_files(files_path):
    """遍历指定文件夹所有指定类型文件"""
    p = Path(files_path)
    files_names = []  # 存储文件路径名称
    for file in p.rglob('*.wav'):  # 寻找所有txt文件
        x = str(file).split('\\')[-1]
        if fnmatch.fnmatch(x, '._*.wav'):
            continue
        else:
            files_names.append(str(file))  # 以字符串形式保存

    return files_names


def all_void_void(single_file_path,flag_session):
    #single_file_path = 'F:\文件\情感数据集\未处理\IEMOCAP_full_release\Session1\sentences\wav\Ses01F_impro01\Ses01F_impro01_F013.wav'
    #single_file_path = 'E:\coding\python\pythonfor_deleteVD\Ses01F_impro01_F000.wav'
    print(os.path.join(single_file_path))
    sample_rate, samples = wavfile.read(os.path.join(single_file_path))
    file_name = single_file_path.split("\\")[-1]
    file_package = single_file_path.split("\\")[-2]
    print(file_name)
    vad = webrtcvad.Vad()
    vad.set_mode(3)
    raw_samples = struct.pack("%dh" % len(samples), *samples)
    window_duration = 0.03
    samples_per_window = int(window_duration * sample_rate + 0.3)
    bytes_per_sample = 2
    segments = []
    try:
        for start in np.arange(0, len(samples), samples_per_window):
            stop = min(start + samples_per_window, len(samples))
            is_speech = vad.is_speech(raw_samples[start * bytes_per_sample: stop * bytes_per_sample],
                                      sample_rate=sample_rate)
            segments.append(dict(
                start=start,
                stop=stop,
                is_speech=is_speech))
    except:
        try:
            speech_samples = np.concatenate(
                [samples[segment['start']:segment['stop']] for segment in segments if segment['is_speech']])
        except:
            print('产生异常了第一次')
    try:
        speech_samples = np.concatenate(
            [samples[segment['start']:segment['stop']] for segment in segments if segment['is_speech']])
        new_path = 'F:\文件\研究生组\情感数据集\已处理\IEMOCAP_full_release\\' + flag_session + '\sentences\wav\\' + file_package
        # os.makedirs(new_path)
        if (os.path.exists(new_path)):
            print('1')
        else:
            os.makedirs(new_path)
        new_path =new_path+ '\\'+file_name
        wavfile.write(new_path, sample_rate, speech_samples)
    except:
        print('产生异常了第二次')
    #new_path = 'F:\文件\研究生组\情感数据集\已处理\IEMOCAP_full_release\Session1\sentences\wav\\'+file_package
    # os.makedirs(new_path)
    # if(os.path.exists(new_path)):
    #     print('1')
    # else:
    #     os.makedirs(new_path)
    # new_path = new_path + '\\'+file_name
    # wavfile.write(new_path, sample_rate, speech_samples)
#Session_list =["Session1","Session2","Session3","Session4","Senssion5"]
Session_list =["Session5"]
for senssion_i in Session_list:
    files_name = find_all_files('F:\文件\情感数据集\未处理\IEMOCAP_full_release\\'+senssion_i+'\sentences\wav')
    for file_name in files_name:
        all_void_void(file_name,senssion_i)

  • 2
    点赞
  • 3
    收藏
    觉得还不错? 一键收藏
  • 5
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论 5
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值