# This script works like sox's silence-removal command; it is implemented here with pydub.
import os
import sys
import numpy as np
from pydub import AudioSegment
# Frame length used when scanning audio: trim_silence slices the loaded
# AudioSegment in steps of N (pydub indexes segments in milliseconds).
N=20
def usage():
    """Print the one-line command synopsis to standard output."""
    synopsis = "batch_trim_silence <speech path>"
    print(synopsis)
def trim_silence(f):
    """Remove silent frames from the audio file at *f*, rewriting it in place.

    The file is loaded with pydub and scanned in consecutive frames of ``N``
    slice units (the last frame may be shorter).  A frame is dropped when its
    peak level (``max_dBFS``) is below -30 dBFS; once the first silent frame
    has been found, the threshold is lowered to -40 dBFS for the rest of the
    file.  If at least one frame was dropped, the kept frames are written
    back to *f* as headerless raw sample bytes.  A file in which no silent
    frame is found is left untouched.

    Args:
        f: Path of the audio file to process.  It is overwritten when
            silence is found.
    """
    # NOTE(review): sample_width/frame_rate/channels describe headerless PCM;
    # presumably the inputs are raw 16-bit 8 kHz mono files -- confirm that
    # pydub picks the raw decoder for the file names used in practice.
    speech = AudioSegment.from_file(
        file=f, sample_width=2, frame_rate=8000, channels=1)

    kept = []
    found_silence = False
    # Step over the whole segment, including the final (possibly partial)
    # frame, so that a rewritten file never loses its tail.
    for index, start in enumerate(range(0, len(speech), N)):
        frame = speech[start:start + N]
        level = frame.max_dBFS  # computed once per frame
        print("frame {}: dB: {}".format(index, level))
        # The threshold drops from -30 to -40 after the first silent frame.
        threshold = -40 if found_silence else -30
        if level < threshold:
            found_silence = True
        else:
            kept.append(frame.raw_data)

    if found_silence:
        # The audio is already fully in memory, so truncating f is safe here.
        with open(f, 'wb') as out:
            out.write(b"".join(kept))
        print("========trimed file ", f)
# Script body: expects exactly one command-line argument, the directory whose
# files should be trimmed.
if len(sys.argv) != 2:
    usage()
    # sys.exit rather than exit(): the latter is injected by the site module
    # for interactive sessions and is not guaranteed to exist in programs.
    sys.exit(-1)

work_path = sys.argv[1]

# Walk the whole tree and process every file found; files are modified in place.
for root, _dirs, files in os.walk(work_path):
    for name in files:
        trim_silence(os.path.join(root, name))