x.mean(dim=0, keepdim=True)
keepdim=True
表示保留被求均值的那个维度(其大小变为 1),因此输出张量的维数与输入相同;例如沿 dim=0 求均值时,形状 [2, N] 变为 [1, N],而不是 [N]。
waveform, source_sr = torchaudio.load("4.wav")
waveform
tensor([[0.0000, 0.0000, 0.0000,  ..., 0.0016, 0.0016, 0.0012],
        [0.0000, 0.0000, 0.0000,  ..., 0.0019, 0.0019, 0.0020]])
waveform.mean(0, True)
tensor([[0.0000, 0.0000, 0.0000,  ..., 0.0017, 0.0017, 0.0016]])