一个入门语音分离小菜鸡的日记
写此文的目的是记录自己的学习过程和一些经过,以及遇到的问题和解决问题的方法。存放在这里,方便自己以后复习和总结。如果此文对你有帮助,或者我写的有错误,请随时联系我。
今天晚上看代码,想通过简单的print把网络结构打印出来看看:
一来我的研究生老板要我讲给他听,
二来自己也要看懂,为了毕业。
notepad缩进,默认是tab
pycharm的缩进默认是四个空格
空格和tab不能混用(Python 3 中混用缩进会报 TabError: inconsistent use of tabs and spaces in indentation)
遇到不懂的地方先print出来看看是什么结构,很方便,慢慢就能学会怎么看代码、怎么看懂代码。
print之后紧接着用exit()退出程序,让程序只运行到这里。
后面修改一下,也许能投一篇自己的水文章。毕业要紧。哈哈哈哈
summary(nnet, tuple([32000]))
这句在我的笔记本上跑不动,后面我把这句注释掉了。改用print也可以打印出网络结构:
ConvTasNet(
(encoder_1d): Conv1D(1, 256, kernel_size=(20,), stride=(10,))
(ln): ChannelWiseLayerNorm((256,), eps=1e-05, elementwise_affine=True)
(proj): Conv1D(256, 256, kernel_size=(1,), stride=(1,))
(repeats): Sequential(
(0): Sequential(
(0): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(1,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(1): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(2): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(3): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(4): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(5): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(6): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(7): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
)
(1): Sequential(
(0): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(1,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(1): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(2): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(3): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(4): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(5): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(6): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(7): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
)
(2): Sequential(
(0): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(1,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(1): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(2): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(3): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(4): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(5): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(6): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(7): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
)
(3): Sequential(
(0): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(1,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(1): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(2): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(3): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(4): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(5): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(6): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
(7): Conv1DBlock(
(conv1x1): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(prelu1): PReLU(num_parameters=1)
(lnorm1): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(dconv): Conv1d(512, 512, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,), groups=512)
(prelu2): PReLU(num_parameters=1)
(lnorm2): ChannelWiseLayerNorm((512,), eps=1e-05, elementwise_affine=True)
(sconv): Conv1d(512, 256, kernel_size=(1,), stride=(1,))
)
)
)
(mask): Conv1D(256, 512, kernel_size=(1,), stride=(1,))
(decoder_1d): ConvTrans1D(256, 1, kernel_size=(20,), stride=(10,))
)
ConvTasNet #param: 8.75
torch.Size([4, 1000])