手写四维卷积:Python 与 C 实现

手写四维卷积:Python 与 C 实现

数据结构

数据:NHWC
权重:OIHW

C:

/*
 * Direct (naive) 2-D convolution over a 4-D blob.
 *
 * The input is first copied into a zero-filled scratch blob that is enlarged
 * by the padding on each side of H and W, then every kernel window is
 * accumulated into one output element.
 *
 * input    - source blob, accessed as (n, h, w, c) through blobGet.
 * output   - destination blob. Its n/h/w/c fields must already be set by the
 *            caller; they are read here to size the buffer. output->data is
 *            overwritten with a newly allocated, zero-initialised buffer that
 *            the caller owns. On allocation failure output->data is set to
 *            NULL and nothing else is written.
 * convInfo - stride, padding and kernel size.
 * param    - weights; param.n is used as the number of output channels.
 *
 * NOTE(review): wtGet is called with (oc, kernel row, kernel col, in-channel);
 * confirm that argument order matches how the weights are stored.
 * NOTE(review): strides are assumed to be positive; a zero stride would never
 * advance the window loops.
 */
void convOp(Blob input,Blob* output,conv_s convInfo, wtParam param){
    const int sh = convInfo.strideH, sw = convInfo.strideW;
    const int ph = convInfo.convPad.padH, pw = convInfo.convPad.padW;
    const int kh = convInfo.kernelH, kw = convInfo.kernelW;

    /* Scratch copy of the input with a zero border of ph rows / pw columns. */
    Blob padedblob;
    padedblob.n = input.n;
    padedblob.h = input.h + 2 * ph;
    padedblob.w = input.w + 2 * pw;
    padedblob.c = input.c;
    padedblob.dataFmt = input.dataFmt;
    padedblob.dataType = input.dataType;

    const size_t padCount = (size_t)padedblob.n * padedblob.h * padedblob.w * padedblob.c;
    /* calloc zero-fills, which provides the padding values for free. */
    padedblob.data = calloc(padCount, sizeof(float));
    if (padedblob.data == NULL && padCount != 0) {
        output->data = NULL;
        return;
    }

    /* Padding: copy the input into the interior of the scratch blob. */
    for (int n = 0; n < input.n; n++) {
        for (int c = 0; c < input.c; c++) {
            for (int h = 0; h < input.h; h++) {
                for (int w = 0; w < input.w; w++) {
                    blobSet(n, h + ph, w + pw, c, padedblob,
                            blobGet(n, h, w, c, input));
                }
            }
        }
    }

    const size_t outCount = (size_t)output->n * output->h * output->w * output->c;
    output->data = calloc(outCount, sizeof(float));
    if (output->data == NULL && outCount != 0) {
        /* Do not leak the scratch buffer on the failure path. */
        free(padedblob.data);
        return;
    }

    /* Convolution: slide the kernel over the padded blob. */
    for (int n = 0; n < padedblob.n; n++) {
        for (int oc = 0; oc < param.n; oc++) {
            /* (inh, inw) is the top-left corner of the current window. */
            for (int inh = 0; inh <= padedblob.h - kh; inh += sh) {
                for (int inw = 0; inw <= padedblob.w - kw; inw += sw) {
                    float sum = 0;
                    for (int inc = 0; inc < padedblob.c; inc++) {
                        for (int offx = 0; offx < kh; offx++) {
                            for (int offy = 0; offy < kw; offy++) {
                                sum += blobGet(n, inh + offx, inw + offy, inc, padedblob) *
                                       wtGet(oc, offx, offy, inc, param);
                            }
                        }
                    }
                    /* Window origin divided by the stride is the output coordinate. */
                    blobSet(n, inh / sh, inw / sw, oc, *output, sum);
                }
            }
        }
    }

    /* The padded copy is only needed during the computation. */
    free(padedblob.data);
}

Python:

def convOp(inblob, node_size, node_shape, param):
    """Compute a 2-D convolution of a batch of NHWC data with OIHW weights.

    Args:
        inblob: Input array indexed as (N, H, W, C).
        node_size: Shape of the output array, (N, out_H, out_W, O).
        node_shape: Sequence in which entry [2] is (stride_h, stride_w) and
            entry [3] is (pad_h, pad_w). The kernel extent is taken from the
            weights themselves, so entry [1] is not read.
        param: Sequence whose first element is the weight array laid out as
            (O, I, kernel_H, kernel_W).

    Returns:
        A float32 array of shape ``node_size``; every batch entry is
        convolved independently.
    """
    weights = param[0]
    sh = int(node_shape[2][0])
    sw = int(node_shape[2][1])
    ph = int(node_shape[3][0])
    pw = int(node_shape[3][1])

    if ph != 0 or pw != 0:
        # Zero padding: embed the input in a larger zero-filled array.
        newn = inblob.shape[0]
        newh = inblob.shape[1] + 2 * ph
        neww = inblob.shape[2] + 2 * pw
        newc = inblob.shape[3]
        paddedblob = np.zeros((newn, newh, neww, newc), dtype=np.float32)
        paddedblob[:, ph:ph + inblob.shape[1], pw:pw + inblob.shape[2], :] = inblob
    else:
        paddedblob = inblob

    outblob = np.zeros(tuple(node_size), dtype=np.float32)

    # Weights are OIHW while the data is NHWC. Transposing the weights to
    # OHWI lets one kernel (H, W, I) broadcast against a data window
    # (N, H, W, C). np.transpose returns a view, so this costs almost nothing.
    weights = np.transpose(weights, [0, 2, 3, 1])
    kh, kw = weights.shape[1], weights.shape[2]

    for oc in range(weights.shape[0]):  # O of weight
        kernel = weights[oc]
        for h in range(outblob.shape[1]):  # H of outblob
            top = h * sh
            for w in range(outblob.shape[2]):  # W of outblob
                left = w * sw
                window = paddedblob[:, top:top + kh, left:left + kw, :]
                # Reduce over kernel H, kernel W and channels only; summing
                # without an axis would also collapse the batch axis and
                # give every batch entry the same (wrong) total.
                outblob[:, h, w, oc] = np.sum(window * kernel, axis=(1, 2, 3))

    return outblob
  • 2
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值