矩阵乘法逐步加速演示

矩阵乘法

#include<iostream>
#include<ctime>
using namespace std;
// Baseline benchmark: multiplies two n x n matrices (row-major, flat arrays)
// with the textbook i-j-k loop order and prints the elapsed time of the
// multiplication in milliseconds.
int main() {
    const int n = 1000;
    double* a = new double[n*n];
    double* b = new double[n*n];
    double* c = new double[n*n];

    // Both operands get the same contents: element (i, j) = i + j.
    for (int i = 0; i < n; ++i)
        for (int j = 0; j < n; ++j) {
            a[i*n + j] = i + j;
            b[i*n + j] = i + j;
        }

    const auto tic = std::clock();
    for (int i = 0; i < n; ++i)
        for (int j = 0; j < n; ++j) {
            double s = 0.0;
            // Row i of a times column j of b; the b access has stride n.
            for (int k = 0; k < n; ++k)
                s += a[i*n + k] * b[k*n + j];
            c[i*n + j] = s;
        }
    const auto toc = std::clock() - tic;

    // Read the result back so an optimizer cannot treat the timed loop as
    // dead stores and remove the work being measured.
    double checksum = 0.0;
    for (int idx = 0; idx < n*n; ++idx)
        checksum += c[idx];
    volatile double sink = checksum;
    (void)sink;

    // clock() counts ticks; CLOCKS_PER_SEC ticks make one second.
    std::cout << toc * 1000.0 / CLOCKS_PER_SEC << '\n';

    delete[] a;
    delete[] b;
    delete[] c;
}

耗时 1600ms

将后一个矩阵(b)转置

#include<iostream>
#include<ctime>
using namespace std;
// Benchmark variant that reads the second operand row by row: the inner
// loop uses b[j*n + k], i.e. it treats b as already transposed, so both
// operands are traversed contiguously. Strictly this computes a * b^T; it
// equals a * b here because b (element (i, j) = i + j) is symmetric.
// Prints the elapsed time of the multiplication in milliseconds.
int main() {
    const int n = 1000;
    double* a = new double[n*n];
    double* b = new double[n*n];
    double* c = new double[n*n];

    // Both operands get the same contents: element (i, j) = i + j.
    for (int i = 0; i < n; ++i)
        for (int j = 0; j < n; ++j) {
            a[i*n + j] = i + j;
            b[i*n + j] = i + j;
        }

    const auto tic = std::clock();
    for (int i = 0; i < n; ++i)
        for (int j = 0; j < n; ++j) {
            double s = 0.0;
            // Dot product of row i of a with row j of b (unit stride in both).
            for (int k = 0; k < n; ++k)
                s += a[i*n + k] * b[j*n + k];
            c[i*n + j] = s;
        }
    const auto toc = std::clock() - tic;

    // Read the result back so an optimizer cannot treat the timed loop as
    // dead stores and remove the work being measured.
    double checksum = 0.0;
    for (int idx = 0; idx < n*n; ++idx)
        checksum += c[idx];
    volatile double sink = checksum;
    (void)sink;

    // clock() counts ticks; CLOCKS_PER_SEC ticks make one second.
    std::cout << toc * 1000.0 / CLOCKS_PER_SEC << '\n';

    delete[] a;
    delete[] b;
    delete[] c;
}

耗时 960ms

循环展开2个乘积

#include<iostream>
#include<ctime>
using namespace std;
// Benchmark variant: row-by-row access to both operands (b is read as if
// transposed, which is valid here because b is symmetric) with the inner
// dot-product loop unrolled to handle two products per iteration.
// Prints the elapsed time of the multiplication in milliseconds.
int main() {
    const int n = 1000;
    double* a = new double[n*n];
    double* b = new double[n*n];
    double* c = new double[n*n];

    // Both operands get the same contents: element (i, j) = i + j.
    for (int i = 0; i < n; ++i)
        for (int j = 0; j < n; ++j) {
            a[i*n + j] = i + j;
            b[i*n + j] = i + j;
        }

    const auto tic = std::clock();
    for (int i = 0; i < n; ++i)
        for (int j = 0; j < n; ++j) {
            double s = 0.0;
            int k = 0;
            // Unrolled by 2; stop while a full pair is still inside the row.
            for (; k + 1 < n; k += 2)
                s += a[i*n + k] * b[j*n + k] +
                     a[i*n + k + 1] * b[j*n + k + 1];
            // Leftover element when n is odd (never runs for n = 1000);
            // without it the unrolled loop would read past the row end.
            for (; k < n; ++k)
                s += a[i*n + k] * b[j*n + k];
            c[i*n + j] = s;
        }
    const auto toc = std::clock() - tic;

    // Read the result back so an optimizer cannot treat the timed loop as
    // dead stores and remove the work being measured.
    double checksum = 0.0;
    for (int idx = 0; idx < n*n; ++idx)
        checksum += c[idx];
    volatile double sink = checksum;
    (void)sink;

    // clock() counts ticks; CLOCKS_PER_SEC ticks make one second.
    std::cout << toc * 1000.0 / CLOCKS_PER_SEC << '\n';

    delete[] a;
    delete[] b;
    delete[] c;
}

耗时 560 ms

循环展开4个乘积

#include<iostream>
#include<ctime>
using namespace std;
// Benchmark variant: row-by-row access to both operands (b is read as if
// transposed, which is valid here because b is symmetric), row offsets
// hoisted out of the inner loop, and the dot product unrolled to four
// products per iteration.
// Prints the elapsed time of the multiplication in milliseconds.
int main() {
    const int n = 1000;
    double* a = new double[n*n];
    double* b = new double[n*n];
    double* c = new double[n*n];

    // Both operands get the same contents: element (i, j) = i + j.
    for (int i = 0; i < n; ++i)
        for (int j = 0; j < n; ++j) {
            a[i*n + j] = i + j;
            b[i*n + j] = i + j;
        }

    const auto tic = std::clock();
    for (int i = 0; i < n; ++i) {
        const int rowA = i * n;  // start of row i in a (and in c)
        for (int j = 0; j < n; ++j) {
            const int rowB = j * n;  // start of row j in b
            double s = 0.0;
            int k = 0;
            // Unrolled by 4; stop while a full group is still inside the row.
            for (; k + 3 < n; k += 4)
                s += a[rowA + k] * b[rowB + k] +
                     a[rowA + k + 1] * b[rowB + k + 1] +
                     a[rowA + k + 2] * b[rowB + k + 2] +
                     a[rowA + k + 3] * b[rowB + k + 3];
            // Leftover elements when n is not a multiple of 4 (never runs
            // for n = 1000); without it the unrolled loop would read past
            // the row end.
            for (; k < n; ++k)
                s += a[rowA + k] * b[rowB + k];
            c[rowA + j] = s;
        }
    }
    const auto toc = std::clock() - tic;

    // Read the result back so an optimizer cannot treat the timed loop as
    // dead stores and remove the work being measured.
    double checksum = 0.0;
    for (int idx = 0; idx < n*n; ++idx)
        checksum += c[idx];
    volatile double sink = checksum;
    (void)sink;

    // clock() counts ticks; CLOCKS_PER_SEC ticks make one second.
    std::cout << toc * 1000.0 / CLOCKS_PER_SEC << '\n';

    delete[] a;
    delete[] b;
    delete[] c;
}

耗时 480 ms

蛇形顺序

#include<iostream>
#include<ctime>
using namespace std;
// Benchmark variant: 4-way unrolled dot products over rows of a and rows of
// b (b is read as if transposed, which is valid here because b is
// symmetric), visiting the output columns in serpentine order: ascending j
// on even rows i, descending j on odd rows i, so each row starts with the
// rows of b that the previous row touched last.
// Prints the elapsed time of the multiplication in milliseconds.
int main() {
    const int n = 1000;
    double* a = new double[n*n];
    double* b = new double[n*n];
    double* c = new double[n*n];

    // Both operands get the same contents: element (i, j) = i + j.
    for (int i = 0; i < n; ++i)
        for (int j = 0; j < n; ++j) {
            a[i*n + j] = i + j;
            b[i*n + j] = i + j;
        }

    const auto tic = std::clock();
    for (int i = 0; i < n; ++i) {
        const int rowA = i * n;  // start of row i in a (and in c)
        const bool forward = (i % 2 == 0);
        for (int step = 0; step < n; ++step) {
            // Even rows walk j = 0..n-1, odd rows walk j = n-1..0.
            const int j = forward ? step : n - 1 - step;
            const int rowB = j * n;  // start of row j in b
            double s = 0.0;
            int k = 0;
            // Unrolled by 4; stop while a full group is still inside the row.
            for (; k + 3 < n; k += 4)
                s += a[rowA + k] * b[rowB + k] +
                     a[rowA + k + 1] * b[rowB + k + 1] +
                     a[rowA + k + 2] * b[rowB + k + 2] +
                     a[rowA + k + 3] * b[rowB + k + 3];
            // Leftover elements when n is not a multiple of 4 (never runs
            // for n = 1000); without it the unrolled loop would read past
            // the row end.
            for (; k < n; ++k)
                s += a[rowA + k] * b[rowB + k];
            c[rowA + j] = s;
        }
    }
    const auto toc = std::clock() - tic;

    // Read the result back so an optimizer cannot treat the timed loop as
    // dead stores and remove the work being measured.
    double checksum = 0.0;
    for (int idx = 0; idx < n*n; ++idx)
        checksum += c[idx];
    volatile double sink = checksum;
    (void)sink;

    // clock() counts ticks; CLOCKS_PER_SEC ticks make one second.
    std::cout << toc * 1000.0 / CLOCKS_PER_SEC << '\n';

    delete[] a;
    delete[] b;
    delete[] c;
}

耗时 430 ms

注: Visual C++ 2017, Release, Intel(R) Core(TM) i7-8700K CPU 3.7 GHz

  • 0
    点赞
  • 9
    收藏
    觉得还不错? 一键收藏
  • 1
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论 1
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值