【c++】OpenMP自动并行

ystraw_ah

已于 2024-06-26 15:12:12 修改

阅读量231

点赞数

分类专栏： c/c++ 文章标签： c++ omp 并行

于 2020-08-02 10:50:17 首次发布

本文链接：https://blog.csdn.net/qq_39451578/article/details/107741360

版权

c/c++ 专栏收录该内容

26 篇文章 1 订阅

订阅专栏

标题

自动并行相关技术
入门博客：
omp例子
- 嵌套并行操作
- 线程id

自动并行相关技术

文档教程：OpenMP（推荐！）。下面的几篇博客为此教程的翻译整理版本。
官网：OpenMP应用程序编程接口

入门博客：

omp例子

#include <iostream>
#include <omp.h>
#include <thread>

/**
 * Prints the size of the calling thread's current OpenMP team and the
 * calling thread's std::thread id, as two consecutive lines.
 *
 * The function is meant to be called from inside (possibly nested) parallel
 * regions, so several threads may execute it at the same time.
 *
 * @param level  Caller-chosen tag echoed in the first line so the call site
 *               can be recognised in the output.
 */
void report_num_threads(int level)
{
    // Gather the values outside the critical section; only the printing
    // itself needs to be serialized.
    const int team_size = omp_get_num_threads();
    const std::thread::id this_id = std::this_thread::get_id();

    // The report consists of two separate output operations. Without mutual
    // exclusion, lines produced by different threads get interleaved and a
    // "Current thread ID" line can no longer be matched to its "Level" line.
    #pragma omp critical
    {
        printf("Level %d: number of threads in the team: %d\n",
               level, team_size);
        std::cout << " Current thread ID: " << this_id << std::endl;
    }
}

/**
 * Nested-parallelism demo.
 *
 * Prints the nesting flag before and after enabling it, then runs an outer
 * parallel loop whose single iteration starts an inner parallel loop that
 * counts its own iterations. report_num_threads() is called at each stage so
 * the team size at that point shows up in the output. Finally the elapsed
 * wall-clock time is printed.
 */
int main() {
    // NOTE: omp_get_nested()/omp_set_nested() are deprecated since OpenMP 5.0
    // in favour of omp_get_max_active_levels()/omp_set_max_active_levels().
    // They are kept because this demo prints the value of the nesting flag.
    bool is_nested = omp_get_nested();
    std::cout<<"是否支持并行嵌套：" << is_nested << "\n";
    omp_set_nested(1); // allow parallel regions inside parallel regions
    is_nested = omp_get_nested();
    std::cout<<"是否支持并行嵌套：" << is_nested << "\n";

    // Default team size for every parallel region that has no num_threads
    // clause; a region with an explicit num_threads clause uses its own value.
    omp_set_num_threads(4);

    const double start_time = omp_get_wtime();

    for (int j = 0; j < 1; j++) {
        // Add num_threads(N) to this pragma to override the default team size.
        #pragma omp parallel for
        for (int i = 0; i < 1; ++i) {
            std::cout << "Thread " << omp_get_thread_num() << ": "  << std::endl;
            int sum = 0;
            report_num_threads(1);

            // `sum` is updated by every thread of the inner team. The
            // reduction clause gives each thread a private partial sum and
            // combines them at the end; a plain shared `sum = sum + 1` is a
            // data race and can lose increments.
            // Add num_threads(N) here to size the inner team explicitly.
            #pragma omp parallel for reduction(+:sum)
            for (int k = 0; k < 10; ++k) {
                sum += 1;
                report_num_threads(2);
            }

            report_num_threads(3);
            std::cout << "Thread " << omp_get_thread_num()
                      << " sum=" << sum
                      << std::endl;
        }
    }

    // Outside every parallel region.
    report_num_threads(4);
    const double end_time = omp_get_wtime();
    std::cout << "Time taken: " << end_time - start_time << " seconds" << std::endl;

    return 0;
}

// cmd: g++ -fopenmp -o sum_openmp openmp_test.cpp && ./sum_openmp

/*
output（注意：以下输出的格式与上面程序中的打印语句不一致，应是该示例早期版本的运行结果，仅供参考）:
ID: 0, Max threads: 52, Num threads: 1 
ID: 0, Max threads: 5, Num threads: 1 
ID: 0, Max threads: 5, Num threads: 5 
ID: 4, Max threads: 5, Num threads: 5 
ID: 2, Max threads: 5, Num threads: 5 
ID: 1, Max threads: 5, Num threads: 5 
ID: 3, Max threads: 5, Num threads: 5 
ID: 0, Max threads: 5, Num threads: 1 
ID: 0, Max threads: 6, Num threads: 1 


ID: 0, Max threads: 6, Num threads: 6 
ID: 3, Max threads: 6, Num threads: 6 
ID: 1, Max threads: 6, Num threads: 6 
ID: 4, Max threads: 6, Num threads: 6 
ID: 2, Max threads: 6, Num threads: 6 
*/

嵌套并行操作

嵌套并行操作
例子：

#include <iostream>
#include <omp.h>

/**
 * Prints one line with the size of the calling thread's current OpenMP team.
 *
 * @param level  Caller-chosen tag echoed in the line so the call site can be
 *               recognised in the output.
 */
void report_num_threads(int level)
{
    // A single printf call emits the whole line.
    const int team_size = omp_get_num_threads();
    printf("Level %d: number of threads in the team: %d\n", level, team_size);
}

/**
 * Nested-parallelism demo with explicit team sizes.
 *
 * Prints the nesting flag before and after enabling it, then runs a
 * two-iteration outer parallel loop (num_threads(4)); each iteration starts a
 * three-iteration inner parallel loop (num_threads(16)) that counts its own
 * iterations. report_num_threads() is called at each stage so the team size
 * at that point shows up in the output. Finally the elapsed wall-clock time
 * is printed.
 */
int main() {
    // NOTE: omp_get_nested()/omp_set_nested() are deprecated since OpenMP 5.0
    // in favour of omp_get_max_active_levels()/omp_set_max_active_levels().
    // They are kept because this demo prints the value of the nesting flag.
    bool is_nested = omp_get_nested();
    std::cout<<"是否支持并行嵌套：" << is_nested << "\n";
    omp_set_nested(1); // allow parallel regions inside parallel regions
    is_nested = omp_get_nested();
    std::cout<<"是否支持并行嵌套：" << is_nested << "\n";

    // Default team size for parallel regions without a num_threads clause.
    omp_set_num_threads(4);

    const double start_time = omp_get_wtime();

    for (int j = 0; j < 1; j++) {
        #pragma omp parallel for num_threads(4)
        for (int i = 0; i < 2; ++i) {
            // Two outer threads reach this point concurrently. A chained
            // `<<` expression is several separate writes, so it is guarded
            // to keep each message on its own line.
            #pragma omp critical
            std::cout << "Thread " << omp_get_thread_num() << ": "  << std::endl;

            int sum = 0;
            report_num_threads(1);

            // `sum` is updated by every thread of the inner team. The
            // reduction clause gives each thread a private partial sum and
            // combines them at the end; a plain shared `sum = sum + 1` is a
            // data race and can lose increments.
            #pragma omp parallel for num_threads(16) reduction(+:sum)
            for (int k = 0; k < 3; ++k) {
                sum += 1;
                report_num_threads(2);
            }

            report_num_threads(3);

            #pragma omp critical
            std::cout << "Thread " << omp_get_thread_num()
                      << " sum=" << sum
                      << std::endl;
        }
    }

    // Outside every parallel region.
    report_num_threads(4);
    const double end_time = omp_get_wtime();
    std::cout << "Time taken: " << end_time - start_time << " seconds" << std::endl;

    return 0;
}

// cmd: g++ -fopenmp -o sum_openmp openmp_test.cpp && ./sum_openmp

/*
是否支持并行嵌套：0
是否支持并行嵌套：1
Thread 0: Thread 
1: 
Level 1: number of threads in the team: 4
Level 1: number of threads in the team: 4
Level 2: number of threads in the team: 16
Level 2: number of threads in the team: 16
Level 2: number of threads in the team: 16
Level 2: number of threads in the team: 16
Level 2: number of threads in the team: 16
Level 2: number of threads in the team: 16
Level 3: number of threads in the team: 4
Thread 1 sum=3
Level 3: number of threads in the team: 4
Thread 0 sum=3
Level 4: number of threads in the team: 1
Time taken: 0.000629196 seconds*/

线程id

#include <iostream>
#include <omp.h>
#include <thread>

/**
 * Prints one line describing the calling thread: the caller's tag, the size
 * of the current OpenMP team, the thread's std::thread id and its OpenMP
 * thread number.
 *
 * The function is meant to be called from inside a parallel region, so
 * several threads may execute it at the same time.
 *
 * @param level  Caller-chosen tag echoed at the start of the line (the demo
 *               passes the loop index).
 */
void report_num_threads(int level)
{
    const int team_size = omp_get_num_threads();
    const std::thread::id thread_id1 = std::this_thread::get_id(); // C++ thread id
    const int thread_id2 = omp_get_thread_num();                   // OpenMP thread number

    // std::thread::id is a class type, so handing it to printf for a "%d"
    // conversion is undefined behaviour. It is streamed with its own
    // operator<< instead; the printed form of the id is implementation-defined.
    // The chained `<<` is several separate writes, hence the critical section
    // to keep each thread's line intact.
    // The run of spaces before "Current thread ID" reproduces the spacing the
    // previous format string produced.
    #pragma omp critical
    {
        std::cout << "Level " << level
                  << ": number of threads in the team: " << team_size
                  << "             Current thread ID: " << thread_id1
                  << ", id2=" << thread_id2 << '\n';
    }
}

 // 

/**
 * Thread-id demo: runs the same ten-iteration loop twice, first with a team
 * of 4 threads and then with a team of 10, calling report_num_threads() with
 * the loop index in every iteration.
 */
int main() {
    const int kIterations = 10; // trip count shared by both passes

    // Pass 1: team of four threads.
    std::cout << "------------ thread_num=4 ----------" << std::endl;
    #pragma omp parallel for num_threads(4)
    for (int iter = 0; iter < kIterations; ++iter) {
        report_num_threads(iter);
    }

    // Pass 2: team of ten threads.
    std::cout << "------------ thread_num=10 ----------" << std::endl;
    #pragma omp parallel for num_threads(10)
    for (int iter = 0; iter < kIterations; ++iter) {
        report_num_threads(iter);
    }

    return 0;
}

// cmd: g++ -fopenmp -o sum_openmp openmp_test.cpp && ./sum_openmp

output:

------------ thread_num=4 ----------
Level 0: number of threads in the team: 4             Current thread ID: 789157824, id2=0
Level 1: number of threads in the team: 4             Current thread ID: 789157824, id2=0
Level 2: number of threads in the team: 4             Current thread ID: 789157824, id2=0
Level 6: number of threads in the team: 4             Current thread ID: 780760832, id2=2
Level 7: number of threads in the team: 4             Current thread ID: 780760832, id2=2
Level 8: number of threads in the team: 4             Current thread ID: 772368128, id2=3
Level 9: number of threads in the team: 4             Current thread ID: 772368128, id2=3
Level 3: number of threads in the team: 4             Current thread ID: 789153536, id2=1
Level 4: number of threads in the team: 4             Current thread ID: 789153536, id2=1
Level 5: number of threads in the team: 4             Current thread ID: 789153536, id2=1
------------ thread_num=10 ----------
Level 0: number of threads in the team: 10             Current thread ID: 789157824, id2=0
Level 8: number of threads in the team: 10             Current thread ID: 730404608, id2=8
Level 3: number of threads in the team: 10             Current thread ID: 772368128, id2=3
Level 2: number of threads in the team: 10             Current thread ID: 780760832, id2=2
Level 7: number of threads in the team: 10             Current thread ID: 738797312, id2=7
Level 9: number of threads in the team: 10             Current thread ID: 722011904, id2=9
Level 6: number of threads in the team: 10             Current thread ID: 747190016, id2=6
Level 5: number of threads in the team: 10             Current thread ID: 755582720, id2=5
Level 4: number of threads in the team: 10             Current thread ID: 763975424, id2=4
Level 1: number of threads in the team: 10             Current thread ID: 789153536, id2=1