非异常安全
#include <numeric>
#include <iterator>
#include <thread>
#include <vector>
#include <functional>
template<typename Iterator, typename T>
struct accumulate_block
{
void operator()(Iterator first, Iterator last, T &result)
{
result = std::accumulate(first, last, result);
}
};
template<typename Iterator, typename T>
T parallel_accumulate(Iterator first, Iterator last, T init)
{
const unsigned long length = std::distance(first, last);
if (!length)
{
return init;
}
const unsigned long min_per_thread = 25;
const unsigned long max_threads = (length + min_per_thread - 1) / min_per_thread;
const unsigned long hardware_threads = std::thread::hardware_concurrency();
const unsigned long num_threads = std::min(hardware_threads != 0 ? hardware_threads : 2, max_threads);
const unsigned long block_size = length / num_threads;
std::vector<T> results(num_threads);
std::vector<std::thread> threads(num_threads);
Iterator block_start = first;
for (unsigned long i = 0; i < (num_threads - 1); ++i)
{
Iterator block_end = block_start;
std::advance(block_end, block_size);
threads.at(i) = \
std::thread(accumulate_block<Iterator, T>(), \
block_start, block_end, \
std::ref(results.at(i)));
block_start = block_end;
}
accumulate_block()(block_start, last, results.at(num_threads - 1));
std::for_each(threads.begin(), threads.end(), std::mem_fn(&std::thread::join));
return std::accumulate(results.begin(), results.end(), init);
}
异常安全版本
#include <numeric>
#include <future>
#include <vector>
#include <functional>
#include <thread>
template<typename Iterator, typename T>
struct accumulate_block
{
T operator()(Iterator first, Iterator last)
{
return std::accumulate(first, last, T());
}
};
template<typename Iterator, typename T>
T parallel_accumulate(Iterator first, Iterator last, T init)
{
const unsigned long length = std::distance(first, last);
if (!length)
{
return init;
}
const unsigned long min_pre_thread = 25;
const unsigned long max_threads =
(length + min_pre_thread - 1) / min_pre_thread;
const unsigned long hadrware_threads = std::thread::hardware_concurrency();
const unsigned long num_threads =
std::min(hadrware_threads != 0 ? hadrware_threads : 2, max_threads);
const unsigned long block_size = length / num_threads;
std::vector<std::future<T>> futures(num_threads - 1);
std::vector<std::thread> threads(num_threads - 1);
Iterator block_start = first;
for (unsigned long i = 0; i < num_threads - 1; ++i)
{
Iterator block_end = block_start;
std::advance(block_end, block_size);
std::packaged_task<T(Iterator, Iterator)> task(accumulate_block<Iterator, T>());
futures.at(i) = task.get_future();
threads.at(i) = std::thread(std::move(task), block_start, block_end);
block_start = block_end;
}
T last_result = accumulate_block()(block_start, last);
std::for_each(threads.begin(), threads.end(), std::mem_fn(&std::thread::join));
T result = init;
for (unsigned long i = 0; i < num_threads - 1; ++i)
{
result += futures.at(i).get();
}
result += last_result;
return result;
}