// Extracted from: grppi/0.3.1/parallel__execution__native_8h_source.html

 #ifndef GRPPI_NATIVE_PARALLEL_EXECUTION_NATIVE_H
 #define GRPPI_NATIVE_PARALLEL_EXECUTION_NATIVE_H

 #include "worker_pool.h"
 #include "../common/mpmc_queue.h"
 #include "../common/iterator.h"
 #include "../common/execution_traits.h"

 #include <thread>
 #include <atomic>
 #include <algorithm>
 #include <vector>
 #include <type_traits>
 #include <tuple>
 #include <experimental/optional>

 namespace grppi {

 /// Registry that maps the threads taking part in an execution to indices.
 ///
 /// Every operation spins on an atomic flag while it reads or modifies the
 /// list of registered thread ids, so the members may be called from several
 /// threads at once.
 class thread_registry {
 public:
   thread_registry() noexcept = default;

   /// Appends the id of the calling thread to the registry.
   void register_thread() noexcept;

   /// Clears the slot held by the calling thread.
   /// Does nothing when the calling thread is not currently registered.
   void deregister_thread() noexcept;

   /// Returns the position of the calling thread's slot, or the number of
   /// slots when the calling thread is not registered.
   int current_index() const noexcept;

 private:
   // Spin lock guarding ids_; mutable so that current_index() can be const.
   mutable std::atomic_flag lock_ = ATOMIC_FLAG_INIT;
   // One slot per registration; a default-constructed id marks a freed slot.
   std::vector<std::thread::id> ids_;
 };

 inline void thread_registry::register_thread() noexcept
 {
   using namespace std;
   while (lock_.test_and_set(memory_order_acquire)) {}
   ids_.push_back(this_thread::get_id());
   lock_.clear(memory_order_release);
 }

 inline void thread_registry::deregister_thread() noexcept
 {
   using namespace std;
   while (lock_.test_and_set(memory_order_acquire)) {}
   auto current = find(begin(ids_), end(ids_), this_thread::get_id());
   // A thread that never registered (or already deregistered) yields end();
   // writing through it would be undefined behaviour.
   if (current != end(ids_)) {
     *current = {}; //Empty thread
   }
   lock_.clear(memory_order_release);
 }

 inline int thread_registry::current_index() const noexcept
 {
   using namespace std;
   while (lock_.test_and_set(memory_order_acquire)) {}
   auto current = find(begin(ids_), end(ids_), this_thread::get_id());
   const auto index = distance(begin(ids_), current);
   lock_.clear(memory_order_release);
   // distance() yields a ptrdiff_t; make the narrowing explicit.
   return static_cast<int>(index);
 }

 /// Scoped registration of the calling thread in a thread_registry.
 ///
 /// The constructor registers the current thread and the destructor
 /// deregisters it again.
 class native_thread_manager {
 public:
   native_thread_manager(thread_registry & registry)
       : registry_(registry)
   {
     registry_.register_thread();
   }

   ~native_thread_manager()
   {
     registry_.deregister_thread();
   }

 private:
   // Held by reference and used again in the destructor, so the registry
   // must outlive this manager.
   thread_registry & registry_;
 };

 /// Execution policy that runs the GrPPI patterns on native threads.
 ///
 /// Stores the concurrency degree, the ordering flag and the attributes of
 /// the queues created for pipeline stages, together with a registry of the
 /// threads currently working on behalf of this policy.
 class parallel_execution_native {
 public:

   /// Default policy: ordered, with a concurrency degree of twice the
   /// hardware concurrency.
   /// hardware_concurrency() may return 0 when the value is not computable,
   /// so the degree is clamped to at least 1; the data patterns divide the
   /// sequence size by it.
   parallel_execution_native() noexcept :
       parallel_execution_native{
           std::max(1, static_cast<int>(2 * std::thread::hardware_concurrency())),
           true}
   {}

   /// Builds a policy with the given concurrency degree and ordering flag.
   parallel_execution_native(int concurrency_degree, bool ordering=true) noexcept :
     concurrency_degree_{concurrency_degree},
     ordering_{ordering}
   {}

   /// Copies the configuration of another policy.
   /// The thread registry is not copied: the new policy starts with an
   /// empty one. Queue attributes are carried over so that a copy creates
   /// the same kind of queues as the original.
   parallel_execution_native(const parallel_execution_native & ex) :
       parallel_execution_native{ex.concurrency_degree_, ex.ordering_}
   {
     queue_size_ = ex.queue_size_;
     queue_mode_ = ex.queue_mode_;
   }

   /// Sets the concurrency degree used by subsequent pattern executions.
   void set_concurrency_degree(int degree) noexcept { concurrency_degree_ = degree; }

   /// Returns the current concurrency degree.
   int concurrency_degree() const noexcept { return concurrency_degree_; }

   /// Turns the ordering flag on.
   void enable_ordering() noexcept { ordering_=true; }

   /// Turns the ordering flag off.
   void disable_ordering() noexcept { ordering_=false; }

   /// Tells whether the ordering flag is set.
   bool is_ordered() const noexcept { return ordering_; }

   /// Returns a manager that registers the calling thread in this policy's
   /// registry and deregisters it on destruction.
   native_thread_manager thread_manager() const {
     return native_thread_manager{thread_registry_};
   }

   /// Returns the registry index of the calling thread.
   int get_thread_id() const noexcept {
     return thread_registry_.current_index();
   }

   /// Sets the size and mode used for queues created by make_queue().
   void set_queue_attributes(int size, queue_mode mode) noexcept {
     queue_size_ = size;
     queue_mode_ = mode;
   }

   /// Creates a queue of T built from the configured size and mode.
   template <typename T>
   mpmc_queue<T> make_queue() const {
     return {queue_size_, queue_mode_};
   }

   /// Output-queue selection when the next argument already is a queue:
   /// that queue is returned by reference and used as the stage output.
   template <typename T, typename ... Transformers>
   mpmc_queue<T>& get_output_queue(mpmc_queue<T> & queue, Transformers && ...) const {
     return queue;
   }

   /// Output-queue selection for the remaining cases: a new queue is made.
   /// The prvalue is returned directly; wrapping it in std::move would only
   /// inhibit copy elision.
   template <typename T, typename ... Transformers>
   mpmc_queue<T> get_output_queue(Transformers && ...) const{
     return make_queue<T>();
   }

   /// Applies transform_op to sequence_size elements starting at the
   /// iterators in firsts and writes the results starting at first_out.
   template <typename ... InputIterators, typename OutputIterator,
             typename Transformer>
   void map(std::tuple<InputIterators...> firsts,
       OutputIterator first_out,
       std::size_t sequence_size, Transformer transform_op) const;

   /// Combines sequence_size elements starting at first with combine_op.
   template <typename InputIterator, typename Identity, typename Combiner>
   auto reduce(InputIterator first, std::size_t sequence_size,
               Identity && identity, Combiner && combine_op) const;

   /// Transforms sequence_size elements with transform_op and combines the
   /// transformed values with combine_op.
   template <typename ... InputIterators, typename Identity,
             typename Transformer, typename Combiner>
   auto map_reduce(std::tuple<InputIterators...> firsts,
                   std::size_t sequence_size,
                   Identity && identity,
                   Transformer && transform_op, Combiner && combine_op) const;

   /// Runs a stencil over sequence_size elements, handing transform_op and
   /// neighbour_op to the sequential stencil of each chunk.
   template <typename ... InputIterators, typename OutputIterator,
             typename StencilTransformer, typename Neighbourhood>
   void stencil(std::tuple<InputIterators...> firsts, OutputIterator first_out,
                std::size_t sequence_size,
                StencilTransformer && transform_op,
                Neighbourhood && neighbour_op) const;

   /// Divide/conquer without an explicit base-case predicate (deprecated).
   template <typename Input, typename Divider, typename Solver, typename Combiner>
   [[deprecated("Use new interface with predicate argument")]]
   auto divide_conquer(Input && input,
                       Divider && divide_op,
                       Solver && solve_op,
                       Combiner && combine_op) const;

   /// Divide/conquer where predicate_op decides whether a problem is solved
   /// directly by solve_op.
   template <typename Input, typename Divider, typename Predicate, typename Solver, typename Combiner>
   auto divide_conquer(Input && input,
                       Divider && divide_op,
                       Predicate && predicate_op,
                       Solver && solve_op,
                       Combiner && combine_op) const;


   /// Runs a pipeline fed by generate_op and followed by transform_ops.
   template <typename Generator, typename ... Transformers>
   void pipeline(Generator && generate_op,
                 Transformers && ... transform_ops) const;

   /// Runs a single stage that reads from input_queue and writes to
   /// output_queue; forwards to the private do_pipeline overload.
   template <typename InputType, typename Transformer, typename OutputType>
   void pipeline(mpmc_queue<InputType> & input_queue, Transformer && transform_op,
                 mpmc_queue<OutputType> &output_queue) const
   {
     do_pipeline(input_queue, std::forward<Transformer>(transform_op), output_queue);
   }

 private:

   // Recursive divide/conquer workers. num_threads is the shared counter of
   // threads that may still be launched.
   template <typename Input, typename Divider, typename Solver, typename Combiner>
   auto divide_conquer(Input && input,
                       Divider && divide_op,
                       Solver && solve_op,
                       Combiner && combine_op,
                       std::atomic<int> & num_threads) const;

   template <typename Input, typename Divider,typename Predicate, typename Solver, typename Combiner>
   auto divide_conquer(Input && input,
                       Divider && divide_op,
                       Predicate && predicate_op,
                       Solver && solve_op,
                       Combiner && combine_op,
                       std::atomic<int> & num_threads) const;


   // do_pipeline overload set. Overloads are selected through the
   // requires_* constraints on the stage type. Every overload taking a
   // pattern object by lvalue reference forwards to the matching overload
   // taking it by rvalue reference.

   // Last stage: a plain callable consuming the items of input_queue.
   template <typename Queue, typename Consumer,
             requires_no_pattern<Consumer> = 0>
   void do_pipeline(Queue & input_queue, Consumer && consume_op) const;

   // Single stage between two existing queues.
   template <typename Inqueue, typename Transformer, typename output_type,
             requires_no_pattern<Transformer> = 0>
   void do_pipeline(Inqueue & input_queue, Transformer && transform_op,
       mpmc_queue<output_type> & output_queue) const;

   // Called when the next "stage" is a queue of the same type: nothing to do.
   template <typename T, typename ... Others>
   void do_pipeline(mpmc_queue<T> & in_q, mpmc_queue<T> & same_queue, Others &&... ops) const
   { }

   // No stages left: nothing to do.
   template <typename T>
   void do_pipeline(mpmc_queue<T> & in_q) const {}


   // Intermediate stage: a plain callable followed by further stages.
   template <typename Queue, typename Transformer, typename ... OtherTransformers,
             requires_no_pattern<Transformer> = 0>
   void do_pipeline(Queue & input_queue, Transformer && transform_op,
       OtherTransformers && ... other_ops) const;

   // Farm as last stage (lvalue form).
   template <typename Queue, typename FarmTransformer,
             template <typename> class Farm,
             requires_farm<Farm<FarmTransformer>> = 0>
   void do_pipeline(Queue & input_queue,
       Farm<FarmTransformer> & farm_obj) const
   {
     do_pipeline(input_queue, std::move(farm_obj));
   }

   // Farm as last stage.
   template <typename Queue, typename FarmTransformer,
             template <typename> class Farm,
             requires_farm<Farm<FarmTransformer>> = 0>
   void do_pipeline( Queue & input_queue,
       Farm<FarmTransformer> && farm_obj) const;

   // Context stage (a transformer bound to its own execution policy).
   template <typename Queue, typename Execution, typename Transformer,
             template <typename, typename> class Context,
             typename ... OtherTransformers,
             requires_context<Context<Execution,Transformer>> = 0>
   void do_pipeline(Queue & input_queue, Context<Execution,Transformer> && context_op,
        OtherTransformers &&... other_ops) const;

   // Context stage (lvalue form).
   template <typename Queue, typename Execution, typename Transformer,
             template <typename, typename> class Context,
             typename ... OtherTransformers,
             requires_context<Context<Execution,Transformer>> = 0>
   void do_pipeline(Queue & input_queue, Context<Execution,Transformer> & context_op,
        OtherTransformers &&... other_ops) const
   {
     do_pipeline(input_queue, std::move(context_op),
       std::forward<OtherTransformers>(other_ops)...);
   }

   // Farm followed by further stages (lvalue form).
   template <typename Queue, typename FarmTransformer,
             template <typename> class Farm,
             typename ... OtherTransformers,
             requires_farm<Farm<FarmTransformer>> = 0>
   void do_pipeline(Queue & input_queue,
       Farm<FarmTransformer> & farm_obj,
       OtherTransformers && ... other_transform_ops) const
   {
     do_pipeline(input_queue, std::move(farm_obj),
         std::forward<OtherTransformers>(other_transform_ops)...);
   }

   // Farm followed by further stages.
   template <typename Queue, typename FarmTransformer,
             template <typename> class Farm,
             typename ... OtherTransformers,
             requires_farm<Farm<FarmTransformer>> = 0>
   void do_pipeline(Queue & input_queue,
       Farm<FarmTransformer> && farm_obj,
       OtherTransformers && ... other_transform_ops) const;

   // Filter followed by further stages (lvalue form).
   template <typename Queue, typename Predicate,
             template <typename> class Filter,
             typename ... OtherTransformers,
             requires_filter<Filter<Predicate>> =0>
   void do_pipeline(Queue & input_queue,
       Filter<Predicate> & filter_obj,
       OtherTransformers && ... other_transform_ops) const
   {
     do_pipeline(input_queue, std::move(filter_obj),
         std::forward<OtherTransformers>(other_transform_ops)...);
   }

   // Filter followed by further stages.
   template <typename Queue, typename Predicate,
             template <typename> class Filter,
             typename ... OtherTransformers,
             requires_filter<Filter<Predicate>> =0>
   void do_pipeline(Queue & input_queue,
       Filter<Predicate> && farm_obj,
       OtherTransformers && ... other_transform_ops) const;

   // Reduce followed by further stages (lvalue form).
   template <typename Queue, typename Combiner, typename Identity,
             template <typename C, typename I> class Reduce,
             typename ... OtherTransformers,
             requires_reduce<Reduce<Combiner,Identity>> = 0>
   void do_pipeline(Queue && input_queue, Reduce<Combiner,Identity> & reduce_obj,
                    OtherTransformers && ... other_transform_ops) const
   {
     do_pipeline(input_queue, std::move(reduce_obj),
         std::forward<OtherTransformers>(other_transform_ops)...);
   }

   // Reduce followed by further stages.
   template <typename Queue, typename Combiner, typename Identity,
             template <typename C, typename I> class Reduce,
             typename ... OtherTransformers,
             requires_reduce<Reduce<Combiner,Identity>> = 0>
   void do_pipeline(Queue && input_queue, Reduce<Combiner,Identity> && reduce_obj,
                    OtherTransformers && ... other_transform_ops) const;

   // Iteration over a plain transformer (lvalue form).
   template <typename Queue, typename Transformer, typename Predicate,
             template <typename T, typename P> class Iteration,
             typename ... OtherTransformers,
             requires_iteration<Iteration<Transformer,Predicate>> =0,
             requires_no_pattern<Transformer> =0>
   void do_pipeline(Queue & input_queue, Iteration<Transformer,Predicate> & iteration_obj,
                    OtherTransformers && ... other_transform_ops) const
   {
     do_pipeline(input_queue, std::move(iteration_obj),
         std::forward<OtherTransformers>(other_transform_ops)...);
   }

   // Iteration over a plain transformer.
   template <typename Queue, typename Transformer, typename Predicate,
             template <typename T, typename P> class Iteration,
             typename ... OtherTransformers,
             requires_iteration<Iteration<Transformer,Predicate>> =0,
             requires_no_pattern<Transformer> =0>
   void do_pipeline(Queue & input_queue, Iteration<Transformer,Predicate> && iteration_obj,
                    OtherTransformers && ... other_transform_ops) const;

   // Iteration whose transformer is itself a pipeline.
   template <typename Queue, typename Transformer, typename Predicate,
             template <typename T, typename P> class Iteration,
             typename ... OtherTransformers,
             requires_iteration<Iteration<Transformer,Predicate>> =0,
             requires_pipeline<Transformer> =0>
   void do_pipeline(Queue & input_queue, Iteration<Transformer,Predicate> && iteration_obj,
                    OtherTransformers && ... other_transform_ops) const;


   // Nested pipeline as last stage (lvalue form).
   template <typename Queue, typename ... Transformers,
             template <typename...> class Pipeline,
             requires_pipeline<Pipeline<Transformers...>> = 0>
   void do_pipeline(Queue & input_queue,
       Pipeline<Transformers...> & pipeline_obj) const
   {
     do_pipeline(input_queue, std::move(pipeline_obj));
   }

   // Nested pipeline as last stage.
   template <typename Queue, typename ... Transformers,
             template <typename...> class Pipeline,
             requires_pipeline<Pipeline<Transformers...>> = 0>
   void do_pipeline(Queue & input_queue,
       Pipeline<Transformers...> && pipeline_obj) const;

   // Nested pipeline followed by further stages (lvalue form).
   template <typename Queue, typename ... Transformers,
             template <typename...> class Pipeline,
             typename ... OtherTransformers,
             requires_pipeline<Pipeline<Transformers...>> = 0>
   void do_pipeline(Queue & input_queue,
       Pipeline<Transformers...> & pipeline_obj,
       OtherTransformers && ... other_transform_ops) const
   {
     do_pipeline(input_queue, std::move(pipeline_obj),
         std::forward<OtherTransformers>(other_transform_ops)...);
   }

   // Nested pipeline followed by further stages.
   template <typename Queue, typename ... Transformers,
             template <typename...> class Pipeline,
             typename ... OtherTransformers,
             requires_pipeline<Pipeline<Transformers...>> = 0>
   void do_pipeline(Queue & input_queue,
       Pipeline<Transformers...> && pipeline_obj,
       OtherTransformers && ... other_transform_ops) const;

   // Helper taking the stages of a nested pipeline as a tuple plus the
   // index sequence used to address them.
   template <typename Queue, typename ... Transformers,
             std::size_t ... I>
   void do_pipeline_nested(
       Queue & input_queue,
       std::tuple<Transformers...> && transform_ops,
       std::index_sequence<I...>) const;

 private:
   // Mutable so that const member functions can register worker threads.
   mutable thread_registry thread_registry_;

   int concurrency_degree_;
   bool ordering_;

   // Size given to queues unless set_queue_attributes() changes it.
   constexpr static int default_queue_size = 100;
   int queue_size_ = default_queue_size;

   queue_mode queue_mode_ = queue_mode::blocking;
 };

 template <typename E>
 constexpr bool is_parallel_execution_native() {
   return std::is_same<E, parallel_execution_native>::value;
 }

 // Trait specializations for parallel_execution_native: each one reports
 // true for the policy itself or for one pattern it can run.

 // The native policy is available.
 template <>
 constexpr bool is_supported<parallel_execution_native>() { return true; }

 // map pattern.
 template <>
 constexpr bool supports_map<parallel_execution_native>() { return true; }

 // reduce pattern.
 template <>
 constexpr bool supports_reduce<parallel_execution_native>() { return true; }

 // map/reduce pattern.
 template <>
 constexpr bool supports_map_reduce<parallel_execution_native>() { return true; }

 // stencil pattern.
 template <>
 constexpr bool supports_stencil<parallel_execution_native>() { return true; }

 // divide/conquer pattern.
 template <>
 constexpr bool supports_divide_conquer<parallel_execution_native>() { return true; }

 // pipeline pattern.
 template <>
 constexpr bool supports_pipeline<parallel_execution_native>() { return true; }

 /// Applies transform_op to sequence_size elements and stores the results.
 ///
 /// The sequence is split into concurrency_degree_ chunks. All chunks but
 /// the last are handed to a worker pool; the last chunk, which also takes
 /// the remainder of the division, runs on the calling thread.
 ///
 /// @param firsts        Tuple with the first iterator of every input range.
 /// @param first_out     Iterator to the first output position.
 /// @param sequence_size Number of elements to process.
 /// @param transform_op  Operation applied to the dereferenced inputs.
 ///
 /// NOTE: the chunk size is sequence_size / concurrency_degree_, so the
 /// concurrency degree must not be zero.
 template <typename ... InputIterators, typename OutputIterator,
           typename Transformer>
 void parallel_execution_native::map(
     std::tuple<InputIterators...> firsts,
     OutputIterator first_out,
     std::size_t sequence_size, Transformer transform_op) const
 {
   using namespace std;

   auto process_chunk =
     [&transform_op](auto fins, std::size_t size, auto fout)
   {
     const auto l = next(get<0>(fins), size);
     while (get<0>(fins)!=l) {
       // transform_op is reused for every element and by every chunk, so it
       // is passed as an lvalue instead of being cast to an rvalue each time.
       *fout++ = apply_deref_increment(transform_op, fins);
     }
   };

   // Kept as std::size_t (as in reduce and stencil) so that long sequences
   // are neither truncated nor overflow in the delta computation below.
   const auto chunk_size = sequence_size / concurrency_degree_;

   {
     worker_pool workers{concurrency_degree_};
     for (int i=0; i!=concurrency_degree_-1; ++i) {
       const auto delta = chunk_size * i;
       const auto chunk_firsts = iterators_next(firsts,delta);
       const auto chunk_first_out = next(first_out, delta);
       workers.launch(*this, process_chunk, chunk_firsts, chunk_size, chunk_first_out);
     }

     // Last chunk: processed here and extended with the division remainder.
     const auto delta = chunk_size * (concurrency_degree_ - 1);
     const auto chunk_firsts = iterators_next(firsts,delta);
     const auto chunk_first_out = next(first_out, delta);
     process_chunk(chunk_firsts, sequence_size - delta, chunk_first_out);
   } // Pool synch
 }

 /// Combines sequence_size elements starting at first.
 ///
 /// Each of the concurrency_degree_ chunks is reduced sequentially into its
 /// own slot of partial_results (the last chunk, including the division
 /// remainder, on the calling thread); the partial results are then reduced
 /// sequentially, starting from the result of the first chunk.
 ///
 /// @param first         Iterator to the first element.
 /// @param sequence_size Number of elements to combine.
 /// @param identity      Initial value used for every chunk.
 /// @param combine_op    Binary combination operation.
 /// @return The result of the final sequential reduction.
 ///
 /// NOTE: concurrency_degree_ is used as divisor and as number of partial
 /// results, so it must be at least 1.
 template <typename InputIterator, typename Identity, typename Combiner>
 auto parallel_execution_native::reduce(
     InputIterator first, std::size_t sequence_size,
     Identity && identity,
     Combiner && combine_op) const
 {
   using result_type = std::decay_t<Identity>;
   std::vector<result_type> partial_results(concurrency_degree_);

   constexpr sequential_execution seq;
   auto process_chunk = [&](InputIterator f, std::size_t sz, std::size_t id) {
     // identity and combine_op are shared by all chunks, which may run
     // concurrently: pass them as lvalues so no chunk can move from them.
     partial_results[id] = seq.reduce(f, sz, identity, combine_op);
   };

   const auto chunk_size = sequence_size / concurrency_degree_;

   {
     worker_pool workers{concurrency_degree_};
     for (int i=0; i<concurrency_degree_-1; ++i) {
       const auto delta = chunk_size * i;
       const auto chunk_first = std::next(first,delta);
       workers.launch(*this, process_chunk, chunk_first, chunk_size, i);
     }

     // Last chunk: processed here and extended with the division remainder.
     const auto delta = chunk_size * (concurrency_degree_-1);
     const auto chunk_first = std::next(first, delta);
     const auto chunk_sz = sequence_size - delta;
     process_chunk(chunk_first, chunk_sz, concurrency_degree_-1);
   } // Pool synch

   // The first partial result seeds the combination of the remaining ones.
   return seq.reduce(std::next(partial_results.begin()),
       partial_results.size()-1, std::forward<result_type>(partial_results[0]),
       std::forward<Combiner>(combine_op));
 }

 /// Transforms sequence_size elements and combines the transformed values.
 ///
 /// Each of the concurrency_degree_ chunks runs a sequential map/reduce into
 /// its own slot of partial_results (the last chunk, including the division
 /// remainder, on the calling thread); the partial results are then reduced
 /// sequentially, starting from the result of the first chunk.
 ///
 /// @param firsts        Tuple with the first iterator of every input range.
 /// @param sequence_size Number of elements to process.
 /// @param identity      Initial value used for every chunk.
 /// @param transform_op  Operation applied to the dereferenced inputs.
 /// @param combine_op    Binary combination operation.
 /// @return The result of the final sequential reduction.
 ///
 /// NOTE: concurrency_degree_ is used as divisor and as number of partial
 /// results, so it must be at least 1.
 template <typename ... InputIterators, typename Identity,
           typename Transformer, typename Combiner>
 auto parallel_execution_native::map_reduce(
     std::tuple<InputIterators...> firsts,
     std::size_t sequence_size,
     Identity && identity,
     Transformer && transform_op, Combiner && combine_op) const
 {
   using result_type = std::decay_t<Identity>;
   std::vector<result_type> partial_results(concurrency_degree_);

   constexpr sequential_execution seq;
   auto process_chunk = [&](auto f, std::size_t sz, std::size_t id) {
     // Every chunk starts from the caller's identity (as reduce() does), not
     // from the value-initialized slot, which is wrong for e.g. a product.
     // The operands are shared by all chunks, so they are passed as lvalues.
     partial_results[id] = seq.map_reduce(f, sz,
         identity, transform_op, combine_op);
   };

   const auto chunk_size = sequence_size / concurrency_degree_;

   {
     worker_pool workers{concurrency_degree_};
     for(int i=0;i<concurrency_degree_-1;++i){
       const auto delta = chunk_size * i;
       const auto chunk_firsts = iterators_next(firsts,delta);
       workers.launch(*this, process_chunk, chunk_firsts, chunk_size, i);
     }

     // Last chunk: processed here and extended with the division remainder.
     const auto delta = chunk_size * (concurrency_degree_-1);
     const auto chunk_firsts = iterators_next(firsts, delta);
     process_chunk(chunk_firsts, sequence_size - delta, concurrency_degree_-1);
   } // Pool synch

   // The first partial result seeds the combination of the remaining ones.
   return seq.reduce(std::next(partial_results.begin()),
      partial_results.size()-1, std::forward<result_type>(partial_results[0]),
      std::forward<Combiner>(combine_op));
 }

 /// Runs the stencil pattern over sequence_size elements.
 ///
 /// The range is cut into concurrency_degree_ pieces; every piece is handled
 /// by the sequential stencil. All pieces except the final one go to the
 /// worker pool, and the final one (which absorbs the division remainder) is
 /// evaluated by the caller before the pool is destroyed.
 template <typename ... InputIterators, typename OutputIterator,
           typename StencilTransformer, typename Neighbourhood>
 void parallel_execution_native::stencil(
     std::tuple<InputIterators...> firsts, OutputIterator first_out,
     std::size_t sequence_size,
     StencilTransformer && transform_op,
     Neighbourhood && neighbour_op) const
 {
   constexpr sequential_execution seq;

   // Sequential stencil over one piece of the input.
   auto run_piece =
     [&transform_op, &neighbour_op, seq](auto piece_ins, std::size_t piece_len,
                                         auto piece_out)
   {
     seq.stencil(piece_ins, piece_out, piece_len,
       std::forward<StencilTransformer>(transform_op),
       std::forward<Neighbourhood>(neighbour_op));
   };

   const auto piece_size = sequence_size / concurrency_degree_;
   const int last_piece = concurrency_degree_ - 1;
   {
     worker_pool workers{concurrency_degree_};

     for (int piece = 0; piece != last_piece; ++piece) {
       const auto offset = piece_size * piece;
       const auto piece_firsts = iterators_next(firsts, offset);
       const auto piece_out = std::next(first_out, offset);
       workers.launch(*this, run_piece, piece_firsts, piece_size, piece_out);
     }

     // Final piece on the calling thread, remainder included.
     const auto offset = piece_size * (concurrency_degree_ - 1);
     const auto piece_firsts = iterators_next(firsts, offset);
     const auto piece_out = std::next(first_out, offset);
     run_piece(piece_firsts, sequence_size - offset, piece_out);
   } // Pool synch
 }

 /// Public entry point of the predicate-less divide/conquer.
 ///
 /// Creates the counter of threads that may still be launched (one less than
 /// the concurrency degree) and delegates to the recursive private overload.
 template <typename Input, typename Divider, typename Solver, typename Combiner>
 auto parallel_execution_native::divide_conquer(
     Input && problem,
     Divider && divide_op,
     Solver && solve_op,
     Combiner && combine_op) const
 {
   std::atomic<int> spare_threads{concurrency_degree_ - 1};

   return divide_conquer(
       std::forward<Input>(problem),
       std::forward<Divider>(divide_op),
       std::forward<Solver>(solve_op),
       std::forward<Combiner>(combine_op),
       spare_threads);
 }


 /// Public entry point of the divide/conquer with a base-case predicate.
 ///
 /// Creates the counter of threads that may still be launched (one less than
 /// the concurrency degree) and delegates to the recursive private overload.
 template <typename Input, typename Divider,typename Predicate, typename Solver, typename Combiner>
 auto parallel_execution_native::divide_conquer(
     Input && problem,
     Divider && divide_op,
     Predicate && predicate_op,
     Solver && solve_op,
     Combiner && combine_op) const
 {
   std::atomic<int> spare_threads{concurrency_degree_ - 1};

   return divide_conquer(
       std::forward<Input>(problem),
       std::forward<Divider>(divide_op),
       std::forward<Predicate>(predicate_op),
       std::forward<Solver>(solve_op),
       std::forward<Combiner>(combine_op),
       spare_threads);
 }

 /// Runs a pipeline whose items come from generate_op.
 ///
 /// A dedicated thread calls generate_op repeatedly and pushes every result,
 /// paired with its sequence number, into the first queue. It stops after
 /// pushing a result that evaluates to false, so that item also reaches the
 /// queue. The remaining stages run through do_pipeline on the calling
 /// thread, which finally joins the generator thread.
 template <typename Generator, typename ... Transformers>
 void parallel_execution_native::pipeline(
     Generator && generate_op,
     Transformers && ... transform_ops) const
 {
   using namespace std;
   using generated_type = decay_t<typename result_of<Generator()>::type>;
   using queue_item_type = pair<generated_type,long>;
   auto first_queue = make_queue<queue_item_type>();

   thread producer([&,this]() {
     auto manager = thread_manager();

     for (long sequence_number = 0; ; ++sequence_number) {
       auto item{generate_op()};
       first_queue.push(make_pair(item, sequence_number));
       if (!item) { break; }
     }
   });

   do_pipeline(first_queue, forward<Transformers>(transform_ops)...);
   producer.join();
 }

 // PRIVATE MEMBERS

 /// Recursive step of the predicate-less divide/conquer.
 ///
 /// - With no spare threads left, the whole problem is solved sequentially.
 /// - Otherwise the input is divided; one subproblem or fewer means a base
 ///   case, handled by solve_op.
 /// - Subproblems after the first are launched on the worker pool while
 ///   spare threads remain; any left over are solved sequentially here.
 /// - The first subproblem is solved recursively on the calling thread and
 ///   seeds the final combination of the partial results.
 ///
 /// @param num_threads Shared counter of threads that may still be launched;
 ///                    decremented once per launched subproblem.
 template <typename Input, typename Divider, typename Solver, typename Combiner>
 auto parallel_execution_native::divide_conquer(
     Input && input,
     Divider && divide_op,
     Solver && solve_op,
     Combiner && combine_op,
     std::atomic<int> & num_threads) const
 {
   constexpr sequential_execution seq;
   if (num_threads.load() <=0) {
     return seq.divide_conquer(std::forward<Input>(input),
         std::forward<Divider>(divide_op), std::forward<Solver>(solve_op),
         std::forward<Combiner>(combine_op));
   }

   auto subproblems = divide_op(std::forward<Input>(input));
   if (subproblems.size()<=1) { return solve_op(std::forward<Input>(input)); }

   using subresult_type =
       std::decay_t<typename std::result_of<Solver(Input)>::type>;
   // One slot per subproblem except the first, which is solved below.
   std::vector<subresult_type> partials(subproblems.size()-1);

   auto process_subproblem = [&,this](auto it, std::size_t div) {
     partials[div] = this->divide_conquer(std::forward<Input>(*it),
         std::forward<Divider>(divide_op), std::forward<Solver>(solve_op),
         std::forward<Combiner>(combine_op), num_threads);
   };

   int division = 0;

   worker_pool workers{num_threads.load()};
   auto i = subproblems.begin() + 1;
   while (i!=subproblems.end() && num_threads.load()>0) {
     workers.launch(*this,process_subproblem, i++, division++);
     num_threads--;
   }

   // Subproblems that did not get a thread. The slot index has to advance
   // together with the iterator; otherwise every result would overwrite the
   // same slot and the remaining slots would stay value-initialized.
   while (i!=subproblems.end()) {
     partials[division++] = seq.divide_conquer(std::forward<Input>(*i++),
         std::forward<Divider>(divide_op), std::forward<Solver>(solve_op),
         std::forward<Combiner>(combine_op));
   }

   auto subresult = divide_conquer(std::forward<Input>(*subproblems.begin()),
       std::forward<Divider>(divide_op), std::forward<Solver>(solve_op),
       std::forward<Combiner>(combine_op), num_threads);

   // All launched subproblems must have stored their partial result.
   workers.wait();

   return seq.reduce(partials.begin(), partials.size(),
       std::forward<subresult_type>(subresult), std::forward<Combiner>(combine_op));
 }

 /// Recursive step of the divide/conquer with a base-case predicate.
 ///
 /// - With no spare threads left, the whole problem is solved sequentially.
 /// - Otherwise predicate_op decides whether the input is a base case,
 ///   which solve_op handles directly; if not, the input is divided.
 /// - Subproblems after the first are launched on the worker pool while
 ///   spare threads remain; any left over are solved sequentially here.
 /// - The first subproblem is solved recursively on the calling thread and
 ///   seeds the final combination of the partial results.
 ///
 /// @param num_threads Shared counter of threads that may still be launched;
 ///                    decremented once per launched subproblem.
 ///
 /// NOTE: partials is sized subproblems.size()-1, so divide_op is expected
 /// to return at least one subproblem.
 template <typename Input, typename Divider,typename Predicate, typename Solver, typename Combiner>
 auto parallel_execution_native::divide_conquer(
     Input && input,
     Divider && divide_op,
     Predicate && predicate_op,
     Solver && solve_op,
     Combiner && combine_op,
     std::atomic<int> & num_threads) const
 {
   constexpr sequential_execution seq;
   if (num_threads.load() <=0) {
     return seq.divide_conquer(std::forward<Input>(input),
         std::forward<Divider>(divide_op),
         std::forward<Predicate>(predicate_op),
         std::forward<Solver>(solve_op),
         std::forward<Combiner>(combine_op));
   }

   if (predicate_op(input)) { return solve_op(std::forward<Input>(input)); }
   auto subproblems = divide_op(std::forward<Input>(input));

   using subresult_type =
       std::decay_t<typename std::result_of<Solver(Input)>::type>;
   // One slot per subproblem except the first, which is solved below.
   std::vector<subresult_type> partials(subproblems.size()-1);

   auto process_subproblem = [&,this](auto it, std::size_t div) {
     partials[div] = this->divide_conquer(std::forward<Input>(*it),
         std::forward<Divider>(divide_op), std::forward<Predicate>(predicate_op),
         std::forward<Solver>(solve_op),
         std::forward<Combiner>(combine_op), num_threads);
   };

   int division = 0;

   worker_pool workers{num_threads.load()};
   auto i = subproblems.begin() + 1;
   while (i!=subproblems.end() && num_threads.load()>0) {
     workers.launch(*this,process_subproblem, i++, division++);
     num_threads--;
   }

   // Subproblems that did not get a thread. The slot index has to advance
   // together with the iterator; otherwise every result would overwrite the
   // same slot and the remaining slots would stay value-initialized.
   while (i!=subproblems.end()) {
     partials[division++] = seq.divide_conquer(std::forward<Input>(*i++),
         std::forward<Divider>(divide_op), std::forward<Predicate>(predicate_op), std::forward<Solver>(solve_op),
         std::forward<Combiner>(combine_op));
   }

   auto subresult = divide_conquer(std::forward<Input>(*subproblems.begin()),
       std::forward<Divider>(divide_op), std::forward<Predicate>(predicate_op), std::forward<Solver>(solve_op),
       std::forward<Combiner>(combine_op), num_threads);

   // All launched subproblems must have stored their partial result.
   workers.wait();

   return seq.reduce(partials.begin(), partials.size(),
       std::forward<subresult_type>(subresult), std::forward<Combiner>(combine_op));
 }
 /// Last pipeline stage: feeds every item of input_queue to consume_op.
 ///
 /// Items are (optional value, order) pairs and an empty optional ends the
 /// stream. Without ordering, items are consumed as they arrive. With
 /// ordering, an item is consumed only when its order equals the next
 /// expected one; items arriving early are buffered. After each arrival at
 /// most one buffered item is released, and the buffer is drained once the
 /// stream has ended.
 template <typename Queue, typename Consumer,
           requires_no_pattern<Consumer>>
 void parallel_execution_native::do_pipeline(
     Queue & input_queue,
     Consumer && consume_op) const
 {
   using namespace std;
   using gen_value_type = typename Queue::value_type;
   using input_value_type = typename gen_value_type::first_type;

   auto manager = thread_manager();

   if (!is_ordered()) {
     while (true) {
       auto item = input_queue.pop();
       if (!item.first) { break; }
       consume_op(*item.first);
     }
     return;
   }

   vector<gen_value_type> pending;
   long next_order = 0;

   // Consumes and removes the buffered item carrying next_order, if there
   // is one; otherwise leaves the buffer untouched.
   auto release_next_pending = [&]() {
     auto pos = find_if(pending.begin(), pending.end(),
         [&](const gen_value_type & entry) {
           return entry.second == next_order;
         });
     if (pos != pending.end()) {
       consume_op(*pos->first);
       pending.erase(pos);
       next_order++;
     }
   };

   while (true) {
     auto item = input_queue.pop();
     if (!item.first) { break; }
     if (item.second == next_order) {
       consume_op(*item.first);
       next_order++;
     }
     else {
       pending.push_back(item);
     }
     release_next_pending();
   }

   // Drain what is still buffered after the end of the stream.
   while (!pending.empty()) {
     release_next_pending();
   }
 }


 /// Single stage connecting two existing queues.
 ///
 /// Pops (optional value, order) pairs from input_queue until one with an
 /// empty optional arrives, applies transform_op to every value and pushes
 /// the result to output_queue with the order of its input. The terminating
 /// item is not forwarded by this function.
 template <typename Inqueue, typename Transformer, typename output_type,
             requires_no_pattern<Transformer>>
 void parallel_execution_native::do_pipeline(Inqueue & input_queue, Transformer && transform_op,
       mpmc_queue<output_type> & output_queue) const
 {
   using namespace std;
   using namespace experimental;

   using input_item_type = typename Inqueue::value_type;
   using input_item_value_type = typename input_item_type::first_type::value_type;

   using output_optional_type = typename output_type::first_type;
   using output_item_value_type = typename output_type::first_type::value_type;

   while (true) {
     auto incoming{input_queue.pop()};
     if (!incoming.first) { break; }
     auto transformed = output_item_value_type{transform_op(*incoming.first)};
     output_queue.push(make_pair(transformed, incoming.second));
   }
 }


 /// Intermediate stage: a plain callable followed by further stages.
 ///
 /// A new thread pops items from input_queue, applies transform_op and
 /// pushes each result, with the order of its input, to the output queue
 /// obtained from get_output_queue(). When an item with an empty optional
 /// arrives, the thread pushes an empty item with order -1 and finishes.
 /// The remaining stages run on the calling thread, which then joins the
 /// stage thread.
 template <typename Queue, typename Transformer,
           typename ... OtherTransformers,
           requires_no_pattern<Transformer>>
 void parallel_execution_native::do_pipeline(
     Queue & input_queue,
     Transformer && transform_op,
     OtherTransformers && ... other_transform_ops) const
 {
   using namespace std;
   using namespace experimental;

   using input_item_type = typename Queue::value_type;
   using input_item_value_type = typename input_item_type::first_type::value_type;
   using transform_result_type =
       decay_t<typename result_of<Transformer(input_item_value_type)>::type>;
   using output_item_value_type = optional<transform_result_type>;
   using output_item_type = pair<output_item_value_type,long>;

   decltype(auto) output_queue =
     get_output_queue<output_item_type>(other_transform_ops...);

   thread stage_thread([&,this]() {
     auto manager = thread_manager();

     while (true) {
       auto incoming{input_queue.pop()};
       if (!incoming.first) { break; }
       auto transformed = output_item_value_type{transform_op(*incoming.first)};
       output_queue.push(make_pair(transformed, incoming.second));
     }
     // Tell the next stage that the stream is over.
     output_queue.push(make_pair(output_item_value_type{},-1));
   });

   do_pipeline(output_queue,
       forward<OtherTransformers>(other_transform_ops)...);
   stage_thread.join();
 }

 /// Farm as last pipeline stage.
 ///
 /// Launches farm_obj.cardinality() tasks on a worker pool. Each task
 /// applies farm_obj to the values popped from input_queue until it pops an
 /// item with an empty optional, which it pushes back so that the other
 /// tasks see it as well. Returns once the pool has finished.
 template <typename Queue, typename FarmTransformer,
           template <typename> class Farm,
           requires_farm<Farm<FarmTransformer>>>
 void parallel_execution_native::do_pipeline(
     Queue & input_queue,
     Farm<FarmTransformer> && farm_obj) const
 {
   using namespace std;
   using input_item_type = typename Queue::value_type;
   using input_item_value_type = typename input_item_type::first_type::value_type;
   using transform_result_type =
       decay_t<typename result_of<FarmTransformer(input_item_value_type)>::type>;
   using output_item_value_type = experimental::optional<transform_result_type>;
   using output_item_type = pair<output_item_value_type,long>;

   auto replica_body = [&](int) {
     auto item{input_queue.pop()};
     for (; item.first; item = input_queue.pop()) {
       farm_obj(*item.first);
     }
     // Put the end-of-stream item back for the remaining replicas.
     input_queue.push(item);
   };

   auto replicas = farm_obj.cardinality();
   worker_pool workers{replicas};
   workers.launch_tasks(*this, replica_body, replicas);
   workers.wait();
 }


 /// Context stage: a transformer run by the execution policy it carries.
 ///
 /// One pool task asks context_op's execution policy to run the transformer
 /// between input_queue and the output queue, then pushes an empty item
 /// with order -1. Meanwhile the remaining stages are executed on the
 /// calling thread, which finally waits for the pool.
 template <typename Queue, typename Execution, typename Transformer,
           template <typename, typename> class Context,
           typename ... OtherTransformers,
           requires_context<Context<Execution,Transformer>>>
 void parallel_execution_native::do_pipeline(Queue & input_queue,
     Context<Execution,Transformer> && context_op,
     OtherTransformers &&... other_ops) const
 {
   using namespace std;
   using namespace experimental;

   using input_item_type = typename Queue::value_type;
   using input_item_value_type = typename input_item_type::first_type::value_type;

   using output_type = typename stage_return_type<input_item_value_type, Transformer>::type;
   using output_optional_type = experimental::optional<output_type>;
   using output_item_type = pair <output_optional_type, long> ;

   decltype(auto) output_queue =
     get_output_queue<output_item_type>(other_ops...);

   auto run_in_context = [&](int) {
     context_op.execution_policy().pipeline(
         input_queue, context_op.transformer(), output_queue);
     // Tell the next stage that the stream is over.
     output_queue.push( make_pair(output_optional_type{}, -1) );
   };

   worker_pool workers{1};
   workers.launch_tasks(*this, run_in_context, 1);

   do_pipeline(output_queue, forward<OtherTransformers>(other_ops)...);

   workers.wait();
 }


 template <typename Queue, typename FarmTransformer,
           template <typename> class Farm,
           typename ... OtherTransformers,
           requires_farm<Farm<FarmTransformer>>>
 void parallel_execution_native::do_pipeline(
     Queue & input_queue,
     Farm<FarmTransformer> && farm_obj,
     OtherTransformers && ... other_transform_ops) const
 {
   using namespace std;
   using namespace experimental;

   using input_item_type = typename Queue::value_type;
   using input_item_value_type = typename input_item_type::first_type::value_type;

   using output_type = typename stage_return_type<input_item_value_type, FarmTransformer>::type;
   using output_optional_type = experimental::optional<output_type>;
   using output_item_type = pair <output_optional_type, long> ;

   decltype(auto) output_queue =
     get_output_queue<output_item_type>(other_transform_ops...);

   atomic<int> done_threads{0};

   auto farm_task = [&](int nt) {
     do_pipeline(input_queue, farm_obj.transformer(), output_queue);
     done_threads++;
     if (done_threads == nt) {
       output_queue.push(make_pair(output_optional_type{}, -1));
     }else{
       input_queue.push(input_item_type{});
     }
   };

   auto ntasks = farm_obj.cardinality();
   worker_pool workers{ntasks};
   workers.launch_tasks(*this, farm_task, ntasks);
   do_pipeline(output_queue,
       forward<OtherTransformers>(other_transform_ops)... );

   workers.wait();
 }

 /**
 \brief Filter stage of a pipeline.

 A filter thread pops items from `input_queue` until it finds one with an
 empty value, and applies `filter_obj` to each value. Accepted items are
 pushed unchanged to an intermediate queue.

 When the execution is ordered, a rejected item is replaced by an empty value
 that keeps the original sequence number, and a second thread consumes the
 intermediate queue in sequence-number order, renumbering the accepted items
 consecutively from 0 before pushing them to the output queue.

 When the execution is not ordered, rejected items are dropped and the
 following stages read the intermediate queue directly.

 In both modes the stream is finished with an empty item whose sequence
 number is -1.

 \param input_queue Queue of (optional value, sequence number) items.
 \param filter_obj Filter pattern object; invoked as a predicate on a value.
 \param other_transform_ops Remaining stages of the pipeline.
 */
 template <typename Queue, typename Predicate,
           template <typename> class Filter,
           typename ... OtherTransformers,
           requires_filter<Filter<Predicate>>>
 void parallel_execution_native::do_pipeline(
     Queue & input_queue,
     Filter<Predicate> && filter_obj,
     OtherTransformers && ... other_transform_ops) const
 {
   using namespace std;
   using namespace experimental;

   using input_item_type = typename Queue::value_type;
   using input_value_type = typename input_item_type::first_type;
   auto filter_queue = make_queue<input_item_type>();

   // Read the ordering mode once so the filter thread and the dispatch below
   // always agree on it.
   const bool ordered = is_ordered();

   auto filter_task = [&,this]() {
     auto manager = thread_manager();
     auto item{input_queue.pop()};
     while (item.first) {
       if (filter_obj(*item.first)) {
         filter_queue.push(item);
       }
       else if (ordered) {
         // The ordering thread needs a placeholder to keep the sequence
         // numbers contiguous. In unordered mode nothing is pushed: the
         // stages of this file stop reading as soon as they pop an item
         // with an empty value, so a placeholder would end the stream early.
         filter_queue.push(make_pair(input_value_type{}, item.second));
       }
       item = input_queue.pop();
     }
     filter_queue.push(make_pair(input_value_type{}, -1));
   };
   thread filter_thread{filter_task};

   decltype(auto) output_queue =
     get_output_queue<input_item_type>(other_transform_ops...);

   if (ordered) {
     auto ordering_task = [&]() {
       auto manager = thread_manager();
       vector<input_item_type> elements; // Items that arrived ahead of time
       long current = 0;                 // Next input sequence number expected
       long order = 0;                   // Next output sequence number

       // Pushes the value (if any) with a fresh output sequence number and
       // advances the expected input sequence number.
       auto emit = [&](const input_item_type & it) {
         if (it.first) {
           output_queue.push(make_pair(it.first,order));
           order++;
         }
         current++;
       };

       // Emits and removes the buffered item carrying the expected sequence
       // number, if there is one.
       auto flush_one = [&]() {
         auto pos = find_if(elements.begin(), elements.end(),
             [&](const input_item_type & e) { return e.second == current; });
         if (pos != elements.end()) {
           auto pending = *pos;
           elements.erase(pos);
           emit(pending);
         }
       };

       auto item{filter_queue.pop()};
       for (;;) {
         if(!item.first && item.second == -1) break;
         if (item.second == current) {
           emit(item);
         }
         else {
           elements.push_back(item);
         }
         flush_one();
         item = filter_queue.pop();
       }
       // Drain whatever is still buffered once the input is exhausted.
       while (!elements.empty()) {
         flush_one();
       }
       // item now holds the end-of-stream marker; pass it on.
       output_queue.push(item);
     };

     thread ordering_thread{ordering_task};
     do_pipeline(output_queue, forward<OtherTransformers>(other_transform_ops)...);
     filter_thread.join();
     ordering_thread.join();
   }
   else {
     do_pipeline(filter_queue, forward<OtherTransformers>(other_transform_ops)...);
     filter_thread.join();
   }
 }

 /**
 \brief Reduce stage of a pipeline.

 A dedicated thread pops items from `input_queue` until it finds one with an
 empty value. Every value is added to `reduce_obj`; whenever `reduce_obj`
 reports that a reduction is needed, the current window is reduced with a
 sequential execution policy and the result is pushed to the output queue
 with a consecutive sequence number starting at 0. The stream is finished
 with an empty item whose sequence number is -1.

 \param input_queue Queue of (optional value, sequence number) items.
 \param reduce_obj Reduce pattern object accumulating the values.
 \param other_transform_ops Remaining stages of the pipeline.
 */
 template <typename Queue, typename Combiner, typename Identity,
           template <typename C, typename I> class Reduce,
           typename ... OtherTransformers,
           requires_reduce<Reduce<Combiner,Identity>>>
 void parallel_execution_native::do_pipeline(
     Queue && input_queue,
     Reduce<Combiner,Identity> && reduce_obj,
     OtherTransformers && ... other_transform_ops) const
 {
   using item_in_type = typename std::decay_t<Queue>::value_type;
   using value_in_type = typename item_in_type::first_type::value_type;
   using optional_result_type =
       std::experimental::optional<std::decay_t<Identity>>;
   using item_out_type = std::pair<optional_result_type,long>;

   decltype(auto) output_queue =
     get_output_queue<item_out_type>(other_transform_ops...);

   auto reducer = [&,this]() {
     auto manager = thread_manager();
     int next_order = 0;
     for (auto item = input_queue.pop(); item.first; ) {
       reduce_obj.add_item(std::forward<Identity>(*item.first));
       // The next item is fetched before the window is checked.
       item = input_queue.pop();
       if (!reduce_obj.reduction_needed()) continue;
       constexpr sequential_execution seq;
       auto window_result = reduce_obj.reduce_window(seq);
       output_queue.push(std::make_pair(window_result, next_order++));
     }
     output_queue.push(std::make_pair(optional_result_type{}, -1));
   };

   std::thread reduce_thread{reducer};
   do_pipeline(output_queue,
       std::forward<OtherTransformers>(other_transform_ops)...);
   reduce_thread.join();
 }

 /**
 \brief Iteration stage of a pipeline whose transformer is not a pattern.

 A dedicated thread pops items from `input_queue` and applies
 `iteration_obj.transform` to each value. If `iteration_obj.predicate` holds
 for the result, the item goes to the output queue; otherwise it is pushed
 back to `input_queue` to be transformed again. After an item with an empty
 value has been popped, the thread keeps processing until `input_queue`
 reports empty, and then pushes an empty item with sequence number -1 to the
 output queue.

 \param input_queue Queue of (optional value, sequence number) items.
 \param iteration_obj Iteration pattern object (transform and predicate).
 \param other_transform_ops Remaining stages of the pipeline.
 */
 template <typename Queue, typename Transformer, typename Predicate,
           template <typename T, typename P> class Iteration,
           typename ... OtherTransformers,
           requires_iteration<Iteration<Transformer,Predicate>>,
           requires_no_pattern<Transformer>>
 void parallel_execution_native::do_pipeline(
     Queue & input_queue,
     Iteration<Transformer,Predicate> && iteration_obj,
     OtherTransformers && ... other_transform_ops) const
 {
   using item_type = typename std::decay_t<Queue>::value_type;
   using value_type = typename item_type::first_type::value_type;

   decltype(auto) output_queue =
     get_output_queue<item_type>(other_transform_ops...);

   auto iteration_task = [&]() {
     // One transformation step: the result either leaves the stage or is
     // queued again, keeping its sequence number.
     auto step = [&](item_type current) {
       auto value = iteration_obj.transform(*current.first);
       auto next = item_type{value,current.second};
       if (iteration_obj.predicate(value)) {
         output_queue.push(next);
       }
       else {
         input_queue.push(next);
       }
     };

     for (auto item = input_queue.pop(); item.first; item = input_queue.pop()) {
       step(item);
     }
     // Items that were pushed back may still be waiting in the input queue.
     while (!input_queue.is_empty()) {
       step(input_queue.pop());
     }
     output_queue.push(item_type{{},-1});
   };

   std::thread iteration_thread{iteration_task};
   do_pipeline(output_queue,
       std::forward<OtherTransformers>(other_transform_ops)...);
   iteration_thread.join();
 }

 /**
 \brief Iteration stage of a pipeline whose transformer is itself a pipeline.

 This combination is not implemented: instantiating this overload produces a
 compile-time error with the message "Not implemented".
 */
 template <typename Queue, typename Transformer, typename Predicate,
           template <typename T, typename P> class Iteration,
           typename ... OtherTransformers,
           requires_iteration<Iteration<Transformer,Predicate>>,
           requires_pipeline<Transformer>>
 void parallel_execution_native::do_pipeline(
     Queue & input_queue,
     Iteration<Transformer,Predicate> && iteration_obj,
     OtherTransformers && ... other_transform_ops) const
 {
   // The overload is only selected through requires_pipeline<Transformer>,
   // so the condition below is false whenever this body is instantiated.
   static_assert(!is_pipeline<Transformer>, "Not implemented");
 }


 /**
 \brief Terminal stage of a pipeline that is itself a pipeline.

 Hands the tuple of stages held by `pipeline_obj` to do_pipeline_nested(),
 together with one index per stage.

 \param input_queue Queue of (optional value, sequence number) items.
 \param pipeline_obj Nested pipeline pattern object.
 */
 template <typename Queue, typename ... Transformers,
           template <typename...> class Pipeline,
           requires_pipeline<Pipeline<Transformers...>>>
 void parallel_execution_native::do_pipeline(
     Queue & input_queue,
     Pipeline<Transformers...> && pipeline_obj) const
 {
   using stage_indices = std::make_index_sequence<sizeof...(Transformers)>;

   do_pipeline_nested(input_queue, pipeline_obj.transformers(), stage_indices{});
 }

 /**
 \brief Nested pipeline stage that is followed by further stages.

 Concatenates the tuple of stages held by `pipeline_obj` with a tuple of
 references to the remaining stages, and hands the result to
 do_pipeline_nested() together with one index per element.

 \param input_queue Queue of (optional value, sequence number) items.
 \param pipeline_obj Nested pipeline pattern object.
 \param other_transform_ops Remaining stages of the outer pipeline.
 */
 template <typename Queue, typename ... Transformers,
           template <typename...> class Pipeline,
           typename ... OtherTransformers,
           requires_pipeline<Pipeline<Transformers...>>>
 void parallel_execution_native::do_pipeline(
     Queue & input_queue,
     Pipeline<Transformers...> && pipeline_obj,
     OtherTransformers && ... other_transform_ops) const
 {
   using stage_indices = std::make_index_sequence<
       sizeof...(Transformers)+sizeof...(OtherTransformers)>;

   do_pipeline_nested(
       input_queue,
       std::tuple_cat(pipeline_obj.transformers(),
           std::forward_as_tuple(other_transform_ops...)),
       stage_indices{});
 }

 /**
 \brief Unpacks a tuple of stages and runs them as a pipeline.

 \param input_queue Queue of (optional value, sequence number) items.
 \param transform_ops Tuple holding the stages to run.
 \param index_sequence Unnamed parameter; its indices `I...` select the tuple
 elements that are expanded into the do_pipeline() call.
 */
 template <typename Queue, typename ... Transformers,
           std::size_t ... I>
 void parallel_execution_native::do_pipeline_nested(
     Queue & input_queue,
     std::tuple<Transformers...> && transform_ops,
     std::index_sequence<I...>) const
 {
   // Each tuple element becomes one argument of do_pipeline(), forwarded
   // with the type it has inside the tuple.
   do_pipeline(input_queue,
       std::forward<Transformers>(std::get<I>(transform_ops))...);
 }

 } // end namespace grppi

 #endif
grppi
Definition: callable_traits.h:26

grppi::parallel_execution_native::set_concurrency_degree
void set_concurrency_degree(int degree) noexcept
Set number of grppi threads.
Definition: parallel_execution_native.h:179

grppi::pipeline
void pipeline(const Execution &ex, Generator &&generate_op, Transformers &&...transform_ops)
Invoke Pipeline pattern on a data stream.
Definition: pipeline.h:51

grppi::worker_pool::launch
void launch(const E &ex, F f, Args &&...args)
Launch a function in the pool.
Definition: worker_pool.h:62

grppi::is_supported< parallel_execution_native >
constexpr bool is_supported< parallel_execution_native >()
Determines if an execution policy is supported in the current compilation.
Definition: parallel_execution_native.h:639

grppi::stencil
void stencil(const Execution &ex, std::tuple< InputIterators... > firsts, std::size_t size, OutputIt out, StencilTransformer &&transform_op, Neighbourhood &&neighbour_op)
Invoke Stencil pattern on a data sequence with sequential execution.
Definition: stencil.h:59

grppi::native_thread_manager::native_thread_manager
native_thread_manager(thread_registry &registry)
Saves a reference to the registry and registers current thread.
Definition: parallel_execution_native.h:120

grppi::requires_reduce
std::enable_if_t< is_reduce< T >, int > requires_reduce
Definition: reduce_pattern.h:135

grppi::supports_map< parallel_execution_native >
constexpr bool supports_map< parallel_execution_native >()
Determines if an execution policy supports the map pattern.
Definition: parallel_execution_native.h:646

grppi::reduce
auto reduce(const Execution &ex, InputIt first, std::size_t size, Result &&identity, Combiner &&combine_op)
Invoke Reduce pattern with identity value on a data sequence with sequential execution.
Definition: reduce.h:55

grppi::worker_pool
Pool of worker threads. This class offers a simple pool of worker threads.
Definition: worker_pool.h:34

grppi::supports_reduce< parallel_execution_native >
constexpr bool supports_reduce< parallel_execution_native >()
Determines if an execution policy supports the reduce pattern.
Definition: parallel_execution_native.h:653

grppi::parallel_execution_native::enable_ordering
void enable_ordering() noexcept
Enable ordering.
Definition: parallel_execution_native.h:189

grppi::parallel_execution_native::thread_manager
native_thread_manager thread_manager() const
Get a manager object for registration/deregistration in the thread index table for current thread...
Definition: parallel_execution_native.h:205

grppi::parallel_execution_native::concurrency_degree
int concurrency_degree() const noexcept
Get number of grppi threads.
Definition: parallel_execution_native.h:184

grppi::parallel_execution_native::get_output_queue
mpmc_queue< T > get_output_queue(Transformers &&...) const
Makes a communication queue for elements of type T if the queue has not been created in an outer patt...
Definition: parallel_execution_native.h:257

grppi::parallel_execution_native::stencil
void stencil(std::tuple< InputIterators... > firsts, OutputIterator first_out, std::size_t sequence_size, StencilTransformer &&transform_op, Neighbourhood &&neighbour_op) const
Applies a stencil to multiple sequences leaving the result in another sequence.
Definition: parallel_execution_native.h:797

grppi::requires_iteration
typename std::enable_if_t< is_iteration< T >, int > requires_iteration
Definition: iteration_pattern.h:88

grppi::supports_divide_conquer< parallel_execution_native >
constexpr bool supports_divide_conquer< parallel_execution_native >()
Determines if an execution policy supports the divide/conquer pattern.
Definition: parallel_execution_native.h:674

grppi::parallel_execution_native::set_queue_attributes
void set_queue_attributes(int size, queue_mode mode) noexcept
Sets the attributes for the queues built through make_queue<T>()
Definition: parallel_execution_native.h:220

grppi::parallel_execution_native::reduce
auto reduce(InputIterator first, std::size_t sequence_size, Identity &&identity, Combiner &&combine_op) const
Applies a reduction to a sequence of data items.
Definition: parallel_execution_native.h:721

std
STL namespace.

grppi::iterators_next
auto iterators_next(T &&t, int n)
Computes next n steps from a tuple of iterators.
Definition: iterator.h:175

grppi::supports_map_reduce< parallel_execution_native >
constexpr bool supports_map_reduce< parallel_execution_native >()
Determines if an execution policy supports the map-reduce pattern.
Definition: parallel_execution_native.h:660

grppi::queue_mode
queue_mode
Definition: mpmc_queue.h:35

grppi::thread_registry::deregister_thread
void deregister_thread() noexcept
Removes current thread id from the registry.
Definition: parallel_execution_native.h:88

grppi::parallel_execution_native
Native parallel execution policy. This policy uses ISO C++ threads as implementation building block a...
Definition: parallel_execution_native.h:140

grppi::thread_registry::thread_registry
thread_registry() noexcept=default

grppi::mpmc_queue
Definition: mpmc_queue.h:38

grppi::worker_pool::launch_tasks
void launch_tasks(const E &ex, F &&f, Args &&...args)
Definition: worker_pool.h:70

grppi::parallel_execution_native::parallel_execution_native
parallel_execution_native() noexcept
Default construct a native parallel execution policy.
Definition: parallel_execution_native.h:153

grppi::queue_mode::blocking

grppi::native_thread_manager::~native_thread_manager
~native_thread_manager()
Deregisters current thread from the registry.
Definition: parallel_execution_native.h:127

grppi::is_parallel_execution_native
constexpr bool is_parallel_execution_native()
Metafunction that determines if type E is parallel_execution_native.
Definition: parallel_execution_native.h:630

grppi::thread_registry::register_thread
void register_thread() noexcept
Adds the current thread id in the registry.
Definition: parallel_execution_native.h:79

grppi::sequential_execution::stencil
constexpr void stencil(std::tuple< InputIterators... > firsts, OutputIterator first_out, std::size_t sequence_size, StencilTransformer &&transform_op, Neighbourhood &&neighbour_op) const
Applies a stencil to multiple sequences leaving the result in another sequence.
Definition: sequential_execution.h:502

grppi::parallel_execution_native::pipeline
void pipeline(mpmc_queue< InputType > &input_queue, Transformer &&transform_op, mpmc_queue< OutputType > &output_queue) const
Invoke Pipeline pattern coming from another context that uses mpmc_queues as communication channels...
Definition: parallel_execution_native.h:405

grppi::requires_no_pattern
std::enable_if_t< is_no_pattern< T >, int > requires_no_pattern
Definition: patterns.h:92

grppi::map_reduce
auto map_reduce(const Execution &ex, std::tuple< InputIterators... > firsts, std::size_t size, Identity &&identity, Transformer &&transform_op, Combiner &&combine_op)
Invoke Map/reduce pattern on a data sequence.
Definition: mapreduce.h:57

grppi::requires_pipeline
typename std::enable_if_t< is_pipeline< T >, int > requires_pipeline
Definition: pipeline_pattern.h:111

grppi::parallel_execution_native::map_reduce
auto map_reduce(std::tuple< InputIterators... > firsts, std::size_t sequence_size, Identity &&identity, Transformer &&transform_op, Combiner &&combine_op) const
Applies a map/reduce operation to a sequence of data items.
Definition: parallel_execution_native.h:758

grppi::supports_stencil< parallel_execution_native >
constexpr bool supports_stencil< parallel_execution_native >()
Determines if an execution policy supports the stencil pattern.
Definition: parallel_execution_native.h:667

grppi::thread_registry::current_index
int current_index() const noexcept
Integer index for current thread.
Definition: parallel_execution_native.h:98

worker_pool.h

grppi::parallel_execution_native::map
void map(std::tuple< InputIterators... > firsts, OutputIterator first_out, std::size_t sequence_size, Transformer transform_op) const
Applies a transformation to multiple sequences leaving the result in another sequence by chunks accor...
Definition: parallel_execution_native.h:685

grppi::stage_return_type::type
return_type type
Definition: patterns.h:103

grppi::requires_filter
typename std::enable_if_t< is_filter< T >, int > requires_filter
Definition: filter_pattern.h:70

grppi::sequential_execution
Sequential execution policy.
Definition: sequential_execution.h:41

grppi::parallel_execution_native::parallel_execution_native
parallel_execution_native(int concurrency_degree, bool ordering=true) noexcept
Constructs a native parallel execution policy.
Definition: parallel_execution_native.h:167

grppi::parallel_execution_native::pipeline
void pipeline(Generator &&generate_op, Transformers &&...transform_ops) const
Invoke Pipeline pattern.
Definition: parallel_execution_native.h:862

grppi::sequential_execution::divide_conquer
auto divide_conquer(Input &&input, Divider &&divide_op, Solver &&solve_op, Combiner &&combine_op) const
Invoke Divide/conquer pattern.
Definition: sequential_execution.h:543

grppi::apply_deref_increment
decltype(auto) apply_deref_increment(F &&f, T< Iterators... > &iterators)
Applies a callable object to the values obtained from the iterators in a tuple-like object...
Definition: iterator.h:63

grppi::result_type
typename std::result_of< Transformer(Input)>::type result_type
Determines the return type of applying a function to an input type.
Definition: patterns.h:110

grppi::thread_registry
Thread index table to provide portable natural thread indices.
Definition: parallel_execution_native.h:53

grppi::parallel_execution_native::disable_ordering
void disable_ordering() noexcept
Disable ordering.
Definition: parallel_execution_native.h:194

grppi::native_thread_manager
RAII class to manage registration/deregistration pairs. This class allows to manage automatic deregis...
Definition: parallel_execution_native.h:115

grppi::parallel_execution_native::divide_conquer
auto divide_conquer(Input &&input, Divider &&divide_op, Solver &&solve_op, Combiner &&combine_op) const
Invoke Divide/conquer pattern.
Definition: parallel_execution_native.h:831

grppi::parallel_execution_native::parallel_execution_native
parallel_execution_native(const parallel_execution_native &ex)
Definition: parallel_execution_native.h:172

grppi::divide_conquer
auto divide_conquer(const Execution &ex, Input &&input, Divider &&divider_op, Solver &&solver_op, Combiner &&combiner_op)
Invoke Divide/conquer pattern. Template parameter Execution: execution type.
Definition: divideconquer.h:53

grppi::parallel_execution_native::get_output_queue
mpmc_queue< T > & get_output_queue(mpmc_queue< T > &queue, Transformers &&...) const
Returns the reference of a communication queue for elements of type T if the queue has been created i...
Definition: parallel_execution_native.h:245

grppi::parallel_execution_native::make_queue
mpmc_queue< T > make_queue() const
Makes a communication queue for elements of type T. Constructs a queue using the attributes that can ...
Definition: parallel_execution_native.h:232

grppi::supports_pipeline< parallel_execution_native >
constexpr bool supports_pipeline< parallel_execution_native >()
Determines if an execution policy supports the pipeline pattern.
Definition: parallel_execution_native.h:681

grppi::parallel_execution_native::get_thread_id
int get_thread_id() const noexcept
Get index of current thread in the thread table.
Definition: parallel_execution_native.h:213

grppi::requires_context
typename std::enable_if_t< is_context< T >, int > requires_context
Definition: common/context.h:95

grppi::parallel_execution_native::is_ordered
bool is_ordered() const noexcept
Is execution ordered.
Definition: parallel_execution_native.h:199

grppi::map
void map(const Execution &ex, std::tuple< InputIterators... > firsts, InputIt last, OutputIt first_out, Transformer transform_op)
Invoke Map pattern on a data sequence.
Definition: map.h:56

grppi::mpmc_queue::push
bool push(T item)
Definition: mpmc_queue.h:128

grppi::requires_farm
typename std::enable_if_t< is_farm< T >, int > requires_farm
Definition: farm_pattern.h:89