scan.h 6.81 KB
Newer Older
1
/*
Marcus Winter committed
2
 * Copyright (c) 2014-2016, Siemens AG. All rights reserved.
3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright notice,
 * this list of conditions and the following disclaimer.
 *
 * 2. Redistributions in binary form must reproduce the above copyright notice,
 * this list of conditions and the following disclaimer in the documentation
 * and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

#ifndef EMBB_ALGORITHMS_SCAN_H_
#define EMBB_ALGORITHMS_SCAN_H_

30
#include <embb/mtapi/execution_policy.h>
31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68
#include <embb/algorithms/identity.h>

namespace embb {
namespace algorithms {

/**
 * \defgroup CPP_ALGORITHMS_SCAN Scan
 * Parallel scan computation
 * \ingroup CPP_ALGORITHMS
 *
 * \{
 */

#ifdef DOXYGEN

/**
 * Performs a parallel scan (or prefix) computation on a range of elements.
 *
 * The algorithm reads an input range and writes its result to a separate output
 * range. The input range consists of the elements from \c first to \c last,
 * excluding the last element. The output range consists of the elements from
 * \c output_first to <tt>output_first + std::difference(last - first)</tt>.
 *
 * The algorithm performs two runs on the given range. Hence, a performance
 * speedup can only be expected on processors with more than two cores.
 *
 * \throws embb::base::ErrorException if not enough MTAPI tasks can be created
 *         to satisfy the requirements of the algorithm.
 * \threadsafe if the elements in the range are not modified by another thread
 *             while the algorithm is executed.
 * \note No guarantee is given on the order in which the functions \c scan
 *       and \c transformation are applied to the elements.\n
 *       For all \c x of type \c ReturnType it must hold that
 *       <tt>reduction(x, neutral) == x</tt>. \n
 *       The reduction operation need not be commutative but must be
 *       associative, i.e., <tt>reduction(x, reduction(y, z)) ==
 *       reduction(reduction(x, y), z))</tt> for all \c x, \c y, \c z of type
 *       \c ReturnType.
69
 * \see embb::mtapi::ExecutionPolicy, Identity, ZipIterator
70 71 72 73
 * \tparam RAIIn Random access iterator type of input range
 * \tparam RAIOut Random access iterator type of output range
 * \tparam ReturnType Type of output elements of scan operation, deduced from
 *         \c neutral
74
 * \tparam ScanFunction Binary scan function object with signature
75
 *         <tt>ReturnType ScanFunction(ReturnType, ReturnType)</tt>
76 77
 * \tparam TransformationFunction Unary transformation function object with
 *         signature <tt>ReturnType TransformationFunction(typename
78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98
 *         std::iterator_traits<RAIIn>::value_type)</tt>.
 */
template<typename RAIIn, typename RAIOut, typename ReturnType,
         typename ScanFunction, typename TransformationFunction>
void Scan(
  RAIIn first,
  /**< [IN] Random access iterator pointing to the first element of the input
            range */
  RAIIn last,
  /**< [IN] Random access iterator pointing to the last plus one element of the
            input range */
  RAIOut output_first,
  /**< [IN] Random access iterator pointing to the first element of the output
            range */
  ReturnType neutral,
  /**< [IN] Neutral element of the \c scan operation. */
  ScanFunction scan,
  /**< [IN] Scan operation to be applied to the elements of the input range */
  TransformationFunction transformation = Identity(),
  /**< [IN] Transforms the elements of the input range before the scan operation
            is applied */
99
  const embb::mtapi::ExecutionPolicy& policy = embb::mtapi::ExecutionPolicy(),
100
  /**< [IN] embb::mtapi::ExecutionPolicy for the scan computation */
101 102 103 104 105 106 107 108 109 110 111 112
  size_t block_size = 0
  /**< [IN] Lower bound for partitioning the range of elements into blocks that
            are treated in parallel. Partitioning of a block stops if its size
            is less than or equal to \c block_size. The default value 0 means
            that the minimum block size is determined automatically depending on
            the number of elements in the range divided by the number of
            available cores. */
  );

#else // DOXYGEN

/**
113
 * Overload of above described Doxygen dummy.
114 115
 */
template<typename RAIIn, typename RAIOut, typename ReturnType,
116
         typename ScanFunction, typename TransformationFunction>
117 118 119 120 121
void Scan(
  RAIIn first,
  RAIIn last,
  RAIOut output_iterator,
  ReturnType neutral,
122 123
  ScanFunction scan,
  TransformationFunction transformation,
124
  const embb::mtapi::ExecutionPolicy& policy,
125 126
  size_t block_size
  );
127 128 129 130 131

/**
 * Overload of above described Doxygen dummy with less arguments.
 */
template<typename RAIIn, typename RAIOut, typename ReturnType,
132
         typename ScanFunction>
133 134 135 136 137
void Scan(
  RAIIn first,
  RAIIn last,
  RAIOut output_iterator,
  ReturnType neutral,
138
  ScanFunction scan
139
  ) {
140
  Scan(first, last, output_iterator, neutral, scan, Identity(),
141
    embb::mtapi::ExecutionPolicy(), 0);
142 143 144 145 146 147 148 149 150 151 152 153 154
}

/**
 * Overload of above described Doxygen dummy with less arguments.
 */
template<typename RAIIn, typename RAIOut, typename ReturnType,
         typename ScanFunction, typename TransformationFunction>
void Scan(
  RAIIn first,
  RAIIn last,
  RAIOut output_iterator,
  ReturnType neutral,
  ScanFunction scan,
155
  TransformationFunction transformation
156
  ) {
157
  Scan(first, last, output_iterator, neutral, scan, transformation,
158
    embb::mtapi::ExecutionPolicy(), 0);
159 160 161
}

/**
162
 * Overload of above described Doxygen dummy with less arguments.
163 164 165 166 167 168 169 170 171 172
 */
template<typename RAIIn, typename RAIOut, typename ReturnType,
         typename ScanFunction, typename TransformationFunction>
void Scan(
  RAIIn first,
  RAIIn last,
  RAIOut output_iterator,
  ReturnType neutral,
  ScanFunction scan,
  TransformationFunction transformation,
173
  const embb::mtapi::ExecutionPolicy& policy
174 175 176
  ) {
  Scan(first, last, output_iterator, neutral, scan, transformation, policy, 0);
}
177 178 179 180 181 182 183 184 185 186 187 188 189

#endif // else DOXYGEN

/**
 * \}
 */

}  // namespace algorithms
}  // namespace embb

#include <embb/algorithms/internal/scan-inl.h>

#endif  // EMBB_ALGORITHMS_SCAN_H_