// scan_perf.h
/*
 * Copyright (c) 2014, Siemens AG. All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright notice,
 * this list of conditions and the following disclaimer.
 *
 * 2. Redistributions in binary form must reproduce the above copyright notice,
 * this list of conditions and the following disclaimer in the documentation
 * and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

#ifndef EMBB_ALGORITHMS_PERF_SCAN_PERF_H_
#define EMBB_ALGORITHMS_PERF_SCAN_PERF_H_

#include <embb/base/perf/call_args.h>
#include <vector>

namespace embb {
namespace algorithms {
namespace perf {


/**
 * Binary scan operator with a configurable amount of artificial work.
 *
 * Each invocation returns \c lhs with \c rhs added to it \c load_factor
 * times. The operator also keeps a pointer to the input array passed to the
 * constructor; that pointer is stored and copied, but operator() as written
 * here never dereferences it.
 *
 * \tparam T  Element type; must support copy construction and \c operator+=.
 */
template<typename T>
class RamStressScanOp {
  /// Number of additions performed per call, taken from args.LoadFactor().
  size_t load_factor;
  /// Input array given to the constructor. The pointee is const; the pointer
  /// itself is deliberately non-const so that operator= can rebind it.
  const T * in;

 public:
  /**
   * \param args      Call arguments; only LoadFactor() is read.
   * \param inVector  Input array; the pointer is stored, the data is not
   *                  copied.
   */
  explicit RamStressScanOp(const CallArgs & args, const T inVector[]) :
    load_factor(args.LoadFactor()), in(inVector) { }

  /// Copies the load factor and the input pointer (shallow copy).
  RamStressScanOp(const RamStressScanOp & other)
    : load_factor(other.load_factor), in(other.in) { }

  /// Assigns the load factor and the input pointer; self-assignment is a
  /// no-op.
  RamStressScanOp & operator=(const RamStressScanOp & other) {
    if (this != &other) {
      load_factor = other.load_factor;
      in = other.in;
    }
    return *this;
  }

  /**
   * \param lhs  Running value.
   * \param rhs  Value added to the running value on every loop iteration.
   * \return     \c lhs after \c rhs has been added \c load_factor times.
   *
   * NOTE(review): the original comment states that rhs is an index and that
   * the first iteration in a range sees lhs = 0 (the neutral element). That
   * depends on how the caller drives the scan -- confirm against the caller.
   */
  T operator()(const T & lhs, const T & rhs) {
    T value = lhs;
    // Artificial complexity: repeat the addition instead of multiplying.
    // The counter has the same type as load_factor so the comparison cannot
    // wrap around before the bound is reached.
    for (size_t k = 0; k < load_factor; ++k) {
      value += rhs;
    }
    return value;
  }
};

/**
 * Binary scan operator with a configurable amount of artificial work that
 * does not read its right-hand operand.
 *
 * Each invocation returns \c lhs with \c static_cast<T>(1) added to it
 * \c load_factor times.
 *
 * \tparam T  Element type; must support copy construction, \c operator+= and
 *            conversion from the integer literal 1.
 */
template<typename T>
class CpuStressScanOp {
  /// Number of additions performed per call, taken from args.LoadFactor().
  size_t load_factor;

 public:
  /// \param args  Call arguments; only LoadFactor() is read.
  explicit CpuStressScanOp(const CallArgs & args) :
    load_factor(args.LoadFactor()) { }

  /**
   * \param lhs  Running value.
   * \return     \c lhs after 1 has been added \c load_factor times.
   *
   * The second operand is ignored. Per the original comment, the constant 1
   * corresponds to the input value used in the RAM stress operation.
   */
  T operator()(const T & lhs, const T &) {
    T value = lhs;
    // Artificial complexity: repeat the addition instead of adding
    // load_factor once. The counter has the same type as load_factor so the
    // comparison cannot wrap around before the bound is reached.
    for (size_t k = 0; k < load_factor; ++k) {
      value += static_cast<T>(1);
    }
    return value;
  }
};

/**
 * Declaration of the serial scan performance test case.
 *
 * Exposes the Pre() / Run() / Post() sequence; Pre() and Post() are empty
 * here. The constructor, destructor and Run() are only declared in this
 * header; their definitions are expected in scan_perf-inl.h, which is
 * included at the end of this file.
 *
 * \tparam T  Element type of the buffers and of the stored result.
 */
template<typename T>
class SerialScan {
public:
  /// \param args  Call arguments for this test case.
  explicit SerialScan(const embb::base::perf::CallArgs & args);
  ~SerialScan();
  /// No preparation step for the serial variant.
  void Pre() { }
  /// Executes the measured operation (defined out of line).
  void Run();
  /// No cleanup step for the serial variant.
  void Post() { }

private:
  /// Reference to the call arguments; the referenced object must outlive
  /// this instance.
  const embb::base::perf::CallArgs & cargs;
  /// NOTE(review): presumably the number of elements in in/out -- confirm
  /// against scan_perf-inl.h.
  const size_t vector_size;
  /// NOTE(review): presumably derived from the call arguments; note that the
  /// scan operators in this header store their load factor as size_t.
  unsigned int load_factor;
  /// NOTE(review): presumably the input buffer; ownership is not visible
  /// from this header.
  T * in;
  /// NOTE(review): presumably the output buffer; ownership is not visible
  /// from this header.
  T * out;
  /// Value of type T kept by the test case; how it is produced is defined
  /// out of line.
  T result;
  /* Copy constructor and copy assignment are declared private to prohibit
     copying and assignment from outside the class. */
  SerialScan(const SerialScan & other);
  SerialScan & operator=(const SerialScan & other);
};

/**
 * Declaration of the parallel scan performance test case.
 *
 * Exposes the Pre() / Run() / Post() sequence; Post() is empty here. The
 * constructor, destructor, Pre() and Run() are only declared in this header;
 * their definitions are expected in scan_perf-inl.h, which is included at
 * the end of this file.
 *
 * \tparam T  Element type of the buffers and of the stored result.
 */
template<typename T>
class ParallelScan {
public:
  /// \param args  Call arguments for this test case.
  explicit ParallelScan(const embb::base::perf::CallArgs & args);
  ~ParallelScan();
  /// Preparation step executed before Run() (defined out of line).
  void Pre();
  /// Executes the measured operation (defined out of line).
  /// \param numThreads  Thread count passed in by the caller.
  void Run(unsigned int numThreads);
  /// No cleanup step for the parallel variant.
  void Post() { }

private:
  /// Reference to the call arguments; the referenced object must outlive
  /// this instance.
  const embb::base::perf::CallArgs & cargs;
  /// NOTE(review): presumably the number of elements in in/out -- confirm
  /// against scan_perf-inl.h.
  const size_t vector_size;
  /// NOTE(review): presumably the input buffer; ownership is not visible
  /// from this header.
  T * in;
  /// NOTE(review): presumably the output buffer; ownership is not visible
  /// from this header.
  T * out;
  /// Value of type T kept by the test case; how it is produced is defined
  /// out of line.
  T result;
  /* Copy constructor and copy assignment are declared private to prohibit
     copying and assignment from outside the class. */
  ParallelScan(const ParallelScan & other);
  ParallelScan & operator=(const ParallelScan & other);
};


} // namespace perf
} // namespace algorithms
} // namespace embb

#include <scan_perf-inl.h>

#endif /* EMBB_ALGORITHMS_PERF_SCAN_PERF_H_ */