|
|
#include <tensor_benchmarks.h>
Public Member Functions | |
| BenchmarkSuite (const Device &device, size_t m, size_t k, size_t n) | |
| BenchmarkSuite (const Device &device, size_t m) | |
| BenchmarkSuite (const Device &device, size_t m, size_t k) | |
| ~BenchmarkSuite () | |
| void | memcpy (int num_iters) |
| void | typeCasting (int num_iters) |
| void | random (int num_iters) |
| void | slicing (int num_iters) |
| void | rowChip (int num_iters) |
| void | colChip (int num_iters) |
| void | shuffling (int num_iters) |
| void | padding (int num_iters) |
| void | striding (int num_iters) |
| void | broadcasting (int num_iters) |
| void | coeffWiseOp (int num_iters) |
| void | algebraicFunc (int num_iters) |
| void | transcendentalFunc (int num_iters) |
| void | rowReduction (int num_iters) |
| void | colReduction (int num_iters) |
| void | fullReduction (int num_iters) |
| void | contraction (int num_iters) |
| void | contractionRowMajor (int num_iters) |
| void | contractionRowMajorAT (int num_iters) |
| void | contractionRowMajorBT (int num_iters) |
| void | contractionRowMajorABT (int num_iters) |
| void | convolution (int num_iters, int kernel_x, int kernel_y) |
Private Member Functions | |
| template<int Layout> | |
| void | contraction (int num_iters, bool trans_a, bool trans_b) |
| void | initialize () |
| void | finalizeBenchmark (int64_t num_items) |
Private Attributes | |
| TensorIndex | m_ |
| TensorIndex | k_ |
| TensorIndex | n_ |
| T * | a_ |
| T * | b_ |
| T * | c_ |
| Device | device_ |
|
inline |
References BenchmarkSuite< Device, T >::initialize().
|
inline |
References BenchmarkSuite< Device, T >::initialize().
|
inline |
References BenchmarkSuite< Device, T >::initialize().
|
inline |
|
inline |
References BenchmarkSuite< Device, T >::a_, Eigen::Aligned, BenchmarkSuite< Device, T >::b_, BenchmarkSuite< Device, T >::c_, BenchmarkSuite< Device, T >::device_, eigen_assert, BenchmarkSuite< Device, T >::finalizeBenchmark(), BenchmarkSuite< Device, T >::k_, BenchmarkSuite< Device, T >::m_, BenchmarkSuite< Device, T >::n_, sizes, and StartBenchmarkTiming().
|
inline |
References BenchmarkSuite< Device, T >::a_, Eigen::Aligned, BenchmarkSuite< Device, T >::c_, BenchmarkSuite< Device, T >::device_, BenchmarkSuite< Device, T >::finalizeBenchmark(), BenchmarkSuite< Device, T >::m_, BenchmarkSuite< Device, T >::n_, Eigen::IndexList< FirstType, OtherTypes >::set(), and StartBenchmarkTiming().
|
inline |
References BenchmarkSuite< Device, T >::a_, Eigen::Aligned, BenchmarkSuite< Device, T >::b_, BenchmarkSuite< Device, T >::c_, BenchmarkSuite< Device, T >::device_, eigen_assert, BenchmarkSuite< Device, T >::finalizeBenchmark(), BenchmarkSuite< Device, T >::k_, BenchmarkSuite< Device, T >::m_, BenchmarkSuite< Device, T >::n_, sizes, and StartBenchmarkTiming().
|
inline |
|
inline |
|
inline |
References Eigen::ColMajor.
|
inline private |
References BenchmarkSuite< Device, T >::a_, Eigen::Aligned, BenchmarkSuite< Device, T >::b_, BenchmarkSuite< Device, T >::c_, BenchmarkSuite< Device, T >::device_, BenchmarkSuite< Device, T >::finalizeBenchmark(), BenchmarkSuite< Device, T >::k_, BenchmarkSuite< Device, T >::m_, BenchmarkSuite< Device, T >::n_, and StartBenchmarkTiming().
|
inline |
References Eigen::RowMajor.
|
inline |
References Eigen::RowMajor.
|
inline |
References Eigen::RowMajor.
|
inline |
References Eigen::RowMajor.
|
inline |
References BenchmarkSuite< Device, T >::a_, Eigen::Aligned, BenchmarkSuite< Device, T >::b_, BenchmarkSuite< Device, T >::c_, BenchmarkSuite< Device, T >::device_, BenchmarkSuite< Device, T >::finalizeBenchmark(), BenchmarkSuite< Device, T >::m_, BenchmarkSuite< Device, T >::n_, and StartBenchmarkTiming().
|
inline private |
References BenchmarkSuite< Device, T >::device_, SetBenchmarkFlopsProcessed(), and StopBenchmarkTiming().
Referenced by BenchmarkSuite< Device, T >::algebraicFunc(), BenchmarkSuite< Device, T >::broadcasting(), BenchmarkSuite< Device, T >::coeffWiseOp(), BenchmarkSuite< Device, T >::colChip(), BenchmarkSuite< Device, T >::colReduction(), BenchmarkSuite< Device, T >::contraction(), BenchmarkSuite< Device, T >::convolution(), BenchmarkSuite< Device, T >::fullReduction(), BenchmarkSuite< Device, T >::memcpy(), BenchmarkSuite< Device, T >::padding(), BenchmarkSuite< Device, T >::random(), BenchmarkSuite< Device, T >::rowChip(), BenchmarkSuite< Device, T >::rowReduction(), BenchmarkSuite< Device, T >::shuffling(), BenchmarkSuite< Device, T >::slicing(), BenchmarkSuite< Device, T >::striding(), BenchmarkSuite< Device, T >::transcendentalFunc(), and BenchmarkSuite< Device, T >::typeCasting().
|
inline |
|
inline private |
References BenchmarkSuite< Device, T >::a_, BenchmarkSuite< Device, T >::b_, BenchmarkSuite< Device, T >::c_, BenchmarkSuite< Device, T >::device_, BenchmarkSuite< Device, T >::k_, BenchmarkSuite< Device, T >::m_, and BenchmarkSuite< Device, T >::n_.
Referenced by BenchmarkSuite< Device, T >::BenchmarkSuite().
|
inline |
References BenchmarkSuite< Device, T >::a_, BenchmarkSuite< Device, T >::c_, BenchmarkSuite< Device, T >::device_, eigen_assert, BenchmarkSuite< Device, T >::finalizeBenchmark(), BenchmarkSuite< Device, T >::k_, BenchmarkSuite< Device, T >::m_, BenchmarkSuite< Device, T >::n_, and StartBenchmarkTiming().
|
inline |
References BenchmarkSuite< Device, T >::a_, Eigen::Aligned, BenchmarkSuite< Device, T >::b_, BenchmarkSuite< Device, T >::device_, eigen_assert, BenchmarkSuite< Device, T >::finalizeBenchmark(), BenchmarkSuite< Device, T >::k_, BenchmarkSuite< Device, T >::m_, and StartBenchmarkTiming().
|
inline |
|
inline |
|
inline |
|
inline |
References BenchmarkSuite< Device, T >::a_, Eigen::Aligned, BenchmarkSuite< Device, T >::b_, BenchmarkSuite< Device, T >::device_, eigen_assert, BenchmarkSuite< Device, T >::finalizeBenchmark(), BenchmarkSuite< Device, T >::k_, BenchmarkSuite< Device, T >::m_, BenchmarkSuite< Device, T >::n_, Eigen::internal::shuffle(), and StartBenchmarkTiming().
|
inline |
References BenchmarkSuite< Device, T >::a_, Eigen::Aligned, BenchmarkSuite< Device, T >::b_, BenchmarkSuite< Device, T >::c_, BenchmarkSuite< Device, T >::device_, eigen_assert, BenchmarkSuite< Device, T >::finalizeBenchmark(), BenchmarkSuite< Device, T >::k_, BenchmarkSuite< Device, T >::m_, BenchmarkSuite< Device, T >::n_, sizes, and StartBenchmarkTiming().
|
inline |
References BenchmarkSuite< Device, T >::a_, Eigen::Aligned, BenchmarkSuite< Device, T >::b_, BenchmarkSuite< Device, T >::device_, eigen_assert, BenchmarkSuite< Device, T >::finalizeBenchmark(), BenchmarkSuite< Device, T >::k_, BenchmarkSuite< Device, T >::m_, StartBenchmarkTiming(), and Eigen::internal::strides().
|
inline |
References BenchmarkSuite< Device, T >::a_, Eigen::Aligned, BenchmarkSuite< Device, T >::b_, BenchmarkSuite< Device, T >::c_, BenchmarkSuite< Device, T >::device_, eigen_assert, BenchmarkSuite< Device, T >::finalizeBenchmark(), BenchmarkSuite< Device, T >::k_, BenchmarkSuite< Device, T >::m_, BenchmarkSuite< Device, T >::n_, sizes, and StartBenchmarkTiming().
|
inline |
References BenchmarkSuite< Device, T >::a_, Eigen::Aligned, BenchmarkSuite< Device, T >::b_, BenchmarkSuite< Device, T >::device_, eigen_assert, BenchmarkSuite< Device, T >::finalizeBenchmark(), BenchmarkSuite< Device, T >::k_, BenchmarkSuite< Device, T >::m_, BenchmarkSuite< Device, T >::n_, sizes, and StartBenchmarkTiming().
|
private |
Referenced by BenchmarkSuite< Device, T >::algebraicFunc(), BenchmarkSuite< Device, T >::broadcasting(), BenchmarkSuite< Device, T >::coeffWiseOp(), BenchmarkSuite< Device, T >::colReduction(), BenchmarkSuite< Device, T >::contraction(), BenchmarkSuite< Device, T >::convolution(), BenchmarkSuite< Device, T >::initialize(), BenchmarkSuite< Device, T >::memcpy(), BenchmarkSuite< Device, T >::padding(), BenchmarkSuite< Device, T >::shuffling(), BenchmarkSuite< Device, T >::slicing(), BenchmarkSuite< Device, T >::striding(), BenchmarkSuite< Device, T >::transcendentalFunc(), BenchmarkSuite< Device, T >::typeCasting(), and BenchmarkSuite< Device, T >::~BenchmarkSuite().
|
private |
Referenced by BenchmarkSuite< Device, T >::algebraicFunc(), BenchmarkSuite< Device, T >::coeffWiseOp(), BenchmarkSuite< Device, T >::colChip(), BenchmarkSuite< Device, T >::colReduction(), BenchmarkSuite< Device, T >::contraction(), BenchmarkSuite< Device, T >::convolution(), BenchmarkSuite< Device, T >::fullReduction(), BenchmarkSuite< Device, T >::initialize(), BenchmarkSuite< Device, T >::padding(), BenchmarkSuite< Device, T >::rowChip(), BenchmarkSuite< Device, T >::rowReduction(), BenchmarkSuite< Device, T >::shuffling(), BenchmarkSuite< Device, T >::slicing(), BenchmarkSuite< Device, T >::striding(), BenchmarkSuite< Device, T >::transcendentalFunc(), BenchmarkSuite< Device, T >::typeCasting(), and BenchmarkSuite< Device, T >::~BenchmarkSuite().
|
private |
Referenced by BenchmarkSuite< Device, T >::algebraicFunc(), BenchmarkSuite< Device, T >::broadcasting(), BenchmarkSuite< Device, T >::coeffWiseOp(), BenchmarkSuite< Device, T >::colChip(), BenchmarkSuite< Device, T >::contraction(), BenchmarkSuite< Device, T >::convolution(), BenchmarkSuite< Device, T >::fullReduction(), BenchmarkSuite< Device, T >::initialize(), BenchmarkSuite< Device, T >::memcpy(), BenchmarkSuite< Device, T >::random(), BenchmarkSuite< Device, T >::rowChip(), BenchmarkSuite< Device, T >::rowReduction(), BenchmarkSuite< Device, T >::slicing(), BenchmarkSuite< Device, T >::transcendentalFunc(), and BenchmarkSuite< Device, T >::~BenchmarkSuite().
|
private |
Referenced by BenchmarkSuite< Device, T >::algebraicFunc(), BenchmarkSuite< Device, T >::broadcasting(), BenchmarkSuite< Device, T >::coeffWiseOp(), BenchmarkSuite< Device, T >::colChip(), BenchmarkSuite< Device, T >::colReduction(), BenchmarkSuite< Device, T >::contraction(), BenchmarkSuite< Device, T >::convolution(), BenchmarkSuite< Device, T >::finalizeBenchmark(), BenchmarkSuite< Device, T >::fullReduction(), BenchmarkSuite< Device, T >::initialize(), BenchmarkSuite< Device, T >::memcpy(), BenchmarkSuite< Device, T >::padding(), BenchmarkSuite< Device, T >::random(), BenchmarkSuite< Device, T >::rowChip(), BenchmarkSuite< Device, T >::rowReduction(), BenchmarkSuite< Device, T >::shuffling(), BenchmarkSuite< Device, T >::slicing(), BenchmarkSuite< Device, T >::striding(), BenchmarkSuite< Device, T >::transcendentalFunc(), BenchmarkSuite< Device, T >::typeCasting(), and BenchmarkSuite< Device, T >::~BenchmarkSuite().
|
private |
Referenced by BenchmarkSuite< Device, T >::algebraicFunc(), BenchmarkSuite< Device, T >::coeffWiseOp(), BenchmarkSuite< Device, T >::colChip(), BenchmarkSuite< Device, T >::colReduction(), BenchmarkSuite< Device, T >::contraction(), BenchmarkSuite< Device, T >::fullReduction(), BenchmarkSuite< Device, T >::initialize(), BenchmarkSuite< Device, T >::memcpy(), BenchmarkSuite< Device, T >::padding(), BenchmarkSuite< Device, T >::random(), BenchmarkSuite< Device, T >::rowChip(), BenchmarkSuite< Device, T >::rowReduction(), BenchmarkSuite< Device, T >::shuffling(), BenchmarkSuite< Device, T >::slicing(), BenchmarkSuite< Device, T >::striding(), BenchmarkSuite< Device, T >::transcendentalFunc(), and BenchmarkSuite< Device, T >::typeCasting().
|
private |
Referenced by BenchmarkSuite< Device, T >::algebraicFunc(), BenchmarkSuite< Device, T >::broadcasting(), BenchmarkSuite< Device, T >::coeffWiseOp(), BenchmarkSuite< Device, T >::contraction(), BenchmarkSuite< Device, T >::convolution(), BenchmarkSuite< Device, T >::initialize(), BenchmarkSuite< Device, T >::memcpy(), BenchmarkSuite< Device, T >::padding(), BenchmarkSuite< Device, T >::random(), BenchmarkSuite< Device, T >::shuffling(), BenchmarkSuite< Device, T >::slicing(), BenchmarkSuite< Device, T >::striding(), BenchmarkSuite< Device, T >::transcendentalFunc(), and BenchmarkSuite< Device, T >::typeCasting().
|
private |
Referenced by BenchmarkSuite< Device, T >::algebraicFunc(), BenchmarkSuite< Device, T >::broadcasting(), BenchmarkSuite< Device, T >::coeffWiseOp(), BenchmarkSuite< Device, T >::colChip(), BenchmarkSuite< Device, T >::colReduction(), BenchmarkSuite< Device, T >::contraction(), BenchmarkSuite< Device, T >::convolution(), BenchmarkSuite< Device, T >::fullReduction(), BenchmarkSuite< Device, T >::initialize(), BenchmarkSuite< Device, T >::memcpy(), BenchmarkSuite< Device, T >::random(), BenchmarkSuite< Device, T >::rowChip(), BenchmarkSuite< Device, T >::rowReduction(), BenchmarkSuite< Device, T >::shuffling(), BenchmarkSuite< Device, T >::slicing(), BenchmarkSuite< Device, T >::transcendentalFunc(), and BenchmarkSuite< Device, T >::typeCasting().