#include <tensor_benchmarks.h>
Public Member Functions | |
void | algebraicFunc (int num_iters) |
BenchmarkSuite (const Device &device, size_t m) | |
BenchmarkSuite (const Device &device, size_t m, size_t k) | |
BenchmarkSuite (const Device &device, size_t m, size_t k, size_t n) | |
void | broadcasting (int num_iters) |
void | coeffWiseOp (int num_iters) |
void | colChip (int num_iters) |
void | colReduction (int num_iters) |
void | contraction (int num_iters) |
void | contractionRowMajor (int num_iters) |
void | contractionRowMajorABT (int num_iters) |
void | contractionRowMajorAT (int num_iters) |
void | contractionRowMajorBT (int num_iters) |
void | convolution (int num_iters, int kernel_x, int kernel_y) |
void | fullReduction (int num_iters) |
void | memcpy (int num_iters) |
void | padding (int num_iters) |
void | random (int num_iters) |
void | rowChip (int num_iters) |
void | rowReduction (int num_iters) |
void | shuffling (int num_iters) |
void | slicing (int num_iters) |
void | striding (int num_iters) |
void | transcendentalFunc (int num_iters) |
void | typeCasting (int num_iters) |
~BenchmarkSuite () | |
Private Member Functions | |
template<int Layout> | |
void | contraction (int num_iters, bool trans_a, bool trans_b) |
void | finalizeBenchmark (int64_t num_items) |
void | initialize () |
Private Attributes | |
T * | a_ |
T * | b_ |
T * | c_ |
Device | device_ |
TensorIndex | k_ |
TensorIndex | m_ |
TensorIndex | n_ |
Definition at line 18 of file tensor_benchmarks.h.
|
inline |
Definition at line 20 of file tensor_benchmarks.h.
|
inline |
Definition at line 25 of file tensor_benchmarks.h.
|
inline |
Definition at line 30 of file tensor_benchmarks.h.
|
inline |
Definition at line 35 of file tensor_benchmarks.h.
|
inline |
Definition at line 334 of file tensor_benchmarks.h.
|
inline |
Definition at line 278 of file tensor_benchmarks.h.
|
inline |
Definition at line 312 of file tensor_benchmarks.h.
|
inline |
Definition at line 163 of file tensor_benchmarks.h.
|
inline |
Definition at line 412 of file tensor_benchmarks.h.
|
inline |
Definition at line 472 of file tensor_benchmarks.h.
|
inline private |
Definition at line 526 of file tensor_benchmarks.h.
|
inline |
Definition at line 476 of file tensor_benchmarks.h.
|
inline |
Definition at line 488 of file tensor_benchmarks.h.
|
inline |
Definition at line 480 of file tensor_benchmarks.h.
|
inline |
Definition at line 484 of file tensor_benchmarks.h.
|
inline |
Definition at line 492 of file tensor_benchmarks.h.
|
inline private |
Definition at line 573 of file tensor_benchmarks.h.
|
inline |
Definition at line 446 of file tensor_benchmarks.h.
|
inline private |
Definition at line 560 of file tensor_benchmarks.h.
|
inline |
Definition at line 41 of file tensor_benchmarks.h.
|
inline |
Definition at line 211 of file tensor_benchmarks.h.
|
inline |
Definition at line 81 of file tensor_benchmarks.h.
|
inline |
Definition at line 142 of file tensor_benchmarks.h.
|
inline |
Definition at line 380 of file tensor_benchmarks.h.
|
inline |
Definition at line 184 of file tensor_benchmarks.h.
|
inline |
Definition at line 100 of file tensor_benchmarks.h.
|
inline |
Definition at line 243 of file tensor_benchmarks.h.
|
inline |
Definition at line 357 of file tensor_benchmarks.h.
|
inline |
Definition at line 56 of file tensor_benchmarks.h.
|
private |
Definition at line 592 of file tensor_benchmarks.h.
|
private |
Definition at line 593 of file tensor_benchmarks.h.
|
private |
Definition at line 594 of file tensor_benchmarks.h.
|
private |
Definition at line 595 of file tensor_benchmarks.h.
|
private |
Definition at line 590 of file tensor_benchmarks.h.
|
private |
Definition at line 589 of file tensor_benchmarks.h.
|
private |
Definition at line 591 of file tensor_benchmarks.h.