36 #if defined(TIMEMORY_USE_PAPI)
41 std::pair<std::vector<long long>, double>)
43 std::pair<std::vector<long long>, double>)
45 std::pair<std::vector<long long>, double>)
46 extern template struct tim::component::cpu_roofline<float>;
47 extern template struct tim::component::cpu_roofline<double>;
48 extern template struct tim::component::cpu_roofline<float, double>;
51 #if defined(TIMEMORY_USE_CUPTI)
55 # if defined(TIMEMORY_USE_CUDA_HALF)
58 std::tuple<typename ::tim::component::cupti_activity::value_type,
59 typename ::tim::component::cupti_counters::value_type>)
63 std::tuple<typename ::tim::component::cupti_activity::value_type,
64 typename ::tim::component::cupti_counters::value_type>)
68 typename ::tim::component::cupti_counters::value_type>)
72 typename ::tim::component::cupti_counters::value_type>)
75 #if defined(TIMEMORY_USE_CUPTI)
78 # if defined(TIMEMORY_USE_CUDA_HALF)
Include the extern declarations for cupti components.
#define TIMEMORY_DECLARE_EXTERN_COMPONENT(NAME, HAS_DATA,...)
Include the extern declarations for papi components.
Implementation of the roofline component(s)
gpu_roofline< float, double > gpu_roofline_flops
gpu_roofline< cuda::fp16_t > gpu_roofline_hp_flops
A specialization of tim::component::gpu_roofline for 16-bit floating point operations (depending on a...
gpu_roofline< double > gpu_roofline_dp_flops
A specialization of tim::component::gpu_roofline for 64-bit floating point operations.
gpu_roofline< float > gpu_roofline_sp_flops
A specialization of tim::component::gpu_roofline for 32-bit floating point operations.
cpu_roofline< double > cpu_roofline_dp_flops
A specialization of tim::component::cpu_roofline for 64-bit floating point operations.
cpu_roofline< float > cpu_roofline_sp_flops
A specialization of tim::component::cpu_roofline for 32-bit floating point operations.
cpu_roofline< float, double > cpu_roofline_flops
Combines hardware counters and timers and executes the empirical roofline toolkit during application ...
typename typename typename