MueLu Version of the Day
|
#include <MueLu_PerfModels_decl.hpp>
Public Member Functions | |
PerfModels () | |
void | stream_vector_make_table (int KERNEL_REPEATS, int LOG_MAX_SIZE=20) |
double | stream_vector_copy_lookup (int SIZE_IN_BYTES) |
double | stream_vector_add_lookup (int SIZE_IN_BYTES) |
double | latency_corrected_stream_vector_copy_lookup (int SIZE_IN_BYTES) |
double | latency_corrected_stream_vector_add_lookup (int SIZE_IN_BYTES) |
double | stream_vector_lookup (int SIZE_IN_BYTES) |
double | latency_corrected_stream_vector_lookup (int SIZE_IN_BYTES) |
void | print_stream_vector_table (std::ostream &out) |
void | print_latency_corrected_stream_vector_table (std::ostream &out) |
void | pingpong_make_table (int KERNEL_REPEATS, int LOG_MAX_SIZE, const RCP< const Teuchos::Comm< int > > &comm) |
double | pingpong_host_lookup (int SIZE_IN_BYTES) |
double | pingpong_device_lookup (int SIZE_IN_BYTES) |
void | print_pingpong_table (std::ostream &out) |
void | launch_latency_make_table (int KERNEL_REPEATS) |
double | launch_latency_lookup () |
void | print_launch_latency_table (std::ostream &out) |
Private Member Functions | |
void | print_stream_vector_table_impl (std::ostream &out, bool use_latency_correction) |
Private Attributes | |
std::vector< int > | stream_sizes_ |
std::vector< double > | stream_copy_times_ |
std::vector< double > | stream_add_times_ |
std::vector< double > | latency_corrected_stream_copy_times_ |
std::vector< double > | latency_corrected_stream_add_times_ |
std::vector< int > | pingpong_sizes_ |
std::vector< double > | pingpong_host_times_ |
std::vector< double > | pingpong_device_times_ |
double | launch_and_wait_latency_ |
Definition at line 63 of file MueLu_PerfModels_decl.hpp.
MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::PerfModels | ( | ) |
Definition at line 247 of file MueLu_PerfModels_def.hpp.
void MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::stream_vector_make_table | ( | int | KERNEL_REPEATS, |
int | LOG_MAX_SIZE = 20 ) |
Definition at line 252 of file MueLu_PerfModels_def.hpp.
double MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::stream_vector_copy_lookup | ( | int | SIZE_IN_BYTES | ) |
Definition at line 289 of file MueLu_PerfModels_def.hpp.
double MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::stream_vector_add_lookup | ( | int | SIZE_IN_BYTES | ) |
Definition at line 295 of file MueLu_PerfModels_def.hpp.
double MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::latency_corrected_stream_vector_copy_lookup | ( | int | SIZE_IN_BYTES | ) |
Definition at line 308 of file MueLu_PerfModels_def.hpp.
double MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::latency_corrected_stream_vector_add_lookup | ( | int | SIZE_IN_BYTES | ) |
Definition at line 314 of file MueLu_PerfModels_def.hpp.
double MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::stream_vector_lookup | ( | int | SIZE_IN_BYTES | ) |
Definition at line 301 of file MueLu_PerfModels_def.hpp.
double MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::latency_corrected_stream_vector_lookup | ( | int | SIZE_IN_BYTES | ) |
Definition at line 320 of file MueLu_PerfModels_def.hpp.
void MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::print_stream_vector_table | ( | std::ostream & | out | ) |
Definition at line 327 of file MueLu_PerfModels_def.hpp.
void MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::print_latency_corrected_stream_vector_table | ( | std::ostream & | out | ) |
Definition at line 333 of file MueLu_PerfModels_def.hpp.
void MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::pingpong_make_table | ( | int | KERNEL_REPEATS, |
int | LOG_MAX_SIZE, | ||
const RCP< const Teuchos::Comm< int > > & | comm ) |
Definition at line 382 of file MueLu_PerfModels_def.hpp.
double MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::pingpong_host_lookup | ( | int | SIZE_IN_BYTES | ) |
Definition at line 392 of file MueLu_PerfModels_def.hpp.
double MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::pingpong_device_lookup | ( | int | SIZE_IN_BYTES | ) |
Definition at line 398 of file MueLu_PerfModels_def.hpp.
void MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::print_pingpong_table | ( | std::ostream & | out | ) |
Definition at line 405 of file MueLu_PerfModels_def.hpp.
void MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::launch_latency_make_table | ( | int | KERNEL_REPEATS | ) |
Definition at line 437 of file MueLu_PerfModels_def.hpp.
double MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::launch_latency_lookup | ( | ) |
Definition at line 460 of file MueLu_PerfModels_def.hpp.
void MueLu::PerfModels< Scalar, LocalOrdinal, GlobalOrdinal, Node >::print_launch_latency_table | ( | std::ostream & | out | ) |
Definition at line 467 of file MueLu_PerfModels_def.hpp.
|
private |
Definition at line 340 of file MueLu_PerfModels_def.hpp.
|
private |
Definition at line 129 of file MueLu_PerfModels_decl.hpp.
|
private |
Definition at line 130 of file MueLu_PerfModels_decl.hpp.
|
private |
Definition at line 131 of file MueLu_PerfModels_decl.hpp.
|
private |
Definition at line 132 of file MueLu_PerfModels_decl.hpp.
|
private |
Definition at line 133 of file MueLu_PerfModels_decl.hpp.
|
private |
Definition at line 135 of file MueLu_PerfModels_decl.hpp.
|
private |
Definition at line 136 of file MueLu_PerfModels_decl.hpp.
|
private |
Definition at line 137 of file MueLu_PerfModels_decl.hpp.
|
private |
Definition at line 139 of file MueLu_PerfModels_decl.hpp.