Go to the source code of this file.
|
int_t | get_max_buffer_size () |
|
double | get_acc_async_cost () |
|
double | estimate_acc_time (int m, int n, int k) |
|
double | estimate_acc_gemm_time (int m, int n, int k) |
|
double | estimate_acc_scatter_time (int m, int n, int k) |
|
double | estimate_cpu_time (int m, int n, int k) |
|
double | acc_data_send_time (size_t sz) |
|
void | LookUpTableInit (int my_rank) |
|
int_t | fixed_cpu_acc_partition (Ublock_info_t *Ublock_info_Phi, int_t num_u_blks_Phi, int_t Rnbrow, int_t ldu_Phi) |
|
int_t | tuned_partition (int_t num_u_blks_Phi, Ublock_info_t *Ublock_info_Phi, Remain_info_t *Remain_info, int_t RemainBlk, double cpu_time_0, int_t Rnbrow, int_t ldu_Phi) |
|
◆ mdwin_t
◆ acc_data_send_time()
double acc_data_send_time (size_t sz)
◆ estimate_acc_gemm_time()
double estimate_acc_gemm_time (int m, int n, int k)
◆ estimate_acc_scatter_time()
double estimate_acc_scatter_time (int m, int n, int k)
◆ estimate_acc_time()
double estimate_acc_time (int m, int n, int k)
◆ estimate_cpu_time()
double estimate_cpu_time (int m, int n, int k)
◆ fixed_cpu_acc_partition()
◆ get_acc_async_cost()
double get_acc_async_cost ()
◆ get_max_buffer_size()
int_t get_max_buffer_size ()
◆ LookUpTableInit()
void LookUpTableInit (int my_rank)
◆ tuned_partition()