libxmp/libxmpf in Omni Compiler
1.3.4
|
Go to the source code of this file.
Macros | |
#define | _XMP_GPU_M_GTOL(_desc, _dim) (((_XMP_gpu_array_t *)_desc)[_dim].gtol) |
#define | _XMP_GPU_M_ACC(_desc, _dim) (((_XMP_gpu_array_t *)_desc)[_dim].acc) |
#define | _XMP_M_CEILi(a_, b_) (((a_) % (b_)) == 0 ? ((a_) / (b_)) : ((a_) / (b_)) + 1) |
#define | _XMP_M_FLOORi(a_, b_) ((a_) / (b_)) |
#define | _XMP_M_COUNT_TRIPLETi(l_, u_, s_) (_XMP_M_FLOORi(((u_) - (l_)), s_) + 1) |
#define | _XMP_GPU_M_BARRIER_THREADS() __syncthreads() |
#define | _XMP_GPU_M_BARRIER_KERNEL() cudaThreadSynchronize() |
#define | _XMP_GPU_M_GET_ARRAY_GTOL(_gtol, _desc, _dim) _gtol = _XMP_GPU_M_GTOL(_desc, _dim) |
#define | _XMP_GPU_M_GET_ARRAY_ACC(_acc, _desc, _dim) _acc = _XMP_GPU_M_ACC(_desc, _dim) |
#define | _XMP_gpu_calc_iter_MAP_THREADS_1(_l0, _u0, _s0, _i0) |
#define | _XMP_gpu_calc_iter_MAP_THREADS_2(_l0, _u0, _s0, _l1, _u1, _s1, _i0, _i1) |
#define | _XMP_gpu_calc_iter_MAP_THREADS_3(_l0, _u0, _s0, _l1, _u1, _s1, _l2, _u2, _s2, _i0, _i1, _i2) |
#define | _XMP_GPU_M_CALC_CONFIG_PARAMS(_x, _y, _z) |
Functions | |
void | _XMP_fatal (char *msg) |
template<typename T > | |
__device__ void | _XMP_gpu_calc_thread_id (T *index) |
template<typename T > | |
__device__ void | _XMP_gpu_calc_iter (unsigned long long tid, T lower0, T upper0, T stride0, T *iter0) |
template<typename T > | |
__device__ void | _XMP_gpu_calc_iter (unsigned long long tid, T lower0, T upper0, T stride0, T lower1, T upper1, T stride1, T *iter0, T *iter1) |
template<typename T > | |
__device__ void | _XMP_gpu_calc_iter (unsigned long long tid, T lower0, T upper0, T stride0, T lower1, T upper1, T stride1, T lower2, T upper2, T stride2, T *iter0, T *iter1, T *iter2) |
template<typename T > | |
void | _XMP_gpu_calc_config_params (unsigned long long *total_iter, int *block_x, int *block_y, int *block_z, int *thread_x, int *thread_y, int *thread_z, T lower0, T upper0, T stride0) |
template<typename T > | |
void | _XMP_gpu_calc_config_params (unsigned long long *total_iter, int *block_x, int *block_y, int *block_z, int *thread_x, int *thread_y, int *thread_z, T lower0, T upper0, T stride0, T lower1, T upper1, T stride1) |
template<typename T > | |
void | _XMP_gpu_calc_config_params (unsigned long long *total_iter, int *block_x, int *block_y, int *block_z, int *thread_x, int *thread_y, int *thread_z, T lower0, T upper0, T stride0, T lower1, T upper1, T stride1, T lower2, T upper2, T stride2) |
template<typename T > | |
void | _XMP_gpu_calc_config_params_MAP_THREADS (int *block_x, int *block_y, int *block_z, int *thread_x, int *thread_y, int *thread_z, int thread_x_v, T lower0, T upper0, T stride0) |
template<typename T > | |
void | _XMP_gpu_calc_config_params_MAP_THREADS (int *block_x, int *block_y, int *block_z, int *thread_x, int *thread_y, int *thread_z, int thread_x_v, int thread_y_v, T lower0, T upper0, T stride0, T lower1, T upper1, T stride1) |
template<typename T > | |
void | _XMP_gpu_calc_config_params_MAP_THREADS (int *block_x, int *block_y, int *block_z, int *thread_x, int *thread_y, int *thread_z, int thread_x_v, int thread_y_v, int thread_z_v, T lower0, T upper0, T stride0, T lower1, T upper1, T stride1, T lower2, T upper2, T stride2) |
Variables | |
int | _XMP_gpu_max_thread |
int | _XMP_gpu_max_block_dim_x |
int | _XMP_gpu_max_block_dim_y |
int | _XMP_gpu_max_block_dim_z |
#define _XMP_gpu_calc_iter_MAP_THREADS_1 | ( | _l0, | |
_u0, | |||
_s0, | |||
_i0 | |||
) |
#define _XMP_gpu_calc_iter_MAP_THREADS_2 | ( | _l0, | |
_u0, | |||
_s0, | |||
_l1, | |||
_u1, | |||
_s1, | |||
_i0, | |||
_i1 | |||
) |
#define _XMP_gpu_calc_iter_MAP_THREADS_3 | ( | _l0, | |
_u0, | |||
_s0, | |||
_l1, | |||
_u1, | |||
_s1, | |||
_l2, | |||
_u2, | |||
_s2, | |||
_i0, | |||
_i1, | |||
_i2 | |||
) |
#define _XMP_GPU_M_ACC | ( | _desc, | |
_dim | |||
) | (((_XMP_gpu_array_t *)_desc)[_dim].acc) |
#define _XMP_GPU_M_BARRIER_KERNEL | ( | ) | cudaThreadSynchronize() |
#define _XMP_GPU_M_BARRIER_THREADS | ( | ) | __syncthreads() |
#define _XMP_GPU_M_CALC_CONFIG_PARAMS | ( | _x, | |
_y, | |||
_z | |||
) |
#define _XMP_GPU_M_GET_ARRAY_ACC | ( | _acc, | |
_desc, | |||
_dim | |||
) | _acc = _XMP_GPU_M_ACC(_desc, _dim) |
#define _XMP_GPU_M_GET_ARRAY_GTOL | ( | _gtol, | |
_desc, | |||
_dim | |||
) | _gtol = _XMP_GPU_M_GTOL(_desc, _dim) |
#define _XMP_GPU_M_GTOL | ( | _desc, | |
_dim | |||
) | (((_XMP_gpu_array_t *)_desc)[_dim].gtol) |
#define _XMP_M_CEILi | ( | a_, | |
b_ | |||
) | (((a_) % (b_)) == 0 ? ((a_) / (b_)) : ((a_) / (b_)) + 1) |
#define _XMP_M_COUNT_TRIPLETi | ( | l_, | |
u_, | |||
s_ | |||
) | (_XMP_M_FLOORi(((u_) - (l_)), s_) + 1) |
#define _XMP_M_FLOORi | ( | a_, | |
b_ | |||
) | ((a_) / (b_)) |
void _XMP_fatal | ( | char * | msg | ) |
void _XMP_gpu_calc_config_params | ( | unsigned long long * | total_iter, |
int * | block_x, | ||
int * | block_y, | ||
int * | block_z, | ||
int * | thread_x, | ||
int * | thread_y, | ||
int * | thread_z, | ||
T | lower0, | ||
T | upper0, | ||
T | stride0 | ||
) |
void _XMP_gpu_calc_config_params | ( | unsigned long long * | total_iter, |
int * | block_x, | ||
int * | block_y, | ||
int * | block_z, | ||
int * | thread_x, | ||
int * | thread_y, | ||
int * | thread_z, | ||
T | lower0, | ||
T | upper0, | ||
T | stride0, | ||
T | lower1, | ||
T | upper1, | ||
T | stride1 | ||
) |
void _XMP_gpu_calc_config_params | ( | unsigned long long * | total_iter, |
int * | block_x, | ||
int * | block_y, | ||
int * | block_z, | ||
int * | thread_x, | ||
int * | thread_y, | ||
int * | thread_z, | ||
T | lower0, | ||
T | upper0, | ||
T | stride0, | ||
T | lower1, | ||
T | upper1, | ||
T | stride1, | ||
T | lower2, | ||
T | upper2, | ||
T | stride2 | ||
) |
void _XMP_gpu_calc_config_params_MAP_THREADS | ( | int * | block_x, |
int * | block_y, | ||
int * | block_z, | ||
int * | thread_x, | ||
int * | thread_y, | ||
int * | thread_z, | ||
int | thread_x_v, | ||
int | thread_y_v, | ||
int | thread_z_v, | ||
T | lower0, | ||
T | upper0, | ||
T | stride0, | ||
T | lower1, | ||
T | upper1, | ||
T | stride1, | ||
T | lower2, | ||
T | upper2, | ||
T | stride2 | ||
) |
void _XMP_gpu_calc_config_params_MAP_THREADS | ( | int * | block_x, |
int * | block_y, | ||
int * | block_z, | ||
int * | thread_x, | ||
int * | thread_y, | ||
int * | thread_z, | ||
int | thread_x_v, | ||
int | thread_y_v, | ||
T | lower0, | ||
T | upper0, | ||
T | stride0, | ||
T | lower1, | ||
T | upper1, | ||
T | stride1 | ||
) |
void _XMP_gpu_calc_config_params_MAP_THREADS | ( | int * | block_x, |
int * | block_y, | ||
int * | block_z, | ||
int * | thread_x, | ||
int * | thread_y, | ||
int * | thread_z, | ||
int | thread_x_v, | ||
T | lower0, | ||
T | upper0, | ||
T | stride0 | ||
) |
__device__ void _XMP_gpu_calc_iter | ( | unsigned long long | tid, |
T | lower0, | ||
T | upper0, | ||
T | stride0, | ||
T * | iter0 | ||
) |
__device__ void _XMP_gpu_calc_iter | ( | unsigned long long | tid, |
T | lower0, | ||
T | upper0, | ||
T | stride0, | ||
T | lower1, | ||
T | upper1, | ||
T | stride1, | ||
T * | iter0, | ||
T * | iter1 | ||
) |
__device__ void _XMP_gpu_calc_iter | ( | unsigned long long | tid, |
T | lower0, | ||
T | upper0, | ||
T | stride0, | ||
T | lower1, | ||
T | upper1, | ||
T | stride1, | ||
T | lower2, | ||
T | upper2, | ||
T | stride2, | ||
T * | iter0, | ||
T * | iter1, | ||
T * | iter2 | ||
) |
__device__ void _XMP_gpu_calc_thread_id | ( | T * | index | ) |
int _XMP_gpu_max_block_dim_x |
int _XMP_gpu_max_block_dim_y |
int _XMP_gpu_max_block_dim_z |
int _XMP_gpu_max_thread |