|
HAMR
The Heterogeneous Accelerator Memory Resource
|
Go to the documentation of this file. 1 #ifndef hamr_hip_launch_h
2 #define hamr_hip_launch_h
6 #include "hamr_config.h"
10 #include <hip/hip_runtime.h>
41 int *block_grid_max,
int &warp_size,
42 int &max_warps_per_block);
52 return threadIdx.x + blockDim.x*(blockIdx.x + blockIdx.y * gridDim.x
53 + blockIdx.z * gridDim.x * gridDim.y);
61 return index < max_index;
83 int warps_per_block, dim3 &block_grid,
int &n_blocks,
103 int warps_per_block,
int warp_size,
int *block_grid_max,
104 dim3 &block_grid,
int &n_blocks, dim3 &thread_grid);
__device__ unsigned long thread_id_to_array_index()
Definition: hamr_cuda_launch.h:50
HAMR_EXPORT int get_launch_props(int device_id, int *block_grid_max, int &warp_size, int &max_warps_per_block)
query properties for the named CUDA device. returns non-zero on error
__device__ int index_is_valid(unsigned long index, unsigned long max_index)
bounds check the flat index
Definition: hamr_cuda_launch.h:59
HAMR_EXPORT int partition_thread_blocks(int device_id, size_t array_size, int warps_per_block, dim3 &block_grid, int &n_blocks, dim3 &thread_grid)
heterogeneous accelerator memory resource
Definition: hamr_buffer.h:13