kernel_launch.hpp Source File#
tile/host/kernel_launch.hpp
Go to the documentation of this file.
51// Arch can be used to support linking multiple object files that have the same kernel compiled for
149 * this is the function to launch an arbitrary number of kernels with an optional timer (selected by stream_config)
152 * the simplest way is to pass in a lambda function, with "[=](const stream_config& s){ call_your_kernel_here() }"
161 * if you use a ck_tile kernel, or one similar to this style (a structure with "static __device__ operator()(...){}")
162 * you can pass your kernel to ck_tile::make_kernel(), which will create an anonymous functor for you,
197launch_kernel_time_mask(const stream_config& s, PreprocessFunc preprocess, Callables&&... callables)
#define HIP_CHECK_ERROR(retval_or_funcall)
Definition host_utility/hip_check_error.hpp:21
Definition tile/core/algorithm/cluster_descriptor.hpp:13
CK_TILE_HOST double timing_loop_impl(TimerType timer, const stream_config &s, CallablesFunc &&callables_func, PreprocessFunc preprocess=nullptr)
Definition tile/host/kernel_launch.hpp:106
CK_TILE_HOST auto make_kernel(KernelImpl, dim3 grid_dim, dim3 block_dim, std::size_t lds_byte, Args... args)
Definition tile/host/kernel_launch.hpp:60
CK_TILE_HOST double preprocess_profiling_impl(TimerType timer, const stream_config &s, PreprocessFunc preprocess)
Definition tile/host/kernel_launch.hpp:90
CK_TILE_HOST void launch_and_check(const stream_config &sc, Callables &&... callables)
Definition tile/host/kernel_launch.hpp:78
CK_TILE_HOST float launch_kernel_time_mask(const stream_config &s, PreprocessFunc preprocess, Callables &&... callables)
Definition tile/host/kernel_launch.hpp:197
CK_TILE_HOST float launch_kernel(const stream_config &s, Callables &&... callables)
Definition tile/host/kernel_launch.hpp:173
Definition timer.hpp:52
Definition timer.hpp:15
Definition ck_tile/host/stream_config.hpp:30
hipStream_t stream_id_
Definition ck_tile/host/stream_config.hpp:31