Searched refs:total_work_block (Results 1 – 3 of 3) sorted by relevance
17 constexpr int total_work_block = n_threads * n_elems_per_thread; in C10_LAUNCH_BOUNDS_2() local18 int idx = total_work_block * blockIdx.x + threadIdx.x; in C10_LAUNCH_BOUNDS_2()36 constexpr int total_work_block = n_threads * n_elems_per_thread; in _lauch_kernel() local37 dim3 grid((total_n_elems + total_work_block - 1) / total_work_block); in _lauch_kernel()
78 constexpr int total_work_block = n_threads * n_elems_per_thread; in C10_LAUNCH_BOUNDS_2() local79 int idx = total_work_block * blockIdx.x + threadIdx.x; in C10_LAUNCH_BOUNDS_2()97 constexpr int total_work_block = n_threads * n_elems_per_thread; in _launch_kernel() local98 dim3 grid((total_n_elems + total_work_block - 1) / total_work_block); in _launch_kernel()
25 constexpr int total_work_block = n_threads * n_elems_per_thread; in C10_LAUNCH_BOUNDS_2() local26 int idx = total_work_block * blockIdx.x + threadIdx.x; in C10_LAUNCH_BOUNDS_2()44 constexpr int total_work_block = n_threads * n_elems_per_thread; in _launch_unfold_backward_kernel() local45 dim3 grid((total_n_elems + total_work_block - 1) / total_work_block); in _launch_unfold_backward_kernel()