Searched defs:C10_LAUNCH_BOUNDS_2 (Results 1 – 12 of 12) sorted by relevance
/external/pytorch/aten/src/ATen/native/sparse/cuda/ |
D | SparseCUDAApplyUtils.cuh | 44 C10_LAUNCH_BOUNDS_2(cuda::getApplyBlockSize(), cuda::getApplyBlocksPerSM()) in C10_LAUNCH_BOUNDS_2() function 74 C10_LAUNCH_BOUNDS_2(cuda::getApplyBlockSize(), cuda::getApplyBlocksPerSM()) in C10_LAUNCH_BOUNDS_2() function 98 C10_LAUNCH_BOUNDS_2(cuda::getApplyBlockSize(), cuda::getApplyBlocksPerSM()) in C10_LAUNCH_BOUNDS_2() function 145 C10_LAUNCH_BOUNDS_2(cuda::getApplyBlockSize(), cuda::getApplyBlocksPerSM()) in C10_LAUNCH_BOUNDS_2() function
|
D | SparseCUDATensorMath.cu | 505 C10_LAUNCH_BOUNDS_2(cuda::getApplyBlockSize(), cuda::getApplyBlocksPerSM()) in C10_LAUNCH_BOUNDS_2() function
|
/external/pytorch/aten/src/ATen/cuda/ |
D | CUDAApplyUtils.cuh | 273 C10_LAUNCH_BOUNDS_2(AT_APPLY_THREADS_PER_BLOCK, AT_APPLY_BLOCKS_PER_SM) in C10_LAUNCH_BOUNDS_2() function 359 C10_LAUNCH_BOUNDS_2(max_threads_per_block, min_blocks_per_sm) in C10_LAUNCH_BOUNDS_2() function
|
/external/pytorch/aten/src/ATen/native/cuda/ |
D | TensorTransformations.cu | 25 C10_LAUNCH_BOUNDS_2(cuda::getApplyBlockSize(), cuda::getApplyBlocksPerSM()) in C10_LAUNCH_BOUNDS_2() function
|
D | FunctionOfAMatrixUtilsKernel.cu | 15 C10_LAUNCH_BOUNDS_2(n_threads, n_elems_per_thread) in C10_LAUNCH_BOUNDS_2() function
|
D | LinearAlgebra.cu | 76 C10_LAUNCH_BOUNDS_2(n_threads, n_elems_per_thread) in C10_LAUNCH_BOUNDS_2() function
|
D | UnfoldBackwardKernel.cu | 23 C10_LAUNCH_BOUNDS_2(n_threads, n_elems_per_thread) in C10_LAUNCH_BOUNDS_2() function
|
D | SparseBinaryOpIntersectionKernel.cu | 47 C10_LAUNCH_BOUNDS_2(nt, vt) in C10_LAUNCH_BOUNDS_2() function
|
D | DistributionTemplates.h | 65 C10_LAUNCH_BOUNDS_2(block_size_bound, grid_size_bound) in C10_LAUNCH_BOUNDS_2() function
|
D | IndexKernel.cu | 27 C10_LAUNCH_BOUNDS_2(nt, launch_bound2) in C10_LAUNCH_BOUNDS_2() function
|
D | ScatterGatherKernel.cu | 87 C10_LAUNCH_BOUNDS_2(nt, vt) in C10_LAUNCH_BOUNDS_2() function
|
/external/pytorch/c10/macros/ |
D | Macros.h | 316 #define C10_LAUNCH_BOUNDS_2(max_threads_per_block, min_blocks_per_sm) \ macro
|