Home
last modified time | relevance | path

Searched refs:max_threads_per_block (Results 1 – 17 of 17) sorted by relevance

/external/clang/test/CodeGenCUDA/
Dlaunch-bounds.cu32 template <int max_threads_per_block>
34 __launch_bounds__(max_threads_per_block) in __launch_bounds__() argument
42 template <int max_threads_per_block, int min_blocks_per_mp>
44 __launch_bounds__(max_threads_per_block, min_blocks_per_mp) in __launch_bounds__() argument
54 template <int max_threads_per_block, int min_blocks_per_mp>
56 __launch_bounds__(max_threads_per_block + constint,
57 min_blocks_per_mp + max_threads_per_block)
/external/llvm-project/clang/test/CodeGenCUDA/
Dlaunch-bounds.cu32 template <int max_threads_per_block>
34 __launch_bounds__(max_threads_per_block) in __launch_bounds__() argument
42 template <int max_threads_per_block, int min_blocks_per_mp>
44 __launch_bounds__(max_threads_per_block, min_blocks_per_mp) in __launch_bounds__() argument
54 template <int max_threads_per_block, int min_blocks_per_mp>
56 __launch_bounds__(max_threads_per_block + constint,
57 min_blocks_per_mp + max_threads_per_block)
/external/mesa3d/src/gallium/frontends/clover/core/
Ddevice.hpp69 size_t max_threads_per_block() const;
Ddevice.cpp177 device::max_threads_per_block() const { in max_threads_per_block() function in device
Dkernel.cpp141 q.device().max_threads_per_block(), q.device().max_block_size(), in optimal_block_size()
/external/mesa3d/src/gallium/drivers/softpipe/
Dsp_screen.c531 uint64_t *max_threads_per_block = ret; in softpipe_get_compute_param() local
532 *max_threads_per_block = 1024; in softpipe_get_compute_param()
/external/mesa3d/src/gallium/frontends/clover/api/
Dkernel.cpp164 buf.as_scalar<size_t>() = dev.max_threads_per_block(); in clGetKernelWorkGroupInfo()
306 q.device().max_threads_per_block()) in validate_block_size()
Ddevice.cpp125 buf.as_scalar<size_t>() = dev.max_threads_per_block(); in clGetDeviceInfo()
/external/tensorflow/tensorflow/core/profiler/internal/gpu/
Dcupti_collector.cc550 auto max_threads_per_block = in GetDeviceCapabilities() local
569 max_threads_per_block && max_threads_per_sm && regs_per_block && in GetDeviceCapabilities()
575 device_properties_.maxThreadsPerBlock = *max_threads_per_block; in GetDeviceCapabilities()
/external/mesa3d/src/gallium/drivers/llvmpipe/
Dlp_screen.c467 uint64_t *max_threads_per_block = ret; in llvmpipe_get_compute_param() local
468 *max_threads_per_block = 1024; in llvmpipe_get_compute_param()
/external/mesa3d/src/gallium/drivers/radeonsi/
Dsi_get.c740 uint64_t *max_threads_per_block = ret; in si_get_compute_param() local
741 *max_threads_per_block = get_max_threads_per_block(sscreen, ir_type); in si_get_compute_param()
Dsi_pipe.c681 uint64_t max_threads_per_block; in si_create_context() local
683 &max_threads_per_block); in si_create_context()
698 MAX2(32 * sscreen->info.num_good_compute_units, max_threads_per_block / 64); in si_create_context()
/external/mesa3d/src/gallium/drivers/virgl/
Dvirgl_screen.c484 uint64_t *max_threads_per_block = ret; in virgl_get_compute_param() local
485 *max_threads_per_block = vscreen->caps.caps.v2.max_compute_work_group_invocations; in virgl_get_compute_param()
/external/mesa3d/src/gallium/frontends/lavapipe/
Dlvp_device.c394 uint64_t max_threads_per_block, max_local_size; in lvp_GetPhysicalDeviceProperties() local
402 &max_threads_per_block); in lvp_GetPhysicalDeviceProperties()
461 .maxComputeWorkGroupInvocations = max_threads_per_block, in lvp_GetPhysicalDeviceProperties()
/external/mesa3d/src/mesa/state_tracker/
Dst_extensions.c1582 uint64_t max_local_size, max_threads_per_block; in st_init_extensions() local
1590 &max_threads_per_block); in st_init_extensions()
1595 consts->MaxComputeWorkGroupInvocations = max_threads_per_block; in st_init_extensions()
/external/mesa3d/src/gallium/drivers/r600/
Dr600_pipe_common.c967 uint64_t *max_threads_per_block = ret; in r600_get_compute_param() local
968 *max_threads_per_block = get_max_threads_per_block(rscreen, ir_type); in r600_get_compute_param()
/external/mesa3d/src/amd/vulkan/
Dradv_device.c2814 uint32_t max_threads_per_block = 2048; in radv_CreateDevice() local
2816 max_threads_per_block / 64); in radv_CreateDevice()