Home
last modified time | relevance | path

Searched defs:threads_per_block (Results 1 – 11 of 11) sorted by relevance

/external/tensorflow/tensorflow/compiler/xla/service/gpu/
Dlaunch_dimensions.cc38 int64 threads_per_block = gpu_device_info.threads_per_block_limit; in ThreadsPerBlockLimit() local
79 int64 threads_per_block = ThreadsPerBlockLimit(gpu_device_info); in CalculateLaunchDimensions() local
Delemental_ir_emitter.cc313 llvm::Value* threads_per_block = IntCast( in EmitThreadId() local
Dir_emitter_unnested.cc4321 int threads_per_block) { in EmitFullWarpShuffleDownLoopForAllReduces()
4332 llvm::Value* partial_result_address, int threads_per_block) { in EmitFullWarpShuffleDownLoopForReduce()
4669 llvm::Value* IrEmitterUnnested::EmitThreadId(int64 threads_per_block, in EmitThreadId()
4681 int64 threads_per_block, llvm::Type* index_ty, int64 num_threads_x) { in EmitThreadIdInfo()
/external/tensorflow/tensorflow/core/kernels/image/
Dadjust_hue_op_gpu.cu.cc35 const int threads_per_block = config.thread_per_block; in operator ()() local
Dadjust_saturation_op_gpu.cu.cc36 const int threads_per_block = config.thread_per_block; in operator ()() local
/external/tensorflow/tensorflow/stream_executor/
Ddevice_description.cc155 int64 element_count, int64 *threads_per_block, in CalculateDimensionality()
/external/tensorflow/tensorflow/stream_executor/gpu/
Dredzone_allocator.cc223 int64 threads_per_block = std::min( in RunRedzoneChecker() local
/external/mesa3d/src/gallium/drivers/radeonsi/
Dsi_get.c731 unsigned threads_per_block = get_max_threads_per_block(sscreen, ir_type); in si_get_compute_param() local
/external/mesa3d/src/gallium/drivers/r600/
Dr600_pipe_common.c958 unsigned threads_per_block = get_max_threads_per_block(rscreen, ir_type); in r600_get_compute_param() local
/external/tensorflow/tensorflow/stream_executor/rocm/
Drocm_driver.cc1308 GpuContext* context, hipFunction_t kernel, int threads_per_block, in GetMaxOccupiedBlocksPerCore()
/external/tensorflow/tensorflow/stream_executor/cuda/
Dcuda_driver.cc1624 GpuContext* context, CUfunction kernel, int threads_per_block, in GetMaxOccupiedBlocksPerCore()