Searched defs:threads_per_block (Results 1 – 12 of 12) sorted by relevance
| /external/tensorflow/tensorflow/core/kernels/image/ |
| D | adjust_hue_op_gpu.cu.cc | 35 const int threads_per_block = config.thread_per_block; in operator ()() local
|
| D | adjust_saturation_op_gpu.cu.cc | 36 const int threads_per_block = config.thread_per_block; in operator ()() local
|
| /external/tensorflow/tensorflow/stream_executor/rocm/ |
| D | rocm_helpers.cu.cc | 36 const int threads_per_block = 256; in rocm_MakeBatchPointers() local
|
| D | rocm_driver.cc | 1339 GpuContext* context, hipFunction_t kernel, int threads_per_block, in GetMaxOccupiedBlocksPerCore()
|
| /external/tensorflow/tensorflow/compiler/xla/stream_executor/ |
| D | device_description.cc | 143 int64_t element_count, int64_t *threads_per_block, in CalculateDimensionality()
|
| /external/tensorflow/tensorflow/compiler/xla/service/gpu/ |
| D | launch_dimensions.cc | 39 int64_t threads_per_block = gpu_device_info.threads_per_block_limit; in ThreadsPerBlockLimit() local
|
| D | elemental_ir_emitter.cc | 329 llvm::Value* threads_per_block = IntCast( in EmitThreadId() local
|
| D | ir_emitter_unnested.cc | 3666 int threads_per_block, int num_results_per_warp) { in EmitFullWarpShuffleDownLoopForReduce() 4055 llvm::Value* IrEmitterUnnested::EmitThreadId(int64_t threads_per_block, in EmitThreadId()
|
| /external/tensorflow/tensorflow/compiler/xla/stream_executor/gpu/ |
| D | redzone_allocator.cc | 224 int64_t threads_per_block = std::min( in RunRedzoneChecker() local
|
| /external/mesa3d/src/gallium/drivers/radeonsi/ |
| D | si_get.c | 731 unsigned threads_per_block = get_max_threads_per_block(sscreen, ir_type); in si_get_compute_param() local
|
| /external/mesa3d/src/gallium/drivers/r600/ |
| D | r600_pipe_common.c | 958 unsigned threads_per_block = get_max_threads_per_block(rscreen, ir_type); in r600_get_compute_param() local
|
| /external/tensorflow/tensorflow/compiler/xla/stream_executor/cuda/ |
| D | cuda_driver.cc | 1637 GpuContext* context, CUfunction kernel, int threads_per_block, in GetMaxOccupiedBlocksPerCore()
|