Home
last modified time | relevance | path

Searched refs:thread_dims (Results 1 – 10 of 10) sorted by relevance

/external/tensorflow/tensorflow/stream_executor/cuda/
Dcuda_gpu_executor.cc420 bool GpuExecutor::Launch(Stream* stream, const ThreadDim& thread_dims, in Launch() argument
434 VlogOccupancyInfo(kernel, thread_dims, block_dims); in Launch()
449 block_dims.z, thread_dims.x, thread_dims.y, in Launch()
450 thread_dims.z, args.number_of_shared_bytes(), in Launch()
455 << " args; thread dim: " << thread_dims.ToString() in Launch()
467 const ThreadDim& thread_dims, in VlogOccupancyInfo() argument
471 VLOG(2) << "Thread dimensions (" << thread_dims.x << ", " << thread_dims.y in VlogOccupancyInfo()
472 << ", " << thread_dims.z << ")"; in VlogOccupancyInfo()
491 smem_per_block, thread_dims, cufunc); in VlogOccupancyInfo()
496 smem_per_block, thread_dims, cufunc); in VlogOccupancyInfo()
[all …]
/external/tensorflow/tensorflow/stream_executor/gpu/
Dgpu_executor.h72 bool Launch(Stream* stream, const ThreadDim& thread_dims,
80 const ThreadDim& thread_dims, GpuFunctionHandle func);
87 const ThreadDim& thread_dims, GpuFunctionHandle func);
269 void VlogOccupancyInfo(const KernelBase& kernel, const ThreadDim& thread_dims,
/external/tensorflow/tensorflow/stream_executor/rocm/
Drocm_gpu_executor.cc286 bool GpuExecutor::Launch(Stream* stream, const ThreadDim& thread_dims, in Launch() argument
300 VlogOccupancyInfo(kernel, thread_dims, block_dims); in Launch()
332 block_dims.z, thread_dims.x, thread_dims.y, thread_dims.z, in Launch()
336 << "; thread dim: " << thread_dims.ToString() in Launch()
347 const ThreadDim& thread_dims, in CalculateOccupancy() argument
357 const ThreadDim& thread_dims, in CompareOccupancy() argument
420 const ThreadDim& thread_dims, in VlogOccupancyInfo() argument
/external/tensorflow/tensorflow/stream_executor/
Dtrace_listener.h49 virtual void LaunchSubmit(Stream* stream, const ThreadDim& thread_dims, in LaunchSubmit() argument
Dstream_executor_pimpl.h452 bool Launch(Stream *stream, const ThreadDim &thread_dims,
867 inline Stream &Stream::ThenLaunch(ThreadDim thread_dims, BlockDim block_dims, in ThenLaunch() argument
882 parent_->Launch(this, thread_dims, block_dims, kernel, kernel_args); in ThenLaunch()
Dstream_executor_pimpl.cc479 bool StreamExecutor::Launch(Stream *stream, const ThreadDim &thread_dims, in Launch() argument
483 SubmitTrace(&TraceListener::LaunchSubmit, stream, thread_dims, block_dims, in Launch()
486 return implementation_->Launch(stream, thread_dims, block_dims, kernel, args); in Launch()
Dstream_executor_internal.h191 virtual bool Launch(Stream *stream, const ThreadDim &thread_dims, in Launch() argument
Dstream.h171 Stream &ThenLaunch(ThreadDim thread_dims, BlockDim block_dims,
/external/tensorflow/tensorflow/compiler/xla/service/interpreter/
Dexecutor.h65 bool Launch(Stream *stream, const ThreadDim &thread_dims, in Launch() argument
/external/tensorflow/tensorflow/stream_executor/host/
Dhost_gpu_executor.h57 bool Launch(Stream *stream, const ThreadDim &thread_dims, in Launch() argument