Home
last modified time | relevance | path

Searched refs:KernelBase (Results 1 – 22 of 22) sorted by relevance

/external/tensorflow/tensorflow/stream_executor/
Dkernel.cc61 KernelBase::KernelBase(KernelBase &&from) in KernelBase() function in stream_executor::KernelBase
70 KernelBase::KernelBase(StreamExecutor *parent) in KernelBase() function in stream_executor::KernelBase
74 KernelBase::KernelBase(StreamExecutor *parent, in KernelBase() function in stream_executor::KernelBase
78 KernelBase::~KernelBase() { in ~KernelBase()
84 unsigned KernelBase::Arity() const { return implementation_->Arity(); } in Arity()
86 void KernelBase::SetPreferredCacheConfig(KernelCacheConfig config) { in SetPreferredCacheConfig()
90 KernelCacheConfig KernelBase::GetPreferredCacheConfig() const { in GetPreferredCacheConfig()
97 void KernelBase::set_name(absl::string_view name) { in set_name()
Dkernel.h135 class KernelBase {
137 KernelBase(KernelBase &&from);
143 explicit KernelBase(StreamExecutor *parent);
146 KernelBase(StreamExecutor *parent, internal::KernelInterface *implementation);
150 ~KernelBase();
196 SE_DISALLOW_COPY_AND_ASSIGN(KernelBase);
497 class TypedKernel : public KernelBase {
502 explicit TypedKernel(StreamExecutor *parent) : KernelBase(parent) {}
507 : KernelBase(parent, implementation) {}
Dstream_executor_internal.h183 KernelBase *kernel) { in GetKernel()
192 const BlockDim &block_dims, const KernelBase &k, in Launch()
197 virtual void UnloadKernel(const KernelBase *kernel) {} in UnloadKernel()
Dtrace_listener.h51 const KernelBase& kernel, in LaunchSubmit()
Dstream_executor_pimpl.h105 bool GetKernel(const MultiKernelLoaderSpec &spec, KernelBase *kernel);
108 void UnloadKernel(const KernelBase *kernel);
453 const BlockDim &block_dims, const KernelBase &kernel,
Dstream_executor_pimpl.cc235 KernelBase *kernel) { in GetKernel()
239 void StreamExecutor::UnloadKernel(const KernelBase *kernel) { in UnloadKernel()
481 const KernelBase &kernel, in Launch()
/external/gemmlowp/internal/
Dkernel_neon.h34 struct NEON_32_Kernel12x4Depth2 : KernelBase {
293 struct NEON_32_Kernel12x4Depth2Assuming12BitProducts : KernelBase {
667 struct NEON_32bit_GEMM_Int8Operands_LhsNonzero : KernelBase {
929 struct NEON_64bit_GEMM_Int8Operands_LhsNonzero : KernelBase {
1265 struct NEON_64_Kernel12x8Depth2 : KernelBase {
Dcompute.h34 const KernelBase& kernel_;
42 ComputeImpl(const KernelBase& _kernel, const BlockParams& _block_params, in ComputeImpl()
106 void Compute(const KernelBase& kernel, const BlockParams& block_params, in Compute()
Dkernel_sse.h32 struct SSE4_32_Kernel4x4Depth2 : KernelBase {
206 struct SSE4_64_Kernel12x4Depth2 : KernelBase {
Dkernel.h205 struct KernelBase { struct
216 virtual ~KernelBase() {} in ~KernelBase() argument
Dkernel_msa.h44 struct MSA_Kernel12x8Depth2 : KernelBase {
Dmulti_thread_gemm.h441 GemmWithPackedRhsTask(GemmContextType* _context, const KernelBase& _kernel, in GemmWithPackedRhsTask()
499 const KernelBase& kernel;
608 void MultiThreadGemm(GemmContextType* context, const KernelBase& kernel, in MultiThreadGemm()
Dkernel_reference.h33 struct ReferenceKernel : KernelBase {
Dsingle_thread_gemm.h67 const KernelBase& kernel, in SingleThreadGemm()
/external/tensorflow/tensorflow/stream_executor/gpu/
Dgpu_executor.h65 KernelBase* kernel) override;
67 void UnloadKernel(const KernelBase* kernel) override;
73 const BlockDim& block_dims, const KernelBase& k,
269 void VlogOccupancyInfo(const KernelBase& kernel, const ThreadDim& thread_dims,
304 std::unordered_map<const KernelBase*, const void*> kernel_to_gpu_binary_
Dgpu_kernel.h92 inline const GpuKernel* AsGpuKernel(const KernelBase* kernel) { in AsGpuKernel()
98 inline GpuKernel* AsGpuKernel(KernelBase* kernel) { in AsGpuKernel()
/external/tensorflow/tensorflow/compiler/xla/service/gpu/
Dkernel_thunk.cc60 it = kernel_cache_.emplace(executor, se::KernelBase(executor)).first; in Initialize()
80 const se::KernelBase* kernel = nullptr; in ExecuteOnStream()
Dkernel_thunk.h91 std::unordered_map<se::StreamExecutor*, se::KernelBase> kernel_cache_
/external/tensorflow/tensorflow/compiler/xla/service/interpreter/
Dexecutor.h62 KernelBase *kernel) override { in GetKernel()
66 const BlockDim &block_dims, const KernelBase &kernel, in Launch()
/external/tensorflow/tensorflow/stream_executor/host/
Dhost_gpu_executor.h54 KernelBase *kernel) override { in GetKernel()
58 const BlockDim &block_dims, const KernelBase &kernel, in Launch()
/external/tensorflow/tensorflow/stream_executor/rocm/
Drocm_gpu_executor.cc139 void GpuExecutor::UnloadKernel(const KernelBase* kernel) { in UnloadKernel()
222 KernelBase* kernel) { in GetKernel()
287 const BlockDim& block_dims, const KernelBase& kernel, in Launch()
419 void GpuExecutor::VlogOccupancyInfo(const KernelBase& kernel, in VlogOccupancyInfo()
/external/tensorflow/tensorflow/stream_executor/cuda/
Dcuda_gpu_executor.cc268 KernelBase* kernel) { in GetKernel()
344 void GpuExecutor::UnloadKernel(const KernelBase* kernel) { in UnloadKernel()
421 const BlockDim& block_dims, const KernelBase& kernel, in Launch()
466 void GpuExecutor::VlogOccupancyInfo(const KernelBase& kernel, in VlogOccupancyInfo()