Home
last modified time | relevance | path

Searched refs:NumThreads (Results 1 – 17 of 17) sorted by relevance

/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/gpu/cuda_impl/
Dtopk_lib.cuh72 template <int NumThreads, typename T, typename S, int N, int L, bool AllThreads, bool is_descend, b…
101 template <int NumThreads, typename T, typename S, int L, bool is_descend, bool FullMerge>
103 constexpr int kLoopPerThread = L / NumThreads; in BlockSortBigK()
106 int tid = loop * NumThreads + threadIdx.x; in BlockSortBigK()
119 int tid = loop * NumThreads + threadIdx.x; in BlockSortBigK()
128 template <int NumThreads, typename T, typename S, int N, int L, bool is_descend, bool FullMerge = t…
130 if (L <= NumThreads) { in SortBlockStep()
131 int kNumParallelMerges = NumThreads / L; in SortBlockStep()
135 BlockSortSmallK<NumThreads, T, S, N, L, false, is_descend, FullMerge>(list_k, list_v); in SortBlockStep()
139 …BlockSortSmallK<NumThreads, T, S, N, L, true, is_descend, FullMerge>(list_k + start, list_v + star… in SortBlockStep()
[all …]
Dtranspose_impl_opt.cu85 __global__ void Swap3DTensorLast2DimKernel_shared(const T *input, int NumThreads, int TileHeight, i… in Swap3DTensorLast2DimKernel_shared() argument
90 …int NumRowsPerLoadLoop = NumThreads / TileWidth; // the number of shm rows that all threads can l… in Swap3DTensorLast2DimKernel_shared()
92 NumThreads / TileHeight; // the number of shm cols that all threads can write into output once in Swap3DTensorLast2DimKernel_shared()
/third_party/skia/third_party/externals/swiftshader/third_party/subzero/src/
DLinuxMallocProfiling.cpp67 LinuxMallocProfiling::LinuxMallocProfiling(size_t NumThreads, Ostream *Ls) in LinuxMallocProfiling() argument
69 if (NumThreads != 0) { in LinuxMallocProfiling()
102 LinuxMallocProfiling::LinuxMallocProfiling(size_t NumThreads, Ostream *Ls) { in LinuxMallocProfiling() argument
103 (void)NumThreads; in LinuxMallocProfiling()
DIceBrowserCompileServer.cpp116 char *onInitCallback(uint32_t NumThreads, int *ObjFileFDs, in onInitCallback() argument
152 gCompileServer->getParsedFlags(UseNumThreadsFromBrowser, NumThreads, in onInitCallback()
242 uint32_t NumThreads, int argc, in getParsedFlags() argument
248 ClFlags::Flags.setNumTranslationThreads(NumThreads); in getParsedFlags()
DLinuxMallocProfiling.h32 LinuxMallocProfiling(size_t NumThreads, Ostream *Ls);
DIceBrowserCompileServer.h53 void getParsedFlags(bool UseNumThreadsFromBrowser, uint32_t NumThreads,
/third_party/boost/libs/interprocess/test/
Dcondition_test_template.hpp263 const int NumThreads = thread_factor*queue_size; variable
306 boost::interprocess::ipcdetail::OS_thread_t thgroup[NumThreads]; in do_test_condition_queue_notify_one()
307 for(int i = 0; i< NumThreads; ++i){ in do_test_condition_queue_notify_one()
314 for(int i = 0; i < NumThreads; ++i){ in do_test_condition_queue_notify_one()
326 for(int i = 0; i< NumThreads; ++i){ in do_test_condition_queue_notify_one()
351 boost::interprocess::ipcdetail::OS_thread_t thgroup[NumThreads]; in do_test_condition_queue_notify_all()
352 for(int i = 0; i< NumThreads; ++i){ in do_test_condition_queue_notify_all()
358 for(int i = 0; i < NumThreads; ++i){ in do_test_condition_queue_notify_all()
370 for(int i = 0; i< NumThreads; ++i){ in do_test_condition_queue_notify_all()
/third_party/skia/third_party/externals/swiftshader/third_party/subzero/crosstest/
Dtest_sync_atomic_main.cpp241 const size_t NumThreads = 4; in testAtomicRMWThreads() local
242 pthread_t t[NumThreads]; in testAtomicRMWThreads()
243 pthread_attr_t attr[NumThreads]; in testAtomicRMWThreads()
247 for (size_t m = 0; m < NumThreads; ++m) { in testAtomicRMWThreads()
255 for (size_t m = 0; m < NumThreads; ++m) { in testAtomicRMWThreads()
262 for (size_t m = 0; m < NumThreads; ++m) { in testAtomicRMWThreads()
273 for (size_t m = 0; m < NumThreads; ++m) { in testAtomicRMWThreads()
/third_party/skia/third_party/externals/swiftshader/third_party/marl/tools/bench/
Dbench.go32 NumThreads uint member
50 t.NumThreads = uint(n)
/third_party/grpc/test/cpp/qps/
Dclient_callback.cc68 num_threads_ = NumThreads(config); in CallbackClient()
122 int NumThreads(const ClientConfig& config) { in NumThreads() function in grpc::testing::CallbackClient
Dclient_async.cc168 num_async_threads_(NumThreads(config)) { in AsyncClient()
222 int NumThreads(const ClientConfig& config) { in NumThreads() function in grpc::testing::AsyncClient
/third_party/skia/third_party/externals/swiftshader/third_party/llvm-10.0/llvm/lib/Frontend/OpenMP/
DOMPIRBuilder.cpp307 Value *NumThreads, omp::ProcBindKind ProcBind, bool IsCancellable) { in CreateParallel() argument
315 if (NumThreads) { in CreateParallel()
319 Builder.CreateIntCast(NumThreads, Int32, /*isSigned*/ false)}; in CreateParallel()
/third_party/skia/third_party/externals/swiftshader/third_party/llvm-10.0/llvm/include/llvm/Frontend/OpenMP/
DOMPIRBuilder.h168 Value *IfCondition, Value *NumThreads,
/third_party/benchmark/test/
Duser_counters_test.cc279 CHECK_COUNTER_VALUE(e, int, "foo", EQ, e.NumThreads()); in CheckThreads()
280 CHECK_COUNTER_VALUE(e, int, "bar", EQ, 2 * e.NumThreads()); in CheckThreads()
Doutput_test.h100 int NumThreads() const;
Doutput_test_helper.cc309 int Results::NumThreads() const { in NumThreads() function in Results
/third_party/skia/third_party/externals/swiftshader/third_party/llvm-10.0/llvm/lib/Transforms/Scalar/
DJumpThreading.cpp85 STATISTIC(NumThreads, "Number of jumps threaded");
2138 ++NumThreads; in ThreadEdge()