Home
last modified time | relevance | path

Searched refs:kNumThreads (Results 1 – 25 of 223) sorted by relevance

123456789

/external/pytorch/aten/src/ATen/native/transformers/cuda/mem_eff_attention/kernels/
DcutlassB.h14 …ardKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 64, 64, 32, true>::kNumThreads,
18 …nBackwardKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 64, 64, 32>::kNumThreads,
22 …ardKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 64, 64, 64, true>::kNumThreads,
26 …nBackwardKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 64, 64, 64>::kNumThreads,
30 …dKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 128, 64, 128, true>::kNumThreads,
34 …ackwardKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 128, 64, 128>::kNumThreads,
38 …rdKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 64, 64, 128, true>::kNumThreads,
42 …BackwardKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 64, 64, 128>::kNumThreads,
46 …kwardKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 128, 64, 65536>::kNumThreads,
50 …ckwardKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 64, 64, 65536>::kNumThreads,
[all …]
DcutlassF.h14 …tentionKernel<cutlass::bfloat16_t, cutlass::arch::Sm80, true, 64, 64, 64, true, true>::kNumThreads,
18 …ntionKernel<cutlass::bfloat16_t, cutlass::arch::Sm80, true, 64, 128, 128, true, true>::kNumThreads,
22 …ionKernel<cutlass::bfloat16_t, cutlass::arch::Sm80, true, 32, 128, 65536, true, true>::kNumThreads,
34 … AttentionKernel<cutlass::half_t, cutlass::arch::Sm50, true, 64, 64, 64, true, true>::kNumThreads,
38 …AttentionKernel<cutlass::half_t, cutlass::arch::Sm50, true, 32, 128, 128, true, true>::kNumThreads,
42 …tentionKernel<cutlass::half_t, cutlass::arch::Sm50, true, 32, 128, 65536, true, true>::kNumThreads,
46 … AttentionKernel<cutlass::half_t, cutlass::arch::Sm50, false, 64, 64, 64, true, true>::kNumThreads,
50 …ttentionKernel<cutlass::half_t, cutlass::arch::Sm50, false, 32, 128, 128, true, true>::kNumThreads,
54 …entionKernel<cutlass::half_t, cutlass::arch::Sm50, false, 32, 128, 65536, true, true>::kNumThreads,
69 … AttentionKernel<cutlass::half_t, cutlass::arch::Sm70, true, 64, 64, 64, true, true>::kNumThreads,
[all …]
DcutlassF_f32_aligned.cu12 AttentionKernel<float, cutlass::arch::Sm50, true, 64, 64, 64, true, true>::kNumThreads, in __launch_bounds__() argument
31 AttentionKernel<float, cutlass::arch::Sm70, true, 64, 64, 64, true, true>::kNumThreads, in __launch_bounds__() argument
50 AttentionKernel<float, cutlass::arch::Sm75, true, 64, 64, 64, true, true>::kNumThreads, in __launch_bounds__() argument
69 AttentionKernel<float, cutlass::arch::Sm80, true, 64, 64, 64, true, true>::kNumThreads, in __launch_bounds__() argument
88 AttentionKernel<float, cutlass::arch::Sm50, true, 32, 128, 128, true, true>::kNumThreads, in __launch_bounds__() argument
107 AttentionKernel<float, cutlass::arch::Sm70, true, 32, 128, 128, true, true>::kNumThreads, in __launch_bounds__() argument
126 AttentionKernel<float, cutlass::arch::Sm75, true, 32, 128, 128, true, true>::kNumThreads, in __launch_bounds__() argument
145 AttentionKernel<float, cutlass::arch::Sm80, true, 64, 128, 128, true, true>::kNumThreads, in __launch_bounds__() argument
164 AttentionKernel<float, cutlass::arch::Sm50, true, 32, 128, 65536, true, true>::kNumThreads, in __launch_bounds__() argument
183 AttentionKernel<float, cutlass::arch::Sm70, true, 32, 128, 65536, true, true>::kNumThreads, in __launch_bounds__() argument
[all …]
DcutlassF_f32_notaligned.cu12 AttentionKernel<float, cutlass::arch::Sm50, false, 64, 64, 64, true, true>::kNumThreads, in __launch_bounds__() argument
31 AttentionKernel<float, cutlass::arch::Sm70, false, 64, 64, 64, true, true>::kNumThreads, in __launch_bounds__() argument
50 AttentionKernel<float, cutlass::arch::Sm75, false, 64, 64, 64, true, true>::kNumThreads, in __launch_bounds__() argument
69 AttentionKernel<float, cutlass::arch::Sm50, false, 32, 128, 128, true, true>::kNumThreads, in __launch_bounds__() argument
88 AttentionKernel<float, cutlass::arch::Sm70, false, 32, 128, 128, true, true>::kNumThreads, in __launch_bounds__() argument
107 AttentionKernel<float, cutlass::arch::Sm75, false, 32, 128, 128, true, true>::kNumThreads, in __launch_bounds__() argument
126 AttentionKernel<float, cutlass::arch::Sm50, false, 32, 128, 65536, true, true>::kNumThreads, in __launch_bounds__() argument
145 AttentionKernel<float, cutlass::arch::Sm70, false, 32, 128, 65536, true, true>::kNumThreads, in __launch_bounds__() argument
164 AttentionKernel<float, cutlass::arch::Sm75, false, 32, 128, 65536, true, true>::kNumThreads, in __launch_bounds__() argument
DcutlassF_f16_aligned.cu12 … AttentionKernel<cutlass::half_t, cutlass::arch::Sm50, true, 64, 64, 64, true, true>::kNumThreads, in __launch_bounds__() argument
31 … AttentionKernel<cutlass::half_t, cutlass::arch::Sm70, true, 64, 64, 64, true, true>::kNumThreads, in __launch_bounds__() argument
50 … AttentionKernel<cutlass::half_t, cutlass::arch::Sm75, true, 64, 64, 64, true, true>::kNumThreads, in __launch_bounds__() argument
69 … AttentionKernel<cutlass::half_t, cutlass::arch::Sm80, true, 64, 64, 64, true, true>::kNumThreads, in __launch_bounds__() argument
88 …AttentionKernel<cutlass::half_t, cutlass::arch::Sm50, true, 32, 128, 128, true, true>::kNumThreads, in __launch_bounds__() argument
107 …AttentionKernel<cutlass::half_t, cutlass::arch::Sm70, true, 32, 128, 128, true, true>::kNumThreads, in __launch_bounds__() argument
126 …AttentionKernel<cutlass::half_t, cutlass::arch::Sm75, true, 32, 128, 128, true, true>::kNumThreads, in __launch_bounds__() argument
145 …AttentionKernel<cutlass::half_t, cutlass::arch::Sm80, true, 64, 128, 128, true, true>::kNumThreads, in __launch_bounds__() argument
164 …tentionKernel<cutlass::half_t, cutlass::arch::Sm50, true, 32, 128, 65536, true, true>::kNumThreads, in __launch_bounds__() argument
183 …tentionKernel<cutlass::half_t, cutlass::arch::Sm70, true, 32, 128, 65536, true, true>::kNumThreads, in __launch_bounds__() argument
[all …]
DcutlassB_f16_aligned_k128.cu12 …dKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 128, 64, 128, true>::kNumThreads, in __launch_bounds__() argument
31 …dKernel<cutlass::arch::Sm80, cutlass::half_t, true, false, true, 128, 128, 128, true>::kNumThreads, in __launch_bounds__() argument
50 …ackwardKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 128, 64, 128>::kNumThreads, in __launch_bounds__() argument
69 …ackwardKernel<cutlass::arch::Sm75, cutlass::half_t, true, false, false, 128, 64, 128>::kNumThreads, in __launch_bounds__() argument
88 …ackwardKernel<cutlass::arch::Sm80, cutlass::half_t, true, false, true, 128, 128, 128>::kNumThreads, in __launch_bounds__() argument
107 …rdKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 64, 64, 128, true>::kNumThreads, in __launch_bounds__() argument
126 …rdKernel<cutlass::arch::Sm80, cutlass::half_t, true, false, false, 64, 64, 128, true>::kNumThreads, in __launch_bounds__() argument
145 …BackwardKernel<cutlass::arch::Sm50, cutlass::half_t, true, false, false, 64, 64, 128>::kNumThreads, in __launch_bounds__() argument
164 …BackwardKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 64, 64, 128>::kNumThreads, in __launch_bounds__() argument
183 …BackwardKernel<cutlass::arch::Sm75, cutlass::half_t, true, false, false, 64, 64, 128>::kNumThreads, in __launch_bounds__() argument
[all …]
DcutlassF_f16_notaligned.cu12 … AttentionKernel<cutlass::half_t, cutlass::arch::Sm50, false, 64, 64, 64, true, true>::kNumThreads, in __launch_bounds__() argument
31 … AttentionKernel<cutlass::half_t, cutlass::arch::Sm70, false, 64, 64, 64, true, true>::kNumThreads, in __launch_bounds__() argument
50 … AttentionKernel<cutlass::half_t, cutlass::arch::Sm75, false, 64, 64, 64, true, true>::kNumThreads, in __launch_bounds__() argument
69 …ttentionKernel<cutlass::half_t, cutlass::arch::Sm50, false, 32, 128, 128, true, true>::kNumThreads, in __launch_bounds__() argument
88 …ttentionKernel<cutlass::half_t, cutlass::arch::Sm70, false, 32, 128, 128, true, true>::kNumThreads, in __launch_bounds__() argument
107 …ttentionKernel<cutlass::half_t, cutlass::arch::Sm75, false, 32, 128, 128, true, true>::kNumThreads, in __launch_bounds__() argument
126 …entionKernel<cutlass::half_t, cutlass::arch::Sm50, false, 32, 128, 65536, true, true>::kNumThreads, in __launch_bounds__() argument
145 …entionKernel<cutlass::half_t, cutlass::arch::Sm70, false, 32, 128, 65536, true, true>::kNumThreads, in __launch_bounds__() argument
164 …entionKernel<cutlass::half_t, cutlass::arch::Sm75, false, 32, 128, 65536, true, true>::kNumThreads, in __launch_bounds__() argument
DcutlassB_f16_aligned_k65536_dropout.cu12 …ckwardKernel<cutlass::arch::Sm70, cutlass::half_t, true, true, false, 128, 64, 65536>::kNumThreads, in __launch_bounds__() argument
31 …ckwardKernel<cutlass::arch::Sm75, cutlass::half_t, true, true, false, 128, 64, 65536>::kNumThreads, in __launch_bounds__() argument
50 …ckwardKernel<cutlass::arch::Sm80, cutlass::half_t, true, true, false, 128, 64, 65536>::kNumThreads, in __launch_bounds__() argument
69 …ackwardKernel<cutlass::arch::Sm50, cutlass::half_t, true, true, false, 64, 64, 65536>::kNumThreads, in __launch_bounds__() argument
88 …ackwardKernel<cutlass::arch::Sm70, cutlass::half_t, true, true, false, 64, 64, 65536>::kNumThreads, in __launch_bounds__() argument
107 …ackwardKernel<cutlass::arch::Sm75, cutlass::half_t, true, true, false, 64, 64, 65536>::kNumThreads, in __launch_bounds__() argument
126 …ackwardKernel<cutlass::arch::Sm80, cutlass::half_t, true, true, false, 64, 64, 65536>::kNumThreads, in __launch_bounds__() argument
DcutlassB_f16_aligned_k128_dropout.cu12 …BackwardKernel<cutlass::arch::Sm70, cutlass::half_t, true, true, false, 128, 64, 128>::kNumThreads, in __launch_bounds__() argument
31 …BackwardKernel<cutlass::arch::Sm75, cutlass::half_t, true, true, false, 128, 64, 128>::kNumThreads, in __launch_bounds__() argument
50 …BackwardKernel<cutlass::arch::Sm80, cutlass::half_t, true, true, true, 128, 128, 128>::kNumThreads, in __launch_bounds__() argument
69 …nBackwardKernel<cutlass::arch::Sm50, cutlass::half_t, true, true, false, 64, 64, 128>::kNumThreads, in __launch_bounds__() argument
88 …nBackwardKernel<cutlass::arch::Sm70, cutlass::half_t, true, true, false, 64, 64, 128>::kNumThreads, in __launch_bounds__() argument
107 …nBackwardKernel<cutlass::arch::Sm75, cutlass::half_t, true, true, false, 64, 64, 128>::kNumThreads, in __launch_bounds__() argument
126 …nBackwardKernel<cutlass::arch::Sm80, cutlass::half_t, true, true, false, 64, 64, 128>::kNumThreads, in __launch_bounds__() argument
DcutlassB_f16_aligned_k65536.cu12 …kwardKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 128, 64, 65536>::kNumThreads, in __launch_bounds__() argument
31 …kwardKernel<cutlass::arch::Sm75, cutlass::half_t, true, false, false, 128, 64, 65536>::kNumThreads, in __launch_bounds__() argument
50 …kwardKernel<cutlass::arch::Sm80, cutlass::half_t, true, false, false, 128, 64, 65536>::kNumThreads, in __launch_bounds__() argument
69 …ckwardKernel<cutlass::arch::Sm50, cutlass::half_t, true, false, false, 64, 64, 65536>::kNumThreads, in __launch_bounds__() argument
88 …ckwardKernel<cutlass::arch::Sm70, cutlass::half_t, true, false, false, 64, 64, 65536>::kNumThreads, in __launch_bounds__() argument
107 …ckwardKernel<cutlass::arch::Sm75, cutlass::half_t, true, false, false, 64, 64, 65536>::kNumThreads, in __launch_bounds__() argument
126 …ckwardKernel<cutlass::arch::Sm80, cutlass::half_t, true, false, false, 64, 64, 65536>::kNumThreads, in __launch_bounds__() argument
/external/icing/icing/index/lite/
Dlite-index_thread-safety_test.cc133 constexpr int kNumThreads = 50; in TEST_F() local
134 std::vector<std::vector<DocHitInfo>> hits(kNumThreads); in TEST_F()
144 for (int i = 0; i < kNumThreads; ++i) { in TEST_F()
149 for (int i = 0; i < kNumThreads; ++i) { in TEST_F()
182 constexpr int kNumThreads = 50; in TEST_F() local
183 std::vector<std::vector<DocHitInfo>> hits(kNumThreads); in TEST_F()
200 for (int i = 0; i < kNumThreads; ++i) { in TEST_F()
205 for (int i = 0; i < kNumThreads; ++i) { in TEST_F()
233 constexpr int kNumThreads = 50; in TEST_F() local
234 std::vector<std::vector<DocHitInfo>> hits(kNumThreads); in TEST_F()
[all …]
/external/icing/icing/result/
Dresult-state-manager_thread-safety_test.cc191 constexpr int kNumThreads = 50; in TEST_F() local
192 std::vector<std::optional<PageResultInfo>> page_results(kNumThreads); in TEST_F()
209 for (int i = 0; i < kNumThreads; ++i) { in TEST_F()
214 for (int i = 0; i < kNumThreads; ++i) { in TEST_F()
241 for (int i = 0; i < kNumThreads; ++i) { in TEST_F()
294 constexpr int kNumThreads = 50; in TEST_F() local
295 std::vector<std::optional<PageResultInfo>> page_results(kNumThreads); in TEST_F()
317 for (int i = 0; i < kNumThreads; ++i) { in TEST_F()
327 for (int i = 0; i < kNumThreads; ++i) { in TEST_F()
379 constexpr int kNumThreads = 50; in TEST_F() local
[all …]
/external/grpc-grpc/test/core/client_channel/resolvers/
Dgoogle_c2p_resolver_test.cc68 const int kNumThreads = 10; in TEST() local
69 threads.reserve(kNumThreads); in TEST()
70 for (int i = 0; i < kNumThreads; i++) { in TEST()
87 const int kNumThreads = 10; in TEST() local
88 threads.reserve(kNumThreads); in TEST()
89 for (int i = 0; i < kNumThreads; i++) { in TEST()
/external/compiler-rt/test/tsan/Darwin/
Dgcd-once.mm8 static const long kNumThreads = 4;
40 barrier_init(&barrier, kNumThreads);
42 pthread_t t[kNumThreads];
43 for (int i = 0; i < kNumThreads; i++) {
46 for (int i = 0; i < kNumThreads; i++) {
/external/rust/android-crates-io/crates/quiche/deps/boringssl/src/crypto/
Dthread_test.cc135 constexpr size_t kNumThreads = 10; in TEST() local
139 threads.reserve(kNumThreads); in TEST()
140 for (size_t i = 0; i < kNumThreads; i++) { in TEST()
149 constexpr size_t kNumThreads = 10; in TEST() local
153 threads.reserve(kNumThreads); in TEST()
154 for (size_t i = 0; i < kNumThreads; i++) { in TEST()
/external/tensorflow/tensorflow/core/lib/core/
Dthreadpool_test.cc32 static const int kNumThreads = 30; variable
35 for (int num_threads = 1; num_threads < kNumThreads; num_threads++) { in TEST()
43 for (int num_threads = 1; num_threads < kNumThreads; num_threads++) { in TEST()
266 for (int num_threads = 1; num_threads < kNumThreads; num_threads++) { in TEST()
292 for (int num_threads = 1; num_threads < kNumThreads; num_threads++) { in TEST()
321 for (int num_threads = 1; num_threads < kNumThreads; num_threads++) { in TEST()
329 std::atomic<bool> threads_running[kNumThreads + 1]; in TEST()
339 ASSERT_LE(id, kNumThreads); in TEST()
360 ThreadPool pool(Env::Default(), "test", kNumThreads); in TEST()
362 absl::Barrier barrier(kNumThreads); in TEST()
[all …]
/external/angle/third_party/abseil-cpp/absl/base/internal/
Dthread_identity_test.cc78 static const int kNumThreads = 32; in TEST() local
81 for (int i = 0; i < kNumThreads; ++i) { in TEST()
94 EXPECT_LT(kNumThreads, num_identities_reused); in TEST()
104 static const int kNumThreads = 12; in TEST() local
111 for (int thread = 0; thread < kNumThreads; ++thread) { in TEST()
/external/openscreen/third_party/abseil/src/absl/base/internal/
Dthread_identity_test.cc78 static const int kNumThreads = 32; in TEST() local
81 for (int i = 0; i < kNumThreads; ++i) { in TEST()
94 EXPECT_LT(kNumThreads, num_identities_reused); in TEST()
104 static const int kNumThreads = 12; in TEST() local
111 for (int thread = 0; thread < kNumThreads; ++thread) { in TEST()
/external/abseil-cpp/absl/base/internal/
Dthread_identity_test.cc78 static const int kNumThreads = 32; in TEST() local
81 for (int i = 0; i < kNumThreads; ++i) { in TEST()
94 EXPECT_LT(kNumThreads, num_identities_reused); in TEST()
104 static const int kNumThreads = 12; in TEST() local
111 for (int thread = 0; thread < kNumThreads; ++thread) { in TEST()
/external/cronet/tot/third_party/abseil-cpp/absl/base/internal/
Dthread_identity_test.cc78 static const int kNumThreads = 32; in TEST() local
81 for (int i = 0; i < kNumThreads; ++i) { in TEST()
94 EXPECT_LT(kNumThreads, num_identities_reused); in TEST()
104 static const int kNumThreads = 12; in TEST() local
111 for (int thread = 0; thread < kNumThreads; ++thread) { in TEST()
/external/cronet/stable/third_party/abseil-cpp/absl/base/internal/
Dthread_identity_test.cc78 static const int kNumThreads = 32; in TEST() local
81 for (int i = 0; i < kNumThreads; ++i) { in TEST()
94 EXPECT_LT(kNumThreads, num_identities_reused); in TEST()
104 static const int kNumThreads = 12; in TEST() local
111 for (int thread = 0; thread < kNumThreads; ++thread) { in TEST()
/external/rust/android-crates-io/crates/grpcio-sys/grpc/third_party/abseil-cpp/absl/base/internal/
Dthread_identity_test.cc78 static const int kNumThreads = 32; in TEST() local
81 for (int i = 0; i < kNumThreads; ++i) { in TEST()
94 EXPECT_LT(kNumThreads, num_identities_reused); in TEST()
104 static const int kNumThreads = 12; in TEST() local
111 for (int thread = 0; thread < kNumThreads; ++thread) { in TEST()
/external/openscreen/third_party/abseil/src/absl/synchronization/
Dbarrier_test.cc26 constexpr int kNumThreads = 10; in TEST() local
27 absl::Barrier* barrier = new absl::Barrier(kNumThreads); in TEST()
46 for (int i = 0; i < kNumThreads - 1; ++i) { in TEST()
74 EXPECT_EQ(counter, kNumThreads); in TEST()
/external/cronet/tot/third_party/abseil-cpp/absl/synchronization/
Dbarrier_test.cc26 constexpr int kNumThreads = 10; in TEST() local
27 absl::Barrier* barrier = new absl::Barrier(kNumThreads); in TEST()
46 for (int i = 0; i < kNumThreads - 1; ++i) { in TEST()
74 EXPECT_EQ(counter, kNumThreads); in TEST()
/external/cronet/stable/third_party/abseil-cpp/absl/synchronization/
Dbarrier_test.cc26 constexpr int kNumThreads = 10; in TEST() local
27 absl::Barrier* barrier = new absl::Barrier(kNumThreads); in TEST()
46 for (int i = 0; i < kNumThreads - 1; ++i) { in TEST()
74 EXPECT_EQ(counter, kNumThreads); in TEST()

123456789