/external/llvm-project/openmp/libomptarget/deviceRTLs/common/src/ |
D | reduction.cu | 35 INLINE static void gpu_regular_warp_reduce(void *reduce_data, in gpu_regular_warp_reduce() argument 38 shflFct(reduce_data, /*LaneId - not used= */ 0, in gpu_regular_warp_reduce() 43 INLINE static void gpu_irregular_warp_reduce(void *reduce_data, in gpu_irregular_warp_reduce() argument 51 shflFct(reduce_data, /*LaneId = */ tid, /*Offset=*/mask, /*AlgoVersion=*/1); in gpu_irregular_warp_reduce() 59 gpu_irregular_simd_reduce(void *reduce_data, kmp_ShuffleReductFctPtr shflFct) { in gpu_irregular_simd_reduce() argument 71 shflFct(reduce_data, /*LaneId =*/logical_lane_id, in gpu_irregular_simd_reduce() 80 int32_t global_tid, int32_t num_vars, size_t reduce_size, void *reduce_data, in nvptx_parallel_reduce_nowait() argument 107 gpu_regular_warp_reduce(reduce_data, shflFct); in nvptx_parallel_reduce_nowait() 109 gpu_irregular_warp_reduce(reduce_data, shflFct, in nvptx_parallel_reduce_nowait() 120 cpyFct(reduce_data, WarpsNeeded); in nvptx_parallel_reduce_nowait() [all …]
|
/external/llvm-project/openmp/runtime/src/ |
D | kmp_tasking.cpp | 2152 tg->reduce_data = (void *)arr; in __kmp_task_reduction_init() 2194 kmp_taskgroup_t *tg, void *reduce_data) { in __kmp_task_reduction_init_copy() argument 2198 thr, tg, reduce_data)); in __kmp_task_reduction_init_copy() 2202 KMP_MEMCPY(arr, reduce_data, num * sizeof(kmp_taskred_data_t)); in __kmp_task_reduction_init_copy() 2206 tg->reduce_data = (void *)arr; in __kmp_task_reduction_init_copy() 2230 kmp_taskred_data_t *arr = (kmp_taskred_data_t *)(tg->reduce_data); in __kmpc_task_reduction_get_th_data() 2268 arr = (kmp_taskred_data_t *)(tg->reduce_data); in __kmpc_task_reduction_get_th_data() 2280 kmp_taskred_data_t *arr = (kmp_taskred_data_t *)tg->reduce_data; in __kmp_task_reduction_fini() 2310 tg->reduce_data = NULL; in __kmp_task_reduction_fini() 2318 __kmp_thread_free(th, tg->reduce_data); in __kmp_task_reduction_clean() [all …]
|
D | kmp_barrier.cpp | 131 (*reduce)(this_thr->th.th_local.reduce_data, in __kmp_linear_barrier_gather_template() 132 other_threads[i]->th.th_local.reduce_data); in __kmp_linear_barrier_gather_template() 359 (*reduce)(this_thr->th.th_local.reduce_data, in __kmp_tree_barrier_gather() 360 child_thr->th.th_local.reduce_data); in __kmp_tree_barrier_gather() 609 (*reduce)(this_thr->th.th_local.reduce_data, in __kmp_hyper_barrier_gather() 610 child_thr->th.th_local.reduce_data); in __kmp_hyper_barrier_gather() 932 (*reduce)(this_thr->th.th_local.reduce_data, in __kmp_hierarchical_barrier_gather() 933 other_threads[child_tid]->th.th_local.reduce_data); in __kmp_hierarchical_barrier_gather() 968 (*reduce)(this_thr->th.th_local.reduce_data, in __kmp_hierarchical_barrier_gather() 969 child_thr->th.th_local.reduce_data); in __kmp_hierarchical_barrier_gather() [all …]
|
D | kmp.h | 2059 void *reduce_data; member 2212 void *reduce_data; // reduction related info member 3540 size_t reduce_size, void *reduce_data, 3827 void *reduce_data, void (*reduce_func)(void *lhs_data, void *rhs_data), 3833 void *reduce_data, void (*reduce_func)(void *lhs_data, void *rhs_data), 3842 void *reduce_data, void (*reduce_func)(void *lhs_data, void *rhs_data),
|
D | kmp_csupport.cpp | 3353 size_t reduce_size, void *reduce_data, in __kmpc_reduce_nowait() argument 3406 loc, global_tid, num_vars, reduce_size, reduce_data, reduce_func, lck); in __kmpc_reduce_nowait() 3472 global_tid, FALSE, reduce_size, reduce_data, reduce_func); in __kmpc_reduce_nowait() 3582 size_t reduce_size, void *reduce_data, in __kmpc_reduce() argument 3619 loc, global_tid, num_vars, reduce_size, reduce_data, reduce_func, lck); in __kmpc_reduce() 3662 global_tid, TRUE, reduce_size, reduce_data, reduce_func); in __kmpc_reduce()
|
D | kmp_runtime.cpp | 8234 void *reduce_data, void (*reduce_func)(void *lhs_data, void *rhs_data), in __kmp_determine_reduction_method() argument 8255 #define FAST_REDUCTION_TREE_METHOD_GENERATED ((reduce_data) && (reduce_func)) in __kmp_determine_reduction_method()
|
/external/llvm-project/openmp/libomptarget/deviceRTLs/nvptx/docs/ |
D | ReductionDesign.txt | 101 gpu_regular_warp_reduce(void *reduce_data, 104 ShuffleReduceFn(reduce_data, 0, offset, 0); 132 gpu_irregular_warp_reduce(void *reduce_data, 140 ShuffleReduceFn(reduce_data, lane_id, offset, 1); 180 gpu_irregular_simt_reduce(void *reduce_data, 190 ShuffleReduceFn(reduce_data, logical_lane_id, remote_id-1-threadIdx.x, 2); 248 gpu_irregular_block_reduce(void *reduce_data, 263 gpu_regular_warp_reduce(reduce_data, shuflReduceFn); 267 gpu_irregular_warp_reduce(reduce_data, shuflReduceFn, thread_num, 275 interWarpCpyFn(reduce_data, warp_needed); [all …]
|
/external/mesa3d/src/compiler/nir/ |
D | nir_opt_uniform_atomics.c | 181 reduce_data(nir_builder *b, nir_op op, nir_ssa_def *data, in reduce_data() function 216 reduce_data(b, op, data, &reduce, combined_scan_reduce ? &scan : NULL); in optimize_atomic() 238 reduce_data(b, op, data, NULL, &scan); in optimize_atomic()
|
/external/llvm-project/openmp/runtime/test/misc_bugs/ |
D | teams-reduction.c | 46 size_t reduce_size, void *reduce_data, void *reduce_func,
|
/external/llvm-project/openmp/libomptarget/deviceRTLs/ |
D | interface.h | 200 typedef void (*kmp_ListGlobalFctPtr)(void *buffer, int idx, void *reduce_data); 349 void *reduce_data, kmp_ShuffleReductFctPtr shflFct, 353 int32_t num_of_records, void *reduce_data, kmp_ShuffleReductFctPtr shflFct,
|