Home
last modified time | relevance | path

Searched refs:lane_id (Results 1 – 4 of 4) sorted by relevance

/external/tensorflow/tensorflow/core/util/
D cuda_device_functions.h 115 unsigned int lane_id; in CudaLaneId() local
116 asm("mov.u32 %0, %%laneid;" : "=r"(lane_id)); in CudaLaneId()
117 return lane_id; in CudaLaneId()
145 int lane_id = CudaLaneId(); in CudaShuffleGetSrcLane() local
146 int lane_base = lane_id & ~width + 1; in CudaShuffleGetSrcLane()
153 unsigned lane_id = CudaLaneId(); in CudaShuffleUpGetSrcLane() local
154 if ((lane_id & width - 1) < delta) { in CudaShuffleUpGetSrcLane()
155 return lane_id; in CudaShuffleUpGetSrcLane()
157 return lane_id - delta; in CudaShuffleUpGetSrcLane()
163 unsigned lane_id = CudaLaneId(); in CudaShuffleDownGetSrcLane() local
[all …]
D cuda_kernel_helper_test.cu.cc 93 unsigned lane_id = CudaLaneId(); in CudaShuffleGetSrcLaneTest() local
99 op_name, param, width, lane_id, actual, expected); in CudaShuffleGetSrcLaneTest()
106 CudaShuffleSync(kCudaWarpAll, lane_id, src_lane, width); in CudaShuffleGetSrcLaneTest()
112 CudaShuffleUpSync(kCudaWarpAll, lane_id, delta, width); in CudaShuffleGetSrcLaneTest()
118 CudaShuffleDownSync(kCudaWarpAll, lane_id, delta, width); in CudaShuffleGetSrcLaneTest()
124 CudaShuffleXorSync(kCudaWarpAll, lane_id, lane_lane, width); in CudaShuffleGetSrcLaneTest()
/external/swiftshader/third_party/llvm-7.0/llvm/test/CodeGen/Hexagon/
D jt-in-text.ll 15 define void @test2(i32 %lane_id, i32 %rx_pwr_st) #0 {
17 %lane_id.addr = alloca i32, align 4
19 store i32 %lane_id, i32* %lane_id.addr, align 4
21 %0 = load i32, i32* %lane_id.addr, align 4
/external/tensorflow/tensorflow/compiler/xla/service/gpu/
D ir_emitter_unnested.cc 2793 llvm::Value* lane_id = reduction_info->GetLaneId(); in EmitEpilogueForReduction() local
2795 ICmpEQ(lane_id, llvm::ConstantInt::get(lane_id->getType(), 0)), in EmitEpilogueForReduction()