Home
last modified time | relevance | path

Searched refs:shfl (Results 1 – 8 of 8) sorted by relevance

/external/llvm/test/CodeGen/NVPTX/
Dshfl.ll3 declare i32 @llvm.nvvm.shfl.down.i32(i32, i32, i32)
4 declare float @llvm.nvvm.shfl.down.f32(float, i32, i32)
5 declare i32 @llvm.nvvm.shfl.up.i32(i32, i32, i32)
6 declare float @llvm.nvvm.shfl.up.f32(float, i32, i32)
7 declare i32 @llvm.nvvm.shfl.bfly.i32(i32, i32, i32)
8 declare float @llvm.nvvm.shfl.bfly.f32(float, i32, i32)
9 declare i32 @llvm.nvvm.shfl.idx.i32(i32, i32, i32)
10 declare float @llvm.nvvm.shfl.idx.f32(float, i32, i32)
13 ; shfl.down.
15 ; CHECK-LABEL: .func{{.*}}shfl.down1
[all …]
/external/mesa3d/src/gallium/drivers/nouveau/codegen/
Dnv50_ir_lowering_gm107.cpp189 Instruction *shfl; in handleDFDX() local
206 shfl = bld.mkOp2(OP_SHFL, TYPE_F32, bld.getScratch(), in handleDFDX()
208 shfl->subOp = NV50_IR_SUBOP_SHFL_BFLY; in handleDFDX()
213 insn->setSrc(0, shfl->getDef(0)); in handleDFDX()
/external/llvm/include/llvm/IR/
DIntrinsicsNVVM.td3695 // shfl.down.b32 dest, val, offset, mask_and_clamp
3698 [IntrNoMem, IntrConvergent], "llvm.nvvm.shfl.down.i32">,
3702 [IntrNoMem, IntrConvergent], "llvm.nvvm.shfl.down.f32">,
3705 // shfl.up.b32 dest, val, offset, mask_and_clamp
3708 [IntrNoMem, IntrConvergent], "llvm.nvvm.shfl.up.i32">,
3712 [IntrNoMem, IntrConvergent], "llvm.nvvm.shfl.up.f32">,
3715 // shfl.bfly.b32 dest, val, offset, mask_and_clamp
3718 [IntrNoMem, IntrConvergent], "llvm.nvvm.shfl.bfly.i32">,
3722 [IntrNoMem, IntrConvergent], "llvm.nvvm.shfl.bfly.f32">,
3725 // shfl.idx.b32 dest, val, lane, mask_and_clamp
[all …]
/external/llvm/lib/Target/NVPTX/
DNVPTXIntrinsics.td68 // shfl.{up,down,bfly,idx}.b32
70 // The last two parameters to shfl can be regs or imms. ptxas is smart
77 !strconcat("shfl.", mode, ".b32 $dst, $src, $offset, $mask;"),
83 !strconcat("shfl.", mode, ".b32 $dst, $src, $offset, $mask;"),
89 !strconcat("shfl.", mode, ".b32 $dst, $src, $offset, $mask;"),
95 !strconcat("shfl.", mode, ".b32 $dst, $src, $offset, $mask;"),
/external/swiftshader/third_party/llvm-subzero/build/Android/include/llvm/IR/
DIntrinsics.gen3193 nvvm_shfl_bfly_f32, // llvm.nvvm.shfl.bfly.f32
3194 nvvm_shfl_bfly_i32, // llvm.nvvm.shfl.bfly.i32
3195 nvvm_shfl_down_f32, // llvm.nvvm.shfl.down.f32
3196 nvvm_shfl_down_i32, // llvm.nvvm.shfl.down.i32
3197 nvvm_shfl_idx_f32, // llvm.nvvm.shfl.idx.f32
3198 nvvm_shfl_idx_i32, // llvm.nvvm.shfl.idx.i32
3199 nvvm_shfl_up_f32, // llvm.nvvm.shfl.up.f32
3200 nvvm_shfl_up_i32, // llvm.nvvm.shfl.up.i32
9251 "llvm.nvvm.shfl.bfly.f32",
9252 "llvm.nvvm.shfl.bfly.i32",
[all …]
/external/swiftshader/third_party/llvm-subzero/build/MacOS/include/llvm/IR/
DIntrinsics.gen3187 nvvm_shfl_bfly_f32, // llvm.nvvm.shfl.bfly.f32
3188 nvvm_shfl_bfly_i32, // llvm.nvvm.shfl.bfly.i32
3189 nvvm_shfl_down_f32, // llvm.nvvm.shfl.down.f32
3190 nvvm_shfl_down_i32, // llvm.nvvm.shfl.down.i32
3191 nvvm_shfl_idx_f32, // llvm.nvvm.shfl.idx.f32
3192 nvvm_shfl_idx_i32, // llvm.nvvm.shfl.idx.i32
3193 nvvm_shfl_up_f32, // llvm.nvvm.shfl.up.f32
3194 nvvm_shfl_up_i32, // llvm.nvvm.shfl.up.i32
9211 "llvm.nvvm.shfl.bfly.f32",
9212 "llvm.nvvm.shfl.bfly.i32",
[all …]
/external/swiftshader/third_party/llvm-subzero/build/Windows/include/llvm/IR/
DIntrinsics.gen3193 nvvm_shfl_bfly_f32, // llvm.nvvm.shfl.bfly.f32
3194 nvvm_shfl_bfly_i32, // llvm.nvvm.shfl.bfly.i32
3195 nvvm_shfl_down_f32, // llvm.nvvm.shfl.down.f32
3196 nvvm_shfl_down_i32, // llvm.nvvm.shfl.down.i32
3197 nvvm_shfl_idx_f32, // llvm.nvvm.shfl.idx.f32
3198 nvvm_shfl_idx_i32, // llvm.nvvm.shfl.idx.i32
3199 nvvm_shfl_up_f32, // llvm.nvvm.shfl.up.f32
3200 nvvm_shfl_up_i32, // llvm.nvvm.shfl.up.i32
9251 "llvm.nvvm.shfl.bfly.f32",
9252 "llvm.nvvm.shfl.bfly.i32",
[all …]
/external/swiftshader/third_party/llvm-subzero/build/Linux/include/llvm/IR/
DIntrinsics.gen3193 nvvm_shfl_bfly_f32, // llvm.nvvm.shfl.bfly.f32
3194 nvvm_shfl_bfly_i32, // llvm.nvvm.shfl.bfly.i32
3195 nvvm_shfl_down_f32, // llvm.nvvm.shfl.down.f32
3196 nvvm_shfl_down_i32, // llvm.nvvm.shfl.down.i32
3197 nvvm_shfl_idx_f32, // llvm.nvvm.shfl.idx.f32
3198 nvvm_shfl_idx_i32, // llvm.nvvm.shfl.idx.i32
3199 nvvm_shfl_up_f32, // llvm.nvvm.shfl.up.f32
3200 nvvm_shfl_up_i32, // llvm.nvvm.shfl.up.i32
9251 "llvm.nvvm.shfl.bfly.f32",
9252 "llvm.nvvm.shfl.bfly.i32",
[all …]