Searched refs:shfl (Results 1 – 8 of 8) sorted by relevance
/external/llvm/test/CodeGen/NVPTX/ |
D | shfl.ll | 3 declare i32 @llvm.nvvm.shfl.down.i32(i32, i32, i32) 4 declare float @llvm.nvvm.shfl.down.f32(float, i32, i32) 5 declare i32 @llvm.nvvm.shfl.up.i32(i32, i32, i32) 6 declare float @llvm.nvvm.shfl.up.f32(float, i32, i32) 7 declare i32 @llvm.nvvm.shfl.bfly.i32(i32, i32, i32) 8 declare float @llvm.nvvm.shfl.bfly.f32(float, i32, i32) 9 declare i32 @llvm.nvvm.shfl.idx.i32(i32, i32, i32) 10 declare float @llvm.nvvm.shfl.idx.f32(float, i32, i32) 13 ; shfl.down. 15 ; CHECK-LABEL: .func{{.*}}shfl.down1 [all …]
|
/external/mesa3d/src/gallium/drivers/nouveau/codegen/ |
D | nv50_ir_lowering_gm107.cpp | 189 Instruction *shfl; in handleDFDX() local 206 shfl = bld.mkOp2(OP_SHFL, TYPE_F32, bld.getScratch(), in handleDFDX() 208 shfl->subOp = NV50_IR_SUBOP_SHFL_BFLY; in handleDFDX() 213 insn->setSrc(0, shfl->getDef(0)); in handleDFDX()
|
/external/llvm/include/llvm/IR/ |
D | IntrinsicsNVVM.td | 3695 // shfl.down.b32 dest, val, offset, mask_and_clamp 3698 [IntrNoMem, IntrConvergent], "llvm.nvvm.shfl.down.i32">, 3702 [IntrNoMem, IntrConvergent], "llvm.nvvm.shfl.down.f32">, 3705 // shfl.up.b32 dest, val, offset, mask_and_clamp 3708 [IntrNoMem, IntrConvergent], "llvm.nvvm.shfl.up.i32">, 3712 [IntrNoMem, IntrConvergent], "llvm.nvvm.shfl.up.f32">, 3715 // shfl.bfly.b32 dest, val, offset, mask_and_clamp 3718 [IntrNoMem, IntrConvergent], "llvm.nvvm.shfl.bfly.i32">, 3722 [IntrNoMem, IntrConvergent], "llvm.nvvm.shfl.bfly.f32">, 3725 // shfl.idx.b32 dest, val, lane, mask_and_clamp [all …]
|
/external/llvm/lib/Target/NVPTX/ |
D | NVPTXIntrinsics.td | 68 // shfl.{up,down,bfly,idx}.b32 70 // The last two parameters to shfl can be regs or imms. ptxas is smart 77 !strconcat("shfl.", mode, ".b32 $dst, $src, $offset, $mask;"), 83 !strconcat("shfl.", mode, ".b32 $dst, $src, $offset, $mask;"), 89 !strconcat("shfl.", mode, ".b32 $dst, $src, $offset, $mask;"), 95 !strconcat("shfl.", mode, ".b32 $dst, $src, $offset, $mask;"),
|
/external/swiftshader/third_party/llvm-subzero/build/Android/include/llvm/IR/ |
D | Intrinsics.gen | 3193 nvvm_shfl_bfly_f32, // llvm.nvvm.shfl.bfly.f32 3194 nvvm_shfl_bfly_i32, // llvm.nvvm.shfl.bfly.i32 3195 nvvm_shfl_down_f32, // llvm.nvvm.shfl.down.f32 3196 nvvm_shfl_down_i32, // llvm.nvvm.shfl.down.i32 3197 nvvm_shfl_idx_f32, // llvm.nvvm.shfl.idx.f32 3198 nvvm_shfl_idx_i32, // llvm.nvvm.shfl.idx.i32 3199 nvvm_shfl_up_f32, // llvm.nvvm.shfl.up.f32 3200 nvvm_shfl_up_i32, // llvm.nvvm.shfl.up.i32 9251 "llvm.nvvm.shfl.bfly.f32", 9252 "llvm.nvvm.shfl.bfly.i32", [all …]
|
/external/swiftshader/third_party/llvm-subzero/build/MacOS/include/llvm/IR/ |
D | Intrinsics.gen | 3187 nvvm_shfl_bfly_f32, // llvm.nvvm.shfl.bfly.f32 3188 nvvm_shfl_bfly_i32, // llvm.nvvm.shfl.bfly.i32 3189 nvvm_shfl_down_f32, // llvm.nvvm.shfl.down.f32 3190 nvvm_shfl_down_i32, // llvm.nvvm.shfl.down.i32 3191 nvvm_shfl_idx_f32, // llvm.nvvm.shfl.idx.f32 3192 nvvm_shfl_idx_i32, // llvm.nvvm.shfl.idx.i32 3193 nvvm_shfl_up_f32, // llvm.nvvm.shfl.up.f32 3194 nvvm_shfl_up_i32, // llvm.nvvm.shfl.up.i32 9211 "llvm.nvvm.shfl.bfly.f32", 9212 "llvm.nvvm.shfl.bfly.i32", [all …]
|
/external/swiftshader/third_party/llvm-subzero/build/Windows/include/llvm/IR/ |
D | Intrinsics.gen | 3193 nvvm_shfl_bfly_f32, // llvm.nvvm.shfl.bfly.f32 3194 nvvm_shfl_bfly_i32, // llvm.nvvm.shfl.bfly.i32 3195 nvvm_shfl_down_f32, // llvm.nvvm.shfl.down.f32 3196 nvvm_shfl_down_i32, // llvm.nvvm.shfl.down.i32 3197 nvvm_shfl_idx_f32, // llvm.nvvm.shfl.idx.f32 3198 nvvm_shfl_idx_i32, // llvm.nvvm.shfl.idx.i32 3199 nvvm_shfl_up_f32, // llvm.nvvm.shfl.up.f32 3200 nvvm_shfl_up_i32, // llvm.nvvm.shfl.up.i32 9251 "llvm.nvvm.shfl.bfly.f32", 9252 "llvm.nvvm.shfl.bfly.i32", [all …]
|
/external/swiftshader/third_party/llvm-subzero/build/Linux/include/llvm/IR/ |
D | Intrinsics.gen | 3193 nvvm_shfl_bfly_f32, // llvm.nvvm.shfl.bfly.f32 3194 nvvm_shfl_bfly_i32, // llvm.nvvm.shfl.bfly.i32 3195 nvvm_shfl_down_f32, // llvm.nvvm.shfl.down.f32 3196 nvvm_shfl_down_i32, // llvm.nvvm.shfl.down.i32 3197 nvvm_shfl_idx_f32, // llvm.nvvm.shfl.idx.f32 3198 nvvm_shfl_idx_i32, // llvm.nvvm.shfl.idx.i32 3199 nvvm_shfl_up_f32, // llvm.nvvm.shfl.up.f32 3200 nvvm_shfl_up_i32, // llvm.nvvm.shfl.up.i32 9251 "llvm.nvvm.shfl.bfly.f32", 9252 "llvm.nvvm.shfl.bfly.i32", [all …]
|