1; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py 2; RUN: llc -mtriple=thumbv8.1m.main -mattr=+mve.fp -verify-machineinstrs -o - %s | FileCheck %s 3 4define arm_aapcs_vfpcc <16 x i8> @test_vclsq_m_s8(<16 x i8> %inactive, <16 x i8> %a, i16 zeroext %p) { 5; CHECK-LABEL: test_vclsq_m_s8: 6; CHECK: @ %bb.0: @ %entry 7; CHECK-NEXT: vmsr p0, r0 8; CHECK-NEXT: vpst 9; CHECK-NEXT: vclst.s8 q0, q1 10; CHECK-NEXT: bx lr 11entry: 12 %0 = zext i16 %p to i32 13 %1 = tail call <16 x i1> @llvm.arm.mve.pred.i2v.v16i1(i32 %0) 14 %2 = tail call <16 x i8> @llvm.arm.mve.cls.predicated.v16i8.v16i1(<16 x i8> %a, <16 x i1> %1, <16 x i8> %inactive) 15 ret <16 x i8> %2 16} 17 18define arm_aapcs_vfpcc <8 x i16> @test_vclsq_m_s16(<8 x i16> %inactive, <8 x i16> %a, i16 zeroext %p) { 19; CHECK-LABEL: test_vclsq_m_s16: 20; CHECK: @ %bb.0: @ %entry 21; CHECK-NEXT: vmsr p0, r0 22; CHECK-NEXT: vpst 23; CHECK-NEXT: vclst.s16 q0, q1 24; CHECK-NEXT: bx lr 25entry: 26 %0 = zext i16 %p to i32 27 %1 = tail call <8 x i1> @llvm.arm.mve.pred.i2v.v8i1(i32 %0) 28 %2 = tail call <8 x i16> @llvm.arm.mve.cls.predicated.v8i16.v8i1(<8 x i16> %a, <8 x i1> %1, <8 x i16> %inactive) 29 ret <8 x i16> %2 30} 31 32define arm_aapcs_vfpcc <4 x i32> @test_vclsq_m_s32(<4 x i32> %inactive, <4 x i32> %a, i16 zeroext %p) { 33; CHECK-LABEL: test_vclsq_m_s32: 34; CHECK: @ %bb.0: @ %entry 35; CHECK-NEXT: vmsr p0, r0 36; CHECK-NEXT: vpst 37; CHECK-NEXT: vclst.s32 q0, q1 38; CHECK-NEXT: bx lr 39entry: 40 %0 = zext i16 %p to i32 41 %1 = tail call <4 x i1> @llvm.arm.mve.pred.i2v.v4i1(i32 %0) 42 %2 = tail call <4 x i32> @llvm.arm.mve.cls.predicated.v4i32.v4i1(<4 x i32> %a, <4 x i1> %1, <4 x i32> %inactive) 43 ret <4 x i32> %2 44} 45 46define arm_aapcs_vfpcc <16 x i8> @test_vclzq_m_s8(<16 x i8> %inactive, <16 x i8> %a, i16 zeroext %p) { 47; CHECK-LABEL: test_vclzq_m_s8: 48; CHECK: @ %bb.0: @ %entry 49; CHECK-NEXT: vmsr p0, r0 50; CHECK-NEXT: vpst 51; CHECK-NEXT: vclzt.i8 q0, q1 52; CHECK-NEXT: bx lr 53entry: 54 %0 = zext i16 %p to i32 55 %1 = tail call <16 x i1> @llvm.arm.mve.pred.i2v.v16i1(i32 %0) 56 %2 = tail call <16 x i8> @llvm.arm.mve.clz.predicated.v16i8.v16i1(<16 x i8> %a, <16 x i1> %1, <16 x i8> %inactive) 57 ret <16 x i8> %2 58} 59 60define arm_aapcs_vfpcc <8 x i16> @test_vclzq_m_s16(<8 x i16> %inactive, <8 x i16> %a, i16 zeroext %p) { 61; CHECK-LABEL: test_vclzq_m_s16: 62; CHECK: @ %bb.0: @ %entry 63; CHECK-NEXT: vmsr p0, r0 64; CHECK-NEXT: vpst 65; CHECK-NEXT: vclzt.i16 q0, q1 66; CHECK-NEXT: bx lr 67entry: 68 %0 = zext i16 %p to i32 69 %1 = tail call <8 x i1> @llvm.arm.mve.pred.i2v.v8i1(i32 %0) 70 %2 = tail call <8 x i16> @llvm.arm.mve.clz.predicated.v8i16.v8i1(<8 x i16> %a, <8 x i1> %1, <8 x i16> %inactive) 71 ret <8 x i16> %2 72} 73 74define arm_aapcs_vfpcc <4 x i32> @test_vclzq_m_s32(<4 x i32> %inactive, <4 x i32> %a, i16 zeroext %p) { 75; CHECK-LABEL: test_vclzq_m_s32: 76; CHECK: @ %bb.0: @ %entry 77; CHECK-NEXT: vmsr p0, r0 78; CHECK-NEXT: vpst 79; CHECK-NEXT: vclzt.i32 q0, q1 80; CHECK-NEXT: bx lr 81entry: 82 %0 = zext i16 %p to i32 83 %1 = tail call <4 x i1> @llvm.arm.mve.pred.i2v.v4i1(i32 %0) 84 %2 = tail call <4 x i32> @llvm.arm.mve.clz.predicated.v4i32.v4i1(<4 x i32> %a, <4 x i1> %1, <4 x i32> %inactive) 85 ret <4 x i32> %2 86} 87 88define arm_aapcs_vfpcc <16 x i8> @test_vclzq_m_u8(<16 x i8> %inactive, <16 x i8> %a, i16 zeroext %p) { 89; CHECK-LABEL: test_vclzq_m_u8: 90; CHECK: @ %bb.0: @ %entry 91; CHECK-NEXT: vmsr p0, r0 92; CHECK-NEXT: vpst 93; CHECK-NEXT: vclzt.i8 q0, q1 94; CHECK-NEXT: bx lr 95entry: 96 %0 = zext i16 %p to i32 97 %1 = tail call <16 x i1> @llvm.arm.mve.pred.i2v.v16i1(i32 %0) 98 %2 = tail call <16 x i8> @llvm.arm.mve.clz.predicated.v16i8.v16i1(<16 x i8> %a, <16 x i1> %1, <16 x i8> %inactive) 99 ret <16 x i8> %2 100} 101 102define arm_aapcs_vfpcc <8 x i16> @test_vclzq_m_u16(<8 x i16> %inactive, <8 x i16> %a, i16 zeroext %p) { 103; CHECK-LABEL: test_vclzq_m_u16: 104; CHECK: @ %bb.0: @ %entry 105; CHECK-NEXT: vmsr p0, r0 106; CHECK-NEXT: vpst 107; CHECK-NEXT: vclzt.i16 q0, q1 108; CHECK-NEXT: bx lr 109entry: 110 %0 = zext i16 %p to i32 111 %1 = tail call <8 x i1> @llvm.arm.mve.pred.i2v.v8i1(i32 %0) 112 %2 = tail call <8 x i16> @llvm.arm.mve.clz.predicated.v8i16.v8i1(<8 x i16> %a, <8 x i1> %1, <8 x i16> %inactive) 113 ret <8 x i16> %2 114} 115 116define arm_aapcs_vfpcc <4 x i32> @test_vclzq_m_u32(<4 x i32> %inactive, <4 x i32> %a, i16 zeroext %p) { 117; CHECK-LABEL: test_vclzq_m_u32: 118; CHECK: @ %bb.0: @ %entry 119; CHECK-NEXT: vmsr p0, r0 120; CHECK-NEXT: vpst 121; CHECK-NEXT: vclzt.i32 q0, q1 122; CHECK-NEXT: bx lr 123entry: 124 %0 = zext i16 %p to i32 125 %1 = tail call <4 x i1> @llvm.arm.mve.pred.i2v.v4i1(i32 %0) 126 %2 = tail call <4 x i32> @llvm.arm.mve.clz.predicated.v4i32.v4i1(<4 x i32> %a, <4 x i1> %1, <4 x i32> %inactive) 127 ret <4 x i32> %2 128} 129 130declare <16 x i1> @llvm.arm.mve.pred.i2v.v16i1(i32) 131declare <8 x i1> @llvm.arm.mve.pred.i2v.v8i1(i32) 132declare <4 x i1> @llvm.arm.mve.pred.i2v.v4i1(i32) 133declare <16 x i8> @llvm.arm.mve.cls.predicated.v16i8.v16i1(<16 x i8>, <16 x i1>, <16 x i8>) 134declare <8 x i16> @llvm.arm.mve.cls.predicated.v8i16.v8i1(<8 x i16>, <8 x i1>, <8 x i16>) 135declare <4 x i32> @llvm.arm.mve.cls.predicated.v4i32.v4i1(<4 x i32>, <4 x i1>, <4 x i32>) 136declare <16 x i8> @llvm.arm.mve.clz.predicated.v16i8.v16i1(<16 x i8>, <16 x i1>, <16 x i8>) 137declare <8 x i16> @llvm.arm.mve.clz.predicated.v8i16.v8i1(<8 x i16>, <8 x i1>, <8 x i16>) 138declare <4 x i32> @llvm.arm.mve.clz.predicated.v4i32.v4i1(<4 x i32>, <4 x i1>, <4 x i32>) 139