// REQUIRES: aarch64-registered-target
// RUN: %clang_cc1 -triple aarch64-none-linux-gnu -target-feature +sve -fallow-half-arguments-and-returns -S -O1 -Werror -Wall -emit-llvm -o - %s | FileCheck %s
// RUN: %clang_cc1 -DSVE_OVERLOADED_FORMS -triple aarch64-none-linux-gnu -target-feature +sve -fallow-half-arguments-and-returns -S -O1 -Werror -Wall -emit-llvm -o - %s | FileCheck %s
// RUN: %clang_cc1 -triple aarch64-none-linux-gnu -target-feature +sve -fallow-half-arguments-and-returns -S -O1 -Werror -Wall -o - %s >/dev/null 2>%t
// RUN: FileCheck --check-prefix=ASM --allow-empty %s <%t

// If this check fails, please read test/CodeGen/aarch64-sve-intrinsics/README for instructions on how to resolve it.
// ASM-NOT: warning
#include <arm_sve.h>

// SVE_ACLE_FUNC builds the name of the intrinsic under test by token-pasting
// its arguments. The tests below pass (base name, type suffix, predication
// suffix, trailing suffix).
#ifdef SVE_OVERLOADED_FORMS
// Overloaded spelling: only the first and third arguments are pasted; the
// second and fourth are accepted but discarded. Four parameters are kept so
// the same call sites work for both spellings.
#define SVE_ACLE_FUNC(A1,A2_UNUSED,A3,A4_UNUSED) A1##A3
#else
// Fully-qualified spelling: all four arguments are pasted together in order.
#define SVE_ACLE_FUNC(A1,A2,A3,A4) A1##A2##A3##A4
#endif

// svsqrt, _z form, svfloat16_t.
// The FileCheck directives in the body expect the svbool_t predicate to be
// converted to <vscale x 8 x i1> and then passed to
// llvm.aarch64.sve.fsqrt.nxv8f16 with zeroinitializer as the first operand.
svfloat16_t test_svsqrt_f16_z(svbool_t pg, svfloat16_t op)
{
  // CHECK-LABEL: test_svsqrt_f16_z
  // CHECK: %[[PG:.*]] = call <vscale x 8 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv8i1(<vscale x 16 x i1> %pg)
  // CHECK: %[[INTRINSIC:.*]] = call <vscale x 8 x half> @llvm.aarch64.sve.fsqrt.nxv8f16(<vscale x 8 x half> zeroinitializer, <vscale x 8 x i1> %[[PG]], <vscale x 8 x half> %op)
  // CHECK: ret <vscale x 8 x half> %[[INTRINSIC]]
  return SVE_ACLE_FUNC(svsqrt,_f16,_z,)(pg, op);
}

// svsqrt, _z form, svfloat32_t.
// The FileCheck directives in the body expect the svbool_t predicate to be
// converted to <vscale x 4 x i1> and then passed to
// llvm.aarch64.sve.fsqrt.nxv4f32 with zeroinitializer as the first operand.
svfloat32_t test_svsqrt_f32_z(svbool_t pg, svfloat32_t op)
{
  // CHECK-LABEL: test_svsqrt_f32_z
  // CHECK: %[[PG:.*]] = call <vscale x 4 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv4i1(<vscale x 16 x i1> %pg)
  // CHECK: %[[INTRINSIC:.*]] = call <vscale x 4 x float> @llvm.aarch64.sve.fsqrt.nxv4f32(<vscale x 4 x float> zeroinitializer, <vscale x 4 x i1> %[[PG]], <vscale x 4 x float> %op)
  // CHECK: ret <vscale x 4 x float> %[[INTRINSIC]]
  return SVE_ACLE_FUNC(svsqrt,_f32,_z,)(pg, op);
}

// svsqrt, _z form, svfloat64_t.
// The FileCheck directives in the body expect the svbool_t predicate to be
// converted to <vscale x 2 x i1> and then passed to
// llvm.aarch64.sve.fsqrt.nxv2f64 with zeroinitializer as the first operand.
svfloat64_t test_svsqrt_f64_z(svbool_t pg, svfloat64_t op)
{
  // CHECK-LABEL: test_svsqrt_f64_z
  // CHECK: %[[PG:.*]] = call <vscale x 2 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv2i1(<vscale x 16 x i1> %pg)
  // CHECK: %[[INTRINSIC:.*]] = call <vscale x 2 x double> @llvm.aarch64.sve.fsqrt.nxv2f64(<vscale x 2 x double> zeroinitializer, <vscale x 2 x i1> %[[PG]], <vscale x 2 x double> %op)
  // CHECK: ret <vscale x 2 x double> %[[INTRINSIC]]
  return SVE_ACLE_FUNC(svsqrt,_f64,_z,)(pg, op);
}

// svsqrt, _m form, svfloat16_t.
// The FileCheck directives in the body expect the svbool_t predicate to be
// converted to <vscale x 8 x i1> and then passed to
// llvm.aarch64.sve.fsqrt.nxv8f16 with %inactive as the first operand.
svfloat16_t test_svsqrt_f16_m(svfloat16_t inactive, svbool_t pg, svfloat16_t op)
{
  // CHECK-LABEL: test_svsqrt_f16_m
  // CHECK: %[[PG:.*]] = call <vscale x 8 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv8i1(<vscale x 16 x i1> %pg)
  // CHECK: %[[INTRINSIC:.*]] = call <vscale x 8 x half> @llvm.aarch64.sve.fsqrt.nxv8f16(<vscale x 8 x half> %inactive, <vscale x 8 x i1> %[[PG]], <vscale x 8 x half> %op)
  // CHECK: ret <vscale x 8 x half> %[[INTRINSIC]]
  return SVE_ACLE_FUNC(svsqrt,_f16,_m,)(inactive, pg, op);
}

// svsqrt, _m form, svfloat32_t.
// The FileCheck directives in the body expect the svbool_t predicate to be
// converted to <vscale x 4 x i1> and then passed to
// llvm.aarch64.sve.fsqrt.nxv4f32 with %inactive as the first operand.
svfloat32_t test_svsqrt_f32_m(svfloat32_t inactive, svbool_t pg, svfloat32_t op)
{
  // CHECK-LABEL: test_svsqrt_f32_m
  // CHECK: %[[PG:.*]] = call <vscale x 4 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv4i1(<vscale x 16 x i1> %pg)
  // CHECK: %[[INTRINSIC:.*]] = call <vscale x 4 x float> @llvm.aarch64.sve.fsqrt.nxv4f32(<vscale x 4 x float> %inactive, <vscale x 4 x i1> %[[PG]], <vscale x 4 x float> %op)
  // CHECK: ret <vscale x 4 x float> %[[INTRINSIC]]
  return SVE_ACLE_FUNC(svsqrt,_f32,_m,)(inactive, pg, op);
}

// svsqrt, _m form, svfloat64_t.
// The FileCheck directives in the body expect the svbool_t predicate to be
// converted to <vscale x 2 x i1> and then passed to
// llvm.aarch64.sve.fsqrt.nxv2f64 with %inactive as the first operand.
svfloat64_t test_svsqrt_f64_m(svfloat64_t inactive, svbool_t pg, svfloat64_t op)
{
  // CHECK-LABEL: test_svsqrt_f64_m
  // CHECK: %[[PG:.*]] = call <vscale x 2 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv2i1(<vscale x 16 x i1> %pg)
  // CHECK: %[[INTRINSIC:.*]] = call <vscale x 2 x double> @llvm.aarch64.sve.fsqrt.nxv2f64(<vscale x 2 x double> %inactive, <vscale x 2 x i1> %[[PG]], <vscale x 2 x double> %op)
  // CHECK: ret <vscale x 2 x double> %[[INTRINSIC]]
  return SVE_ACLE_FUNC(svsqrt,_f64,_m,)(inactive, pg, op);
}

// svsqrt, _x form, svfloat16_t.
// The FileCheck directives in the body expect the svbool_t predicate to be
// converted to <vscale x 8 x i1> and then passed to
// llvm.aarch64.sve.fsqrt.nxv8f16 with undef as the first operand.
svfloat16_t test_svsqrt_f16_x(svbool_t pg, svfloat16_t op)
{
  // CHECK-LABEL: test_svsqrt_f16_x
  // CHECK: %[[PG:.*]] = call <vscale x 8 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv8i1(<vscale x 16 x i1> %pg)
  // CHECK: %[[INTRINSIC:.*]] = call <vscale x 8 x half> @llvm.aarch64.sve.fsqrt.nxv8f16(<vscale x 8 x half> undef, <vscale x 8 x i1> %[[PG]], <vscale x 8 x half> %op)
  // CHECK: ret <vscale x 8 x half> %[[INTRINSIC]]
  return SVE_ACLE_FUNC(svsqrt,_f16,_x,)(pg, op);
}

// svsqrt, _x form, svfloat32_t.
// The FileCheck directives in the body expect the svbool_t predicate to be
// converted to <vscale x 4 x i1> and then passed to
// llvm.aarch64.sve.fsqrt.nxv4f32 with undef as the first operand.
svfloat32_t test_svsqrt_f32_x(svbool_t pg, svfloat32_t op)
{
  // CHECK-LABEL: test_svsqrt_f32_x
  // CHECK: %[[PG:.*]] = call <vscale x 4 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv4i1(<vscale x 16 x i1> %pg)
  // CHECK: %[[INTRINSIC:.*]] = call <vscale x 4 x float> @llvm.aarch64.sve.fsqrt.nxv4f32(<vscale x 4 x float> undef, <vscale x 4 x i1> %[[PG]], <vscale x 4 x float> %op)
  // CHECK: ret <vscale x 4 x float> %[[INTRINSIC]]
  return SVE_ACLE_FUNC(svsqrt,_f32,_x,)(pg, op);
}

// svsqrt, _x form, svfloat64_t.
// The FileCheck directives in the body expect the svbool_t predicate to be
// converted to <vscale x 2 x i1> and then passed to
// llvm.aarch64.sve.fsqrt.nxv2f64 with undef as the first operand.
svfloat64_t test_svsqrt_f64_x(svbool_t pg, svfloat64_t op)
{
  // CHECK-LABEL: test_svsqrt_f64_x
  // CHECK: %[[PG:.*]] = call <vscale x 2 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv2i1(<vscale x 16 x i1> %pg)
  // CHECK: %[[INTRINSIC:.*]] = call <vscale x 2 x double> @llvm.aarch64.sve.fsqrt.nxv2f64(<vscale x 2 x double> undef, <vscale x 2 x i1> %[[PG]], <vscale x 2 x double> %op)
  // CHECK: ret <vscale x 2 x double> %[[INTRINSIC]]
  return SVE_ACLE_FUNC(svsqrt,_f64,_x,)(pg, op);
}
