• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 // RUN: %clang_cc1 -triple thumbv7-apple-darwin \
2 // RUN:   -target-abi apcs-gnu \
3 // RUN:   -target-cpu cortex-a8 \
4 // RUN:   -mfloat-abi soft \
5 // RUN:   -target-feature +soft-float-abi \
6 // RUN:   -ffreestanding \
7 // RUN:   -emit-llvm -w -o - %s | opt -S -mem2reg | FileCheck %s
8 
9 #include <arm_neon.h>
10 
11 // Check that the vget_low/vget_high intrinsics generate a single shuffle
12 // without any bitcasting.
low_s8(int8x16_t a)13 int8x8_t low_s8(int8x16_t a) {
14 // CHECK: shufflevector <16 x i8> %a, <16 x i8> %a, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
15   return vget_low_s8(a);
16 }
17 
low_u8(uint8x16_t a)18 uint8x8_t low_u8 (uint8x16_t a) {
19 // CHECK: shufflevector <16 x i8> %a, <16 x i8> %a, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
20   return vget_low_u8(a);
21 }
22 
low_s16(int16x8_t a)23 int16x4_t low_s16( int16x8_t a) {
24 // CHECK: shufflevector <8 x i16> %a, <8 x i16> %a, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
25   return vget_low_s16(a);
26 }
27 
low_u16(uint16x8_t a)28 uint16x4_t low_u16(uint16x8_t a) {
29 // CHECK: shufflevector <8 x i16> %a, <8 x i16> %a, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
30   return vget_low_u16(a);
31 }
32 
low_s32(int32x4_t a)33 int32x2_t low_s32( int32x4_t a) {
34 // CHECK: shufflevector <4 x i32> %a, <4 x i32> %a, <2 x i32> <i32 0, i32 1>
35   return vget_low_s32(a);
36 }
37 
low_u32(uint32x4_t a)38 uint32x2_t low_u32(uint32x4_t a) {
39 // CHECK: shufflevector <4 x i32> %a, <4 x i32> %a, <2 x i32> <i32 0, i32 1>
40   return vget_low_u32(a);
41 }
42 
low_s64(int64x2_t a)43 int64x1_t low_s64( int64x2_t a) {
44 // CHECK: shufflevector <2 x i64> %a, <2 x i64> %a, <1 x i32> zeroinitializer
45   return vget_low_s64(a);
46 }
47 
low_u64(uint64x2_t a)48 uint64x1_t low_u64(uint64x2_t a) {
49 // CHECK: shufflevector <2 x i64> %a, <2 x i64> %a, <1 x i32> zeroinitializer
50   return vget_low_u64(a);
51 }
52 
low_p8(poly8x16_t a)53 poly8x8_t low_p8 (poly8x16_t a) {
54 // CHECK: shufflevector <16 x i8> %a, <16 x i8> %a, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
55   return vget_low_p8(a);
56 }
57 
low_p16(poly16x8_t a)58 poly16x4_t low_p16(poly16x8_t a) {
59 // CHECK: shufflevector <8 x i16> %a, <8 x i16> %a, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
60   return vget_low_p16(a);
61 }
62 
low_f32(float32x4_t a)63 float32x2_t low_f32(float32x4_t a) {
64 // CHECK: shufflevector <4 x float> %a, <4 x float> %a, <2 x i32> <i32 0, i32 1>
65   return vget_low_f32(a);
66 }
67 
68 
high_s8(int8x16_t a)69 int8x8_t high_s8(int8x16_t a) {
70 // CHECK: shufflevector <16 x i8> %a, <16 x i8> %a, <8 x i32> <i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
71   return vget_high_s8(a);
72 }
73 
high_u8(uint8x16_t a)74 uint8x8_t high_u8 (uint8x16_t a) {
75 // CHECK: shufflevector <16 x i8> %a, <16 x i8> %a, <8 x i32> <i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
76   return vget_high_u8(a);
77 }
78 
high_s16(int16x8_t a)79 int16x4_t high_s16( int16x8_t a) {
80 // CHECK: shufflevector <8 x i16> %a, <8 x i16> %a, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
81   return vget_high_s16(a);
82 }
83 
high_u16(uint16x8_t a)84 uint16x4_t high_u16(uint16x8_t a) {
85 // CHECK: shufflevector <8 x i16> %a, <8 x i16> %a, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
86   return vget_high_u16(a);
87 }
88 
high_s32(int32x4_t a)89 int32x2_t high_s32( int32x4_t a) {
90 // CHECK: shufflevector <4 x i32> %a, <4 x i32> %a, <2 x i32> <i32 2, i32 3>
91   return vget_high_s32(a);
92 }
93 
high_u32(uint32x4_t a)94 uint32x2_t high_u32(uint32x4_t a) {
95 // CHECK: shufflevector <4 x i32> %a, <4 x i32> %a, <2 x i32> <i32 2, i32 3>
96   return vget_high_u32(a);
97 }
98 
high_s64(int64x2_t a)99 int64x1_t high_s64( int64x2_t a) {
100 // CHECK: shufflevector <2 x i64> %a, <2 x i64> %a, <1 x i32> <i32 1>
101   return vget_high_s64(a);
102 }
103 
high_u64(uint64x2_t a)104 uint64x1_t high_u64(uint64x2_t a) {
105 // CHECK: shufflevector <2 x i64> %a, <2 x i64> %a, <1 x i32> <i32 1>
106   return vget_high_u64(a);
107 }
108 
high_p8(poly8x16_t a)109 poly8x8_t high_p8 (poly8x16_t a) {
110 // CHECK: shufflevector <16 x i8> %a, <16 x i8> %a, <8 x i32> <i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
111   return vget_high_p8(a);
112 }
113 
high_p16(poly16x8_t a)114 poly16x4_t high_p16(poly16x8_t a) {
115 // CHECK: shufflevector <8 x i16> %a, <8 x i16> %a, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
116   return vget_high_p16(a);
117 }
118 
high_f32(float32x4_t a)119 float32x2_t high_f32(float32x4_t a) {
120 // CHECK: shufflevector <4 x float> %a, <4 x float> %a, <2 x i32> <i32 2, i32 3>
121   return vget_high_f32(a);
122 }
123 
124