Home
last modified time | relevance | path

Searched refs:SSE41 (Results 1 – 25 of 30) sorted by relevance

12

/external/llvm/test/CodeGen/X86/
Dvector-sext.ll3 …-unknown-unknown -mcpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=SSE --check-prefix=SSE41
8 … %s -mtriple=i686-unknown-unknown -mcpu=i686 -mattr=+sse4.1 | FileCheck %s --check-prefix=X32-SSE41
35 ; SSE41-LABEL: sext_8i16_to_8i32:
36 ; SSE41: # BB#0: # %entry
37 ; SSE41-NEXT: movdqa %xmm0, %xmm1
38 ; SSE41-NEXT: pmovzxwd %xmm1, %xmm0
39 ; SSE41-NEXT: pslld $16, %xmm0
40 ; SSE41-NEXT: psrad $16, %xmm0
41 ; SSE41-NEXT: punpckhwd {{.*#+}} xmm1 = xmm1[4,4,5,5,6,6,7,7]
42 ; SSE41-NEXT: pslld $16, %xmm1
[all …]
Dvector-idiv.ll1 ; RUN: llc -march=x86-64 -mcpu=core2 -mattr=+sse4.1 < %s | FileCheck %s --check-prefix=SSE41
8 ; SSE41-LABEL: test1:
9 ; SSE41: # BB#0:
10 ; SSE41-NEXT: movdqa {{.*#+}} xmm1 = [613566757,613566757,613566757,613566757]
11 ; SSE41-NEXT: pshufd {{.*#+}} xmm2 = xmm1[1,1,3,3]
12 ; SSE41-NEXT: pshufd {{.*#+}} xmm3 = xmm0[1,1,3,3]
13 ; SSE41-NEXT: pmuludq %xmm2, %xmm3
14 ; SSE41-NEXT: pmuludq %xmm0, %xmm1
15 ; SSE41-NEXT: pshufd {{.*#+}} xmm1 = xmm1[1,1,3,3]
16 ; SSE41-NEXT: pblendw {{.*#+}} xmm1 = xmm1[0,1],xmm3[2,3],xmm1[4,5],xmm3[6,7]
[all …]
Dpr12312.ll1 …N: llc -mtriple=x86_64-unknown-unknown -mattr=+sse4.1,-avx < %s | FileCheck %s --check-prefix SSE41
14 ; SSE41: veccond128
15 ; SSE41: ptest
16 ; SSE41: ret
32 ; SSE41: veccond256
33 ; SSE41: por
34 ; SSE41: ptest
35 ; SSE41: ret
51 ; SSE41: veccond512
52 ; SSE41: por
[all …]
Dvselect-2.ll2 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=SSE41
11 ; SSE41-LABEL: test1:
12 ; SSE41: # BB#0:
13 ; SSE41-NEXT: pblendw {{.*#+}} xmm0 = xmm0[0,1,2,3],xmm1[4,5,6,7]
14 ; SSE41-NEXT: retq
25 ; SSE41-LABEL: test2:
26 ; SSE41: # BB#0:
27 ; SSE41-NEXT: pblendw {{.*#+}} xmm0 = xmm1[0,1,2,3],xmm0[4,5,6,7]
28 ; SSE41-NEXT: retq
40 ; SSE41-LABEL: test3:
[all …]
Dvector-blend.ll3 … %s -mtriple=x86_64-unknown-unknown -mcpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=SSE41
22 ; SSE41-LABEL: vsel_float:
23 ; SSE41: # BB#0: # %entry
24 ; SSE41-NEXT: blendps {{.*#+}} xmm0 = xmm0[0],xmm1[1],xmm0[2],xmm1[3]
25 ; SSE41-NEXT: retq
49 ; SSE41-LABEL: vsel_float2:
50 ; SSE41: # BB#0: # %entry
51 ; SSE41-NEXT: blendps {{.*#+}} xmm0 = xmm0[0],xmm1[1,2,3]
52 ; SSE41-NEXT: retq
76 ; SSE41-LABEL: vsel_4xi8:
[all …]
Dvector-shuffle-128-v8.ll3 …cpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
48 ; SSE41-LABEL: shuffle_v8i16_456789AB:
49 ; SSE41: # BB#0:
50 ; SSE41-NEXT: palignr {{.*#+}} xmm1 = xmm0[8,9,10,11,12,13,14,15],xmm1[0,1,2,3,4,5,6,7]
51 ; SSE41-NEXT: movdqa %xmm1, %xmm0
52 ; SSE41-NEXT: retq
75 ; SSE41-LABEL: shuffle_v8i16_00000000:
76 ; SSE41: # BB#0:
77 ; SSE41-NEXT: pshufb {{.*#+}} xmm0 = xmm0[0,1,0,1,0,1,0,1,0,1,0,1,0,1,0,1]
78 ; SSE41-NEXT: retq
[all …]
Dvector-trunc.ll3 …-unknown-unknown -mcpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=SSE --check-prefix=SSE41
21 ; SSE41-LABEL: trunc2x2i64:
22 ; SSE41: # BB#0: # %entry
23 ; SSE41-NEXT: pshufd {{.*#+}} xmm1 = xmm1[0,1,0,2]
24 ; SSE41-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,2,2,3]
25 ; SSE41-NEXT: pblendw {{.*#+}} xmm0 = xmm0[0,1,2,3],xmm1[4,5,6,7]
26 ; SSE41-NEXT: retq
83 ; SSE41-LABEL: trunc2x4i32:
84 ; SSE41: # BB#0: # %entry
85 ; SSE41-NEXT: movdqa {{.*#+}} xmm2 = [0,1,4,5,8,9,12,13,8,9,12,13,12,13,14,15]
[all …]
Dvec_setcc.ll2 … < %s -mtriple=x86_64-unknown-unknown -mcpu=x86-64 -mattr=sse4.1 | FileCheck %s -check-prefix=SSE41
13 ; SSE41-LABEL: v16i8_icmp_uge:
14 ; SSE41: pmaxub %xmm0, %xmm1
15 ; SSE41: pcmpeqb %xmm1, %xmm0
30 ; SSE41-LABEL: v16i8_icmp_ule:
31 ; SSE41: pminub %xmm0, %xmm1
32 ; SSE41: pcmpeqb %xmm1, %xmm0
49 ; SSE41-LABEL: v8i16_icmp_uge:
50 ; SSE41: pmaxuw %xmm0, %xmm1
51 ; SSE41: pcmpeqw %xmm1, %xmm0
[all …]
Dvector-shuffle-128-v4.ll4 …cpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
263 ; SSE41-LABEL: shuffle_v4f32_0022:
264 ; SSE41: # BB#0:
265 ; SSE41-NEXT: movsldup {{.*#+}} xmm0 = xmm0[0,0,2,2]
266 ; SSE41-NEXT: retq
291 ; SSE41-LABEL: shuffle_v4f32_1133:
292 ; SSE41: # BB#0:
293 ; SSE41-NEXT: movshdup {{.*#+}} xmm0 = xmm0[1,1,3,3]
294 ; SSE41-NEXT: retq
323 ; SSE41-LABEL: shuffle_v4i32_0124:
[all …]
Dvector-zext.ll3 …-unknown-unknown -mcpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=SSE --check-prefix=SSE41
28 ; SSE41-LABEL: zext_8i16_to_8i32:
29 ; SSE41: # BB#0: # %entry
30 ; SSE41-NEXT: movdqa %xmm0, %xmm1
31 ; SSE41-NEXT: pmovzxwd {{.*#+}} xmm0 = xmm1[0],zero,xmm1[1],zero,xmm1[2],zero,xmm1[3],zero
32 ; SSE41-NEXT: punpckhwd {{.*#+}} xmm1 = xmm1[4,4,5,5,6,6,7,7]
33 ; SSE41-NEXT: pand .LCPI0_0(%rip), %xmm1
34 ; SSE41-NEXT: retq
74 ; SSE41-LABEL: zext_4i32_to_4i64:
75 ; SSE41: # BB#0: # %entry
[all …]
Dpmul.ll2 …mtriple=x86_64-unknown-unknown -mattr=sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE41
16 ; SSE41-LABEL: a:
17 ; SSE41: # BB#0: # %entry
18 ; SSE41-NEXT: pmulld {{.*}}(%rip), %xmm0
19 ; SSE41-NEXT: retq
57 ; SSE41-LABEL: c:
58 ; SSE41: # BB#0: # %entry
59 ; SSE41-NEXT: pmulld %xmm1, %xmm0
60 ; SSE41-NEXT: retq
107 ; SSE41-LABEL: e:
[all …]
Dvec_uint_to_fp.ll2 …ple-macosx -mattr=+sse4.1 | FileCheck --check-prefix=CHECK --check-prefix=SSE41 --check-prefix=CST…
56 ; SSE41: movdqa [[LOWCSTADDR]](%rip), [[LOWVEC:%xmm[0-9]+]]
57 ; SSE41-NEXT: pblendw $85, %xmm0, [[LOWVEC]]
58 ; SSE41-NEXT: psrld $16, %xmm0
59 ; SSE41-NEXT: pblendw $170, [[HIGHCSTADDR]](%rip), %xmm0
60 ; SSE41-NEXT: addps [[MAGICCSTADDR]](%rip), %xmm0
61 ; SSE41-NEXT: addps [[LOWVEC]], %xmm0
62 ; SSE41-NEXT: retq
122 ; SSE41: movdqa {{.*#+}} [[LOWCST:xmm[0-9]+]] = [1258291200,1258291200,1258291200,1258291200]
123 ; SSE41-NEXT: movdqa %xmm0, [[VECLOW:%xmm[0-9]+]]
[all …]
Dvector-shuffle-128-v16.ll3 …cpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
33 ; SSE41-LABEL: shuffle_v16i8_00_00_00_00_00_00_00_00_00_00_00_00_00_00_00_00:
34 ; SSE41: # BB#0:
35 ; SSE41-NEXT: pxor %xmm1, %xmm1
36 ; SSE41-NEXT: pshufb %xmm1, %xmm0
37 ; SSE41-NEXT: retq
67 ; SSE41-LABEL: shuffle_v16i8_00_00_00_00_00_00_00_00_01_01_01_01_01_01_01_01:
68 ; SSE41: # BB#0:
69 ; SSE41-NEXT: pshufb {{.*#+}} xmm0 = xmm0[0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1]
70 ; SSE41-NEXT: retq
[all …]
Dcombine-64bit-vec-binop.ll1 …cpu=corei7 -mtriple=x86_64-unknown-linux-gnu | FileCheck %s -check-prefix=CHECK -check-prefix=SSE41
13 ; SSE41: paddd
26 ; SSE41: paddw
38 ; SSE41: paddb
51 ; SSE41: psubd
64 ; SSE41: psubw
77 ; SSE41: psubb
90 ; SSE41: pmulld
103 ; SSE41: pmullw
129 ; SSE41: andps
[all …]
Dvector-shuffle-combining.ll3 …cpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
292 ; SSE41-LABEL: combine_bitwise_ops_test1b:
293 ; SSE41: # BB#0:
294 ; SSE41-NEXT: pand %xmm1, %xmm0
295 ; SSE41-NEXT: pblendw {{.*#+}} xmm0 = xmm0[0,1],xmm2[2,3],xmm0[4,5],xmm2[6,7]
296 ; SSE41-NEXT: retq
332 ; SSE41-LABEL: combine_bitwise_ops_test2b:
333 ; SSE41: # BB#0:
334 ; SSE41-NEXT: por %xmm1, %xmm0
335 ; SSE41-NEXT: pblendw {{.*#+}} xmm0 = xmm0[0,1],xmm2[2,3],xmm0[4,5],xmm2[6,7]
[all …]
Dvec_compare-sse4.ll2 ; RUN: llc < %s -march=x86 -mattr=-sse4.2,+sse4.1 | FileCheck %s -check-prefix=SSE41
9 ; SSE41-LABEL: test1:
10 ; SSE41-NOT: pcmpgtq
11 ; SSE41: ret
25 ; SSE41-LABEL: test2:
26 ; SSE41: pcmpeqq
27 ; SSE41: ret
Dvector-shuffle-128-v2.ll4 …cpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
116 ; SSE41-LABEL: shuffle_v2f64_00:
117 ; SSE41: # BB#0:
118 ; SSE41-NEXT: movddup {{.*#+}} xmm0 = xmm0[0,0]
119 ; SSE41-NEXT: retq
171 ; SSE41-LABEL: shuffle_v2f64_22:
172 ; SSE41: # BB#0:
173 ; SSE41-NEXT: movddup {{.*#+}} xmm0 = xmm1[0,0]
174 ; SSE41-NEXT: retq
230 ; SSE41-LABEL: shuffle_v2f64_03:
[all …]
Dsse41-pmovxrm-intrinsics.ll1 …4-apple-darwin -mcpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=CHECK --check-prefix=SSE41
6 ; SSE41: pmovsxbw (%rdi), %xmm0
15 ; SSE41: pmovsxbd (%rdi), %xmm0
24 ; SSE41: pmovsxbq (%rdi), %xmm0
33 ; SSE41: pmovsxwd (%rdi), %xmm0
42 ; SSE41: pmovsxwq (%rdi), %xmm0
51 ; SSE41: pmovsxdq (%rdi), %xmm0
60 ; SSE41: pmovzxbw (%rdi), %xmm0
69 ; SSE41: pmovzxbd (%rdi), %xmm0
78 ; SSE41: pmovzxbq (%rdi), %xmm0
[all …]
Dextract-store.ll1 ; RUN: llc < %s -o - -mcpu=generic -march=x86-64 -mattr=+sse4.1 | FileCheck %s -check-prefix=SSE41
6 ; SSE41: pextrb
8 ; SSE41-NOT: movb
16 ; SSE41: pextrw
18 ; SSE41-NOT: movw
Dpmovsx-inreg.ll1 ; RUN: llc < %s -march=x86-64 -mcpu=penryn | FileCheck -check-prefix=SSE41 %s
15 ; SSE41-LABEL: test1:
16 ; SSE41: pmovsxbq
43 ; SSE41-LABEL: test3:
44 ; SSE41: pmovsxbd
71 ; SSE41-LABEL: test5:
72 ; SSE41: pmovsxbw
100 ; SSE41-LABEL: test7:
101 ; SSE41: pmovsxwq
128 ; SSE41-LABEL: test9:
[all …]
Dvector-zmov.ll3 …-unknown-unknown -mcpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=SSE --check-prefix=SSE41
/external/llvm/test/Analysis/CostModel/X86/
Dalternate-shuffle-cost.ll3 …-linux-gnu -mcpu=corei7 -cost-model -analyze | FileCheck %s -check-prefix=CHECK -check-prefix=SSE41
21 ; SSE41: Cost Model: {{.*}} 1 for instruction: %1 = shufflevector
32 ; SSE41: Cost Model: {{.*}} 1 for instruction: %1 = shufflevector
43 ; SSE41: Cost Model: {{.*}} 1 for instruction: %1 = shufflevector
54 ; SSE41: Cost Model: {{.*}} 1 for instruction: %1 = shufflevector
68 ; SSE41: Cost Model: {{.*}} 1 for instruction: %1 = shufflevector
79 ; SSE41: Cost Model: {{.*}} 1 for instruction: %1 = shufflevector
91 ; SSE41: Cost Model: {{.*}} 1 for instruction: %1 = shufflevector
103 ; SSE41: Cost Model: {{.*}} 1 for instruction: %1 = shufflevector
116 ; SSE41: Cost Model: {{.*}} 1 for instruction: %1 = shufflevector
[all …]
Dvselect-cost.ll2 …-linux-gnu -mcpu=corei7 -cost-model -analyze | FileCheck %s -check-prefix=CHECK -check-prefix=SSE41
9 ; SSE41 added blend instructions with an immediate for <2 x double> and
15 ; SSE41: Cost Model: {{.*}} 1 for instruction: %sel = select <2 x i1>
25 ; SSE41: Cost Model: {{.*}} 1 for instruction: %sel = select <2 x i1>
35 ; SSE41: Cost Model: {{.*}} 1 for instruction: %sel = select <4 x i1>
45 ; SSE41: Cost Model: {{.*}} 1 for instruction: %sel = select <4 x i1>
55 ; SSE41: Cost Model: {{.*}} 1 for instruction: %sel = select <16 x i1>
67 ; SSE41: Cost Model: {{.*}} 2 for instruction: %sel = select <4 x i1>
77 ; SSE41: Cost Model: {{.*}} 2 for instruction: %sel = select <4 x i1>
87 ; SSE41: Cost Model: {{.*}} 2 for instruction: %sel = select <8 x i1>
[all …]
Dvshift-cost.ll2 …-linux-gnu -mcpu=corei7 -cost-model -analyze | FileCheck %s -check-prefix=CHECK -check-prefix=SSE41
39 ; SSE41: Found an estimated cost of 1 for instruction: %shl
50 ; SSE41: Found an estimated cost of 1 for instruction: %shl
66 ; SSE41: Found an estimated cost of 20 for instruction: %shl
90 ; SSE41: Found an estimated cost of 2 for instruction: %shl
105 ; SSE41: Found an estimated cost of 2 for instruction: %shl
121 ; SSE41: Found an estimated cost of 40 for instruction: %shl
134 ; SSE41: Found an estimated cost of 4 for instruction: %shl
147 ; SSE41: Found an estimated cost of 4 for instruction: %shl
163 ; SSE41: Found an estimated cost of 80 for instruction: %shl
/external/llvm/lib/Target/X86/
DX86Subtarget.h50 NoMMXSSE, MMX, SSE1, SSE2, SSE3, SSSE3, SSE41, SSE42, AVX, AVX2, AVX512F enumerator
332 bool hasSSE41() const { return X86SSELevel >= SSE41; } in hasSSE41()

12