Home
last modified time | relevance | path

Searched refs:SSE2 (Results 1 – 25 of 530) sorted by relevance

12345678910>>...22

/external/swiftshader/third_party/llvm-7.0/llvm/test/CodeGen/X86/
Dftrunc.ll2 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse2 | FileCheck %s --check-prefix=SSE2
7 ; SSE2-LABEL: trunc_unsigned_f32:
8 ; SSE2: # %bb.0:
9 ; SSE2-NEXT: cvttss2si %xmm0, %rax
10 ; SSE2-NEXT: movl %eax, %eax
11 ; SSE2-NEXT: xorps %xmm0, %xmm0
12 ; SSE2-NEXT: cvtsi2ssq %rax, %xmm0
13 ; SSE2-NEXT: retq
30 ; SSE2-LABEL: trunc_unsigned_f64:
31 ; SSE2: # %bb.0:
[all …]
Dfunnel-shift-rot.ll2 ; RUN: llc < %s -mtriple=i686-- -mattr=sse2 | FileCheck %s --check-prefixes=ANY,X32-SSE2
20 ; X32-SSE2-LABEL: rotl_i8_const_shift:
21 ; X32-SSE2: # %bb.0:
22 ; X32-SSE2-NEXT: movb {{[0-9]+}}(%esp), %al
23 ; X32-SSE2-NEXT: rolb $3, %al
24 ; X32-SSE2-NEXT: retl
36 ; X32-SSE2-LABEL: rotl_i64_const_shift:
37 ; X32-SSE2: # %bb.0:
38 ; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %ecx
39 ; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %edx
[all …]
Dvselect-minmax.ll2 … -mtriple=x86_64-unknown-unknown -mattr=+sse2 | FileCheck %s --check-prefix=SSE --check-prefix=SSE2
10 ; SSE2-LABEL: test1:
11 ; SSE2: # %bb.0: # %entry
12 ; SSE2-NEXT: movdqa %xmm1, %xmm2
13 ; SSE2-NEXT: pcmpgtb %xmm0, %xmm2
14 ; SSE2-NEXT: pand %xmm2, %xmm0
15 ; SSE2-NEXT: pandn %xmm1, %xmm2
16 ; SSE2-NEXT: por %xmm2, %xmm0
17 ; SSE2-NEXT: retq
35 ; SSE2-LABEL: test2:
[all …]
Dfunnel-shift.ll2 ; RUN: llc < %s -mtriple=i686-- -mattr=sse2 | FileCheck %s --check-prefixes=ANY,X32-SSE2
20 ; X32-SSE2-LABEL: fshl_i32:
21 ; X32-SSE2: # %bb.0:
22 ; X32-SSE2-NEXT: pushl %edi
23 ; X32-SSE2-NEXT: pushl %esi
24 ; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %esi
25 ; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %edi
26 ; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %edx
27 ; X32-SSE2-NEXT: movl $32, %ecx
28 ; X32-SSE2-NEXT: subl %edx, %ecx
[all …]
Dvector-bitreverse.ll2 …known-unknown -mattr=+sse2 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2
235 ; SSE2-LABEL: test_bitreverse_v16i8:
236 ; SSE2: # %bb.0:
237 ; SSE2-NEXT: movdqa {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15]
238 ; SSE2-NEXT: movdqa %xmm0, %xmm2
239 ; SSE2-NEXT: pand %xmm1, %xmm2
240 ; SSE2-NEXT: psllw $4, %xmm2
241 ; SSE2-NEXT: movdqa {{.*#+}} xmm3 = [240,240,240,240,240,240,240,240,240,240,240,240,240,240,240…
242 ; SSE2-NEXT: pand %xmm3, %xmm2
243 ; SSE2-NEXT: pand %xmm3, %xmm0
[all …]
Dvector-reduce-umin.ll2 …known-unknown -mattr=+sse2 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2
14 ; SSE2-LABEL: test_v2i64:
15 ; SSE2: # %bb.0:
16 ; SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm0[2,3,0,1]
17 ; SSE2-NEXT: movdqa {{.*#+}} xmm2 = [2147483648,2147483648,2147483648,2147483648]
18 ; SSE2-NEXT: movdqa %xmm0, %xmm3
19 ; SSE2-NEXT: pxor %xmm2, %xmm3
20 ; SSE2-NEXT: pxor %xmm1, %xmm2
21 ; SSE2-NEXT: movdqa %xmm2, %xmm4
22 ; SSE2-NEXT: pcmpgtd %xmm3, %xmm4
[all …]
Dvector-reduce-smax.ll2 …known-unknown -mattr=+sse2 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2
14 ; SSE2-LABEL: test_v2i64:
15 ; SSE2: # %bb.0:
16 ; SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm0[2,3,0,1]
17 ; SSE2-NEXT: movdqa {{.*#+}} xmm2 = [2147483648,0,2147483648,0]
18 ; SSE2-NEXT: movdqa %xmm0, %xmm3
19 ; SSE2-NEXT: pxor %xmm2, %xmm3
20 ; SSE2-NEXT: pxor %xmm1, %xmm2
21 ; SSE2-NEXT: movdqa %xmm3, %xmm4
22 ; SSE2-NEXT: pcmpgtd %xmm2, %xmm4
[all …]
Dvector-reduce-smin.ll2 …known-unknown -mattr=+sse2 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2
14 ; SSE2-LABEL: test_v2i64:
15 ; SSE2: # %bb.0:
16 ; SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm0[2,3,0,1]
17 ; SSE2-NEXT: movdqa {{.*#+}} xmm2 = [2147483648,0,2147483648,0]
18 ; SSE2-NEXT: movdqa %xmm0, %xmm3
19 ; SSE2-NEXT: pxor %xmm2, %xmm3
20 ; SSE2-NEXT: pxor %xmm1, %xmm2
21 ; SSE2-NEXT: movdqa %xmm2, %xmm4
22 ; SSE2-NEXT: pcmpgtd %xmm3, %xmm4
[all …]
Dvector-compare-results.ll2 … -mtriple=x86_64-unknown-unknown -mattr=+sse2 | FileCheck %s --check-prefix=SSE --check-prefix=SSE2
45 ; SSE2-LABEL: test_cmp_v2i64:
46 ; SSE2: # %bb.0:
47 ; SSE2-NEXT: movdqa {{.*#+}} xmm2 = [2147483648,0,2147483648,0]
48 ; SSE2-NEXT: pxor %xmm2, %xmm1
49 ; SSE2-NEXT: pxor %xmm2, %xmm0
50 ; SSE2-NEXT: movdqa %xmm0, %xmm2
51 ; SSE2-NEXT: pcmpgtd %xmm1, %xmm2
52 ; SSE2-NEXT: pshufd {{.*#+}} xmm3 = xmm2[0,0,2,2]
53 ; SSE2-NEXT: pcmpeqd %xmm1, %xmm0
[all …]
Dpr34080.ll2 ; RUN: llc < %s -mtriple=x86_64-apple-darwin -mattr=+sse2 | FileCheck %s --check-prefix=SSE2
3 … -mtriple=x86_64-apple-darwin -mattr=+sse2 -mcpu=x86-64 | FileCheck %s --check-prefix=SSE2-SCHEDULE
10 ; SSE2-LABEL: _Z1fe:
11 ; SSE2: ## %bb.0: ## %entry
12 ; SSE2-NEXT: pushq %rbp
13 ; SSE2-NEXT: .cfi_def_cfa_offset 16
14 ; SSE2-NEXT: .cfi_offset %rbp, -16
15 ; SSE2-NEXT: movq %rsp, %rbp
16 ; SSE2-NEXT: .cfi_def_cfa_register %rbp
17 ; SSE2-NEXT: fldt 16(%rbp)
[all …]
Dwiden_conv-4.ll2 …c < %s -mtriple=i686-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X86 --check-prefix=X86-SSE2
4 …< %s -mtriple=x86_64-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X64 --check-prefix=X64-SSE2
10 ; X86-SSE2-LABEL: convert_v7i16_v7f32:
11 ; X86-SSE2: # %bb.0: # %entry
12 ; X86-SSE2-NEXT: movl {{[0-9]+}}(%esp), %eax
13 ; X86-SSE2-NEXT: pxor %xmm1, %xmm1
14 ; X86-SSE2-NEXT: movdqa %xmm0, %xmm2
15 ; X86-SSE2-NEXT: punpckhwd {{.*#+}} xmm2 = xmm2[4],xmm1[4],xmm2[5],xmm1[5],xmm2[6],xmm1[6],xmm2[…
16 ; X86-SSE2-NEXT: cvtdq2ps %xmm2, %xmm2
17 ; X86-SSE2-NEXT: punpcklwd {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1],xmm0[2],xmm1[2],xmm0[…
[all …]
Dvector-reduce-umax.ll2 …known-unknown -mattr=+sse2 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2
14 ; SSE2-LABEL: test_v2i64:
15 ; SSE2: # %bb.0:
16 ; SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm0[2,3,0,1]
17 ; SSE2-NEXT: movdqa {{.*#+}} xmm2 = [2147483648,2147483648,2147483648,2147483648]
18 ; SSE2-NEXT: movdqa %xmm0, %xmm3
19 ; SSE2-NEXT: pxor %xmm2, %xmm3
20 ; SSE2-NEXT: pxor %xmm1, %xmm2
21 ; SSE2-NEXT: movdqa %xmm3, %xmm4
22 ; SSE2-NEXT: pcmpgtd %xmm2, %xmm4
[all …]
Dwiden_conv-3.ll2 …c < %s -mtriple=i686-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X86 --check-prefix=X86-SSE2
4 …< %s -mtriple=x86_64-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X64 --check-prefix=X64-SSE2
10 ; X86-SSE2-LABEL: convert_v2i16_to_v2f32:
11 ; X86-SSE2: # %bb.0: # %entry
12 ; X86-SSE2-NEXT: movl {{[0-9]+}}(%esp), %eax
13 ; X86-SSE2-NEXT: psllq $48, %xmm0
14 ; X86-SSE2-NEXT: psrad $16, %xmm0
15 ; X86-SSE2-NEXT: pshufd {{.*#+}} xmm0 = xmm0[1,3,2,3]
16 ; X86-SSE2-NEXT: cvtdq2ps %xmm0, %xmm0
17 ; X86-SSE2-NEXT: movss %xmm0, (%eax)
[all …]
Dtrunc-ext-ld-st.ll2 …c < %s -mtriple=x86_64-unknown -mattr=+sse2 | FileCheck %s --check-prefix=CHECK --check-prefix=SSE2
7 ; SSE2-LABEL: load_2_i8:
8 ; SSE2: # %bb.0:
9 ; SSE2-NEXT: movzwl (%rdi), %eax
10 ; SSE2-NEXT: movd %eax, %xmm0
11 ; SSE2-NEXT: punpcklbw {{.*#+}} xmm0 = xmm0[0,0,1,1,2,2,3,3,4,4,5,5,6,6,7,7]
12 ; SSE2-NEXT: punpcklwd {{.*#+}} xmm0 = xmm0[0,0,1,1,2,2,3,3]
13 ; SSE2-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,1,1,3]
14 ; SSE2-NEXT: paddq {{.*}}(%rip), %xmm0
15 ; SSE2-NEXT: pand {{.*}}(%rip), %xmm0
[all …]
Dsetcc-wide-types.ll2 …triple=x86_64-unknown-unknown -mattr=sse2 | FileCheck %s --check-prefix=ANY --check-prefix=SSE2
11 ; SSE2-LABEL: ne_i128:
12 ; SSE2: # %bb.0:
13 ; SSE2-NEXT: pcmpeqb %xmm1, %xmm0
14 ; SSE2-NEXT: pmovmskb %xmm0, %ecx
15 ; SSE2-NEXT: xorl %eax, %eax
16 ; SSE2-NEXT: cmpl $65535, %ecx # imm = 0xFFFF
17 ; SSE2-NEXT: setne %al
18 ; SSE2-NEXT: retq
36 ; SSE2-LABEL: eq_i128:
[all …]
/external/llvm/test/Analysis/CostModel/X86/
Dtestshiftlshr.ll1 ; RUN: llc -mtriple=x86_64-apple-darwin -mcpu=core2 < %s | FileCheck --check-prefix=SSE2-CODEGEN %s
2 …triple=x86_64-apple-darwin -mcpu=core2 -cost-model -analyze < %s | FileCheck --check-prefix=SSE2 %s
7 ; SSE2: shift2i16
8 ; SSE2: cost of 4 {{.*}} lshr
9 ; SSE2-CODEGEN: shift2i16
10 ; SSE2-CODEGEN: psrlq
19 ; SSE2: shift4i16
20 ; SSE2: cost of 16 {{.*}} lshr
21 ; SSE2-CODEGEN: shift4i16
22 ; SSE2-CODEGEN: psrld
[all …]
Dtestshiftashr.ll1 ; RUN: llc -mtriple=x86_64-apple-darwin -mcpu=core2 < %s | FileCheck --check-prefix=SSE2-CODEGEN %s
2 …triple=x86_64-apple-darwin -mcpu=core2 -cost-model -analyze < %s | FileCheck --check-prefix=SSE2 %s
7 ; SSE2: shift2i16
8 ; SSE2: cost of 12 {{.*}} ashr
9 ; SSE2-CODEGEN: shift2i16
10 ; SSE2-CODEGEN: psrlq
19 ; SSE2: shift4i16
20 ; SSE2: cost of 16 {{.*}} ashr
21 ; SSE2-CODEGEN: shift4i16
22 ; SSE2-CODEGEN: psrad
[all …]
Dtestshiftshl.ll1 ; RUN: llc -mtriple=x86_64-apple-darwin -mcpu=core2 < %s | FileCheck --check-prefix=SSE2-CODEGEN %s
2 …triple=x86_64-apple-darwin -mcpu=core2 -cost-model -analyze < %s | FileCheck --check-prefix=SSE2 %s
7 ; SSE2: shift2i16
8 ; SSE2: cost of 4 {{.*}} shl
9 ; SSE2-CODEGEN: shift2i16
10 ; SSE2-CODEGEN: psllq
19 ; SSE2: shift4i16
20 ; SSE2: cost of 10 {{.*}} shl
21 ; SSE2-CODEGEN: shift4i16
22 ; SSE2-CODEGEN: pmuludq
[all …]
/external/swiftshader/third_party/llvm-7.0/llvm/test/Analysis/CostModel/X86/
Dtestshiftlshr.ll1 ; RUN: llc -mtriple=x86_64-apple-darwin -mcpu=core2 < %s | FileCheck --check-prefix=SSE2-CODEGEN %s
2 …triple=x86_64-apple-darwin -mcpu=core2 -cost-model -analyze < %s | FileCheck --check-prefix=SSE2 %s
7 ; SSE2: shift2i16
8 ; SSE2: cost of 4 {{.*}} lshr
9 ; SSE2-CODEGEN: shift2i16
10 ; SSE2-CODEGEN: psrlq
19 ; SSE2: shift4i16
20 ; SSE2: cost of 16 {{.*}} lshr
21 ; SSE2-CODEGEN: shift4i16
22 ; SSE2-CODEGEN: psrld
[all …]
Dtestshiftashr.ll1 ; RUN: llc -mtriple=x86_64-apple-darwin -mcpu=core2 < %s | FileCheck --check-prefix=SSE2-CODEGEN %s
2 …triple=x86_64-apple-darwin -mcpu=core2 -cost-model -analyze < %s | FileCheck --check-prefix=SSE2 %s
7 ; SSE2: shift2i16
8 ; SSE2: cost of 12 {{.*}} ashr
9 ; SSE2-CODEGEN: shift2i16
10 ; SSE2-CODEGEN: psrlq
19 ; SSE2: shift4i16
20 ; SSE2: cost of 16 {{.*}} ashr
21 ; SSE2-CODEGEN: shift4i16
22 ; SSE2-CODEGEN: psrad
[all …]
Dtestshiftshl.ll1 ; RUN: llc -mtriple=x86_64-apple-darwin -mcpu=core2 < %s | FileCheck --check-prefix=SSE2-CODEGEN %s
2 …triple=x86_64-apple-darwin -mcpu=core2 -cost-model -analyze < %s | FileCheck --check-prefix=SSE2 %s
7 ; SSE2: shift2i16
8 ; SSE2: cost of 4 {{.*}} shl
9 ; SSE2-CODEGEN: shift2i16
10 ; SSE2-CODEGEN: psllq
19 ; SSE2: shift4i16
20 ; SSE2: cost of 10 {{.*}} shl
21 ; SSE2-CODEGEN: shift4i16
22 ; SSE2-CODEGEN: pmuludq
[all …]
/external/llvm/test/CodeGen/X86/
Dvselect-minmax.ll2 … -mtriple=x86_64-unknown-unknown -mattr=+sse2 | FileCheck %s --check-prefix=SSE --check-prefix=SSE2
10 ; SSE2-LABEL: test1:
11 ; SSE2: # BB#0: # %entry
12 ; SSE2-NEXT: movdqa %xmm1, %xmm2
13 ; SSE2-NEXT: pcmpgtb %xmm0, %xmm2
14 ; SSE2-NEXT: pand %xmm2, %xmm0
15 ; SSE2-NEXT: pandn %xmm1, %xmm2
16 ; SSE2-NEXT: por %xmm2, %xmm0
17 ; SSE2-NEXT: retq
35 ; SSE2-LABEL: test2:
[all …]
Dwiden_conv-4.ll2 …c < %s -mtriple=i686-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X86 --check-prefix=X86-SSE2
4 …< %s -mtriple=x86_64-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X64 --check-prefix=X64-SSE2
10 ; X86-SSE2-LABEL: convert_v7i16_v7f32:
11 ; X86-SSE2: # BB#0: # %entry
12 ; X86-SSE2-NEXT: movl {{[0-9]+}}(%esp), %eax
13 ; X86-SSE2-NEXT: pxor %xmm1, %xmm1
14 ; X86-SSE2-NEXT: movdqa %xmm0, %xmm2
15 ; X86-SSE2-NEXT: punpckhwd {{.*#+}} xmm2 = xmm2[4],xmm1[4],xmm2[5],xmm1[5],xmm2[6],xmm1[6],xmm2[…
16 ; X86-SSE2-NEXT: cvtdq2ps %xmm2, %xmm2
17 ; X86-SSE2-NEXT: punpcklwd {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1],xmm0[2],xmm1[2],xmm0[…
[all …]
Dwiden_conv-3.ll2 …c < %s -mtriple=i686-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X86 --check-prefix=X86-SSE2
4 …< %s -mtriple=x86_64-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X64 --check-prefix=X64-SSE2
10 ; X86-SSE2-LABEL: convert_v2i16_to_v2f32:
11 ; X86-SSE2: # BB#0: # %entry
12 ; X86-SSE2-NEXT: movl {{[0-9]+}}(%esp), %eax
13 ; X86-SSE2-NEXT: psllq $48, %xmm0
14 ; X86-SSE2-NEXT: psrad $16, %xmm0
15 ; X86-SSE2-NEXT: pshufd {{.*#+}} xmm0 = xmm0[1,3,2,3]
16 ; X86-SSE2-NEXT: cvtdq2ps %xmm0, %xmm0
17 ; X86-SSE2-NEXT: movss %xmm0, (%eax)
[all …]
Dvector-bitreverse.ll2 …known-unknown -mattr=+sse2 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2
1022 ; SSE2-LABEL: test_bitreverse_v16i8:
1023 ; SSE2: # BB#0:
1024 ; SSE2-NEXT: movdqa %xmm0, %xmm2
1025 ; SSE2-NEXT: psrlw $7, %xmm2
1026 ; SSE2-NEXT: movdqa {{.*#+}} xmm1 = [1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1]
1027 ; SSE2-NEXT: pand %xmm1, %xmm1
1028 ; SSE2-NEXT: pand %xmm2, %xmm1
1029 ; SSE2-NEXT: movdqa %xmm0, %xmm2
1030 ; SSE2-NEXT: psllw $7, %xmm2
[all …]

12345678910>>...22