/external/swiftshader/third_party/llvm-7.0/llvm/test/CodeGen/X86/ |
D | ftrunc.ll | 2 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse2 | FileCheck %s --check-prefix=SSE2 7 ; SSE2-LABEL: trunc_unsigned_f32: 8 ; SSE2: # %bb.0: 9 ; SSE2-NEXT: cvttss2si %xmm0, %rax 10 ; SSE2-NEXT: movl %eax, %eax 11 ; SSE2-NEXT: xorps %xmm0, %xmm0 12 ; SSE2-NEXT: cvtsi2ssq %rax, %xmm0 13 ; SSE2-NEXT: retq 30 ; SSE2-LABEL: trunc_unsigned_f64: 31 ; SSE2: # %bb.0: [all …]
|
D | funnel-shift-rot.ll | 2 ; RUN: llc < %s -mtriple=i686-- -mattr=sse2 | FileCheck %s --check-prefixes=ANY,X32-SSE2 20 ; X32-SSE2-LABEL: rotl_i8_const_shift: 21 ; X32-SSE2: # %bb.0: 22 ; X32-SSE2-NEXT: movb {{[0-9]+}}(%esp), %al 23 ; X32-SSE2-NEXT: rolb $3, %al 24 ; X32-SSE2-NEXT: retl 36 ; X32-SSE2-LABEL: rotl_i64_const_shift: 37 ; X32-SSE2: # %bb.0: 38 ; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %ecx 39 ; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %edx [all …]
|
D | vselect-minmax.ll | 2 … -mtriple=x86_64-unknown-unknown -mattr=+sse2 | FileCheck %s --check-prefix=SSE --check-prefix=SSE2 10 ; SSE2-LABEL: test1: 11 ; SSE2: # %bb.0: # %entry 12 ; SSE2-NEXT: movdqa %xmm1, %xmm2 13 ; SSE2-NEXT: pcmpgtb %xmm0, %xmm2 14 ; SSE2-NEXT: pand %xmm2, %xmm0 15 ; SSE2-NEXT: pandn %xmm1, %xmm2 16 ; SSE2-NEXT: por %xmm2, %xmm0 17 ; SSE2-NEXT: retq 35 ; SSE2-LABEL: test2: [all …]
|
D | funnel-shift.ll | 2 ; RUN: llc < %s -mtriple=i686-- -mattr=sse2 | FileCheck %s --check-prefixes=ANY,X32-SSE2 20 ; X32-SSE2-LABEL: fshl_i32: 21 ; X32-SSE2: # %bb.0: 22 ; X32-SSE2-NEXT: pushl %edi 23 ; X32-SSE2-NEXT: pushl %esi 24 ; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %esi 25 ; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %edi 26 ; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %edx 27 ; X32-SSE2-NEXT: movl $32, %ecx 28 ; X32-SSE2-NEXT: subl %edx, %ecx [all …]
|
D | vector-bitreverse.ll | 2 …known-unknown -mattr=+sse2 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2 235 ; SSE2-LABEL: test_bitreverse_v16i8: 236 ; SSE2: # %bb.0: 237 ; SSE2-NEXT: movdqa {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15] 238 ; SSE2-NEXT: movdqa %xmm0, %xmm2 239 ; SSE2-NEXT: pand %xmm1, %xmm2 240 ; SSE2-NEXT: psllw $4, %xmm2 241 ; SSE2-NEXT: movdqa {{.*#+}} xmm3 = [240,240,240,240,240,240,240,240,240,240,240,240,240,240,240… 242 ; SSE2-NEXT: pand %xmm3, %xmm2 243 ; SSE2-NEXT: pand %xmm3, %xmm0 [all …]
|
D | vector-reduce-umin.ll | 2 …known-unknown -mattr=+sse2 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2 14 ; SSE2-LABEL: test_v2i64: 15 ; SSE2: # %bb.0: 16 ; SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm0[2,3,0,1] 17 ; SSE2-NEXT: movdqa {{.*#+}} xmm2 = [2147483648,2147483648,2147483648,2147483648] 18 ; SSE2-NEXT: movdqa %xmm0, %xmm3 19 ; SSE2-NEXT: pxor %xmm2, %xmm3 20 ; SSE2-NEXT: pxor %xmm1, %xmm2 21 ; SSE2-NEXT: movdqa %xmm2, %xmm4 22 ; SSE2-NEXT: pcmpgtd %xmm3, %xmm4 [all …]
|
D | vector-reduce-smax.ll | 2 …known-unknown -mattr=+sse2 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2 14 ; SSE2-LABEL: test_v2i64: 15 ; SSE2: # %bb.0: 16 ; SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm0[2,3,0,1] 17 ; SSE2-NEXT: movdqa {{.*#+}} xmm2 = [2147483648,0,2147483648,0] 18 ; SSE2-NEXT: movdqa %xmm0, %xmm3 19 ; SSE2-NEXT: pxor %xmm2, %xmm3 20 ; SSE2-NEXT: pxor %xmm1, %xmm2 21 ; SSE2-NEXT: movdqa %xmm3, %xmm4 22 ; SSE2-NEXT: pcmpgtd %xmm2, %xmm4 [all …]
|
D | vector-reduce-smin.ll | 2 …known-unknown -mattr=+sse2 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2 14 ; SSE2-LABEL: test_v2i64: 15 ; SSE2: # %bb.0: 16 ; SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm0[2,3,0,1] 17 ; SSE2-NEXT: movdqa {{.*#+}} xmm2 = [2147483648,0,2147483648,0] 18 ; SSE2-NEXT: movdqa %xmm0, %xmm3 19 ; SSE2-NEXT: pxor %xmm2, %xmm3 20 ; SSE2-NEXT: pxor %xmm1, %xmm2 21 ; SSE2-NEXT: movdqa %xmm2, %xmm4 22 ; SSE2-NEXT: pcmpgtd %xmm3, %xmm4 [all …]
|
D | vector-compare-results.ll | 2 … -mtriple=x86_64-unknown-unknown -mattr=+sse2 | FileCheck %s --check-prefix=SSE --check-prefix=SSE2 45 ; SSE2-LABEL: test_cmp_v2i64: 46 ; SSE2: # %bb.0: 47 ; SSE2-NEXT: movdqa {{.*#+}} xmm2 = [2147483648,0,2147483648,0] 48 ; SSE2-NEXT: pxor %xmm2, %xmm1 49 ; SSE2-NEXT: pxor %xmm2, %xmm0 50 ; SSE2-NEXT: movdqa %xmm0, %xmm2 51 ; SSE2-NEXT: pcmpgtd %xmm1, %xmm2 52 ; SSE2-NEXT: pshufd {{.*#+}} xmm3 = xmm2[0,0,2,2] 53 ; SSE2-NEXT: pcmpeqd %xmm1, %xmm0 [all …]
|
D | pr34080.ll | 2 ; RUN: llc < %s -mtriple=x86_64-apple-darwin -mattr=+sse2 | FileCheck %s --check-prefix=SSE2 3 … -mtriple=x86_64-apple-darwin -mattr=+sse2 -mcpu=x86-64 | FileCheck %s --check-prefix=SSE2-SCHEDULE 10 ; SSE2-LABEL: _Z1fe: 11 ; SSE2: ## %bb.0: ## %entry 12 ; SSE2-NEXT: pushq %rbp 13 ; SSE2-NEXT: .cfi_def_cfa_offset 16 14 ; SSE2-NEXT: .cfi_offset %rbp, -16 15 ; SSE2-NEXT: movq %rsp, %rbp 16 ; SSE2-NEXT: .cfi_def_cfa_register %rbp 17 ; SSE2-NEXT: fldt 16(%rbp) [all …]
|
D | widen_conv-4.ll | 2 …c < %s -mtriple=i686-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X86 --check-prefix=X86-SSE2 4 …< %s -mtriple=x86_64-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X64 --check-prefix=X64-SSE2 10 ; X86-SSE2-LABEL: convert_v7i16_v7f32: 11 ; X86-SSE2: # %bb.0: # %entry 12 ; X86-SSE2-NEXT: movl {{[0-9]+}}(%esp), %eax 13 ; X86-SSE2-NEXT: pxor %xmm1, %xmm1 14 ; X86-SSE2-NEXT: movdqa %xmm0, %xmm2 15 ; X86-SSE2-NEXT: punpckhwd {{.*#+}} xmm2 = xmm2[4],xmm1[4],xmm2[5],xmm1[5],xmm2[6],xmm1[6],xmm2[… 16 ; X86-SSE2-NEXT: cvtdq2ps %xmm2, %xmm2 17 ; X86-SSE2-NEXT: punpcklwd {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1],xmm0[2],xmm1[2],xmm0[… [all …]
|
D | vector-reduce-umax.ll | 2 …known-unknown -mattr=+sse2 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2 14 ; SSE2-LABEL: test_v2i64: 15 ; SSE2: # %bb.0: 16 ; SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm0[2,3,0,1] 17 ; SSE2-NEXT: movdqa {{.*#+}} xmm2 = [2147483648,2147483648,2147483648,2147483648] 18 ; SSE2-NEXT: movdqa %xmm0, %xmm3 19 ; SSE2-NEXT: pxor %xmm2, %xmm3 20 ; SSE2-NEXT: pxor %xmm1, %xmm2 21 ; SSE2-NEXT: movdqa %xmm3, %xmm4 22 ; SSE2-NEXT: pcmpgtd %xmm2, %xmm4 [all …]
|
D | widen_conv-3.ll | 2 …c < %s -mtriple=i686-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X86 --check-prefix=X86-SSE2 4 …< %s -mtriple=x86_64-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X64 --check-prefix=X64-SSE2 10 ; X86-SSE2-LABEL: convert_v2i16_to_v2f32: 11 ; X86-SSE2: # %bb.0: # %entry 12 ; X86-SSE2-NEXT: movl {{[0-9]+}}(%esp), %eax 13 ; X86-SSE2-NEXT: psllq $48, %xmm0 14 ; X86-SSE2-NEXT: psrad $16, %xmm0 15 ; X86-SSE2-NEXT: pshufd {{.*#+}} xmm0 = xmm0[1,3,2,3] 16 ; X86-SSE2-NEXT: cvtdq2ps %xmm0, %xmm0 17 ; X86-SSE2-NEXT: movss %xmm0, (%eax) [all …]
|
D | trunc-ext-ld-st.ll | 2 …c < %s -mtriple=x86_64-unknown -mattr=+sse2 | FileCheck %s --check-prefix=CHECK --check-prefix=SSE2 7 ; SSE2-LABEL: load_2_i8: 8 ; SSE2: # %bb.0: 9 ; SSE2-NEXT: movzwl (%rdi), %eax 10 ; SSE2-NEXT: movd %eax, %xmm0 11 ; SSE2-NEXT: punpcklbw {{.*#+}} xmm0 = xmm0[0,0,1,1,2,2,3,3,4,4,5,5,6,6,7,7] 12 ; SSE2-NEXT: punpcklwd {{.*#+}} xmm0 = xmm0[0,0,1,1,2,2,3,3] 13 ; SSE2-NEXT: pshufd {{.*#+}} xmm0 = xmm0[0,1,1,3] 14 ; SSE2-NEXT: paddq {{.*}}(%rip), %xmm0 15 ; SSE2-NEXT: pand {{.*}}(%rip), %xmm0 [all …]
|
D | setcc-wide-types.ll | 2 …triple=x86_64-unknown-unknown -mattr=sse2 | FileCheck %s --check-prefix=ANY --check-prefix=SSE2 11 ; SSE2-LABEL: ne_i128: 12 ; SSE2: # %bb.0: 13 ; SSE2-NEXT: pcmpeqb %xmm1, %xmm0 14 ; SSE2-NEXT: pmovmskb %xmm0, %ecx 15 ; SSE2-NEXT: xorl %eax, %eax 16 ; SSE2-NEXT: cmpl $65535, %ecx # imm = 0xFFFF 17 ; SSE2-NEXT: setne %al 18 ; SSE2-NEXT: retq 36 ; SSE2-LABEL: eq_i128: [all …]
|
/external/llvm/test/Analysis/CostModel/X86/ |
D | testshiftlshr.ll | 1 ; RUN: llc -mtriple=x86_64-apple-darwin -mcpu=core2 < %s | FileCheck --check-prefix=SSE2-CODEGEN %s 2 …triple=x86_64-apple-darwin -mcpu=core2 -cost-model -analyze < %s | FileCheck --check-prefix=SSE2 %s 7 ; SSE2: shift2i16 8 ; SSE2: cost of 4 {{.*}} lshr 9 ; SSE2-CODEGEN: shift2i16 10 ; SSE2-CODEGEN: psrlq 19 ; SSE2: shift4i16 20 ; SSE2: cost of 16 {{.*}} lshr 21 ; SSE2-CODEGEN: shift4i16 22 ; SSE2-CODEGEN: psrld [all …]
|
D | testshiftashr.ll | 1 ; RUN: llc -mtriple=x86_64-apple-darwin -mcpu=core2 < %s | FileCheck --check-prefix=SSE2-CODEGEN %s 2 …triple=x86_64-apple-darwin -mcpu=core2 -cost-model -analyze < %s | FileCheck --check-prefix=SSE2 %s 7 ; SSE2: shift2i16 8 ; SSE2: cost of 12 {{.*}} ashr 9 ; SSE2-CODEGEN: shift2i16 10 ; SSE2-CODEGEN: psrlq 19 ; SSE2: shift4i16 20 ; SSE2: cost of 16 {{.*}} ashr 21 ; SSE2-CODEGEN: shift4i16 22 ; SSE2-CODEGEN: psrad [all …]
|
D | testshiftshl.ll | 1 ; RUN: llc -mtriple=x86_64-apple-darwin -mcpu=core2 < %s | FileCheck --check-prefix=SSE2-CODEGEN %s 2 …triple=x86_64-apple-darwin -mcpu=core2 -cost-model -analyze < %s | FileCheck --check-prefix=SSE2 %s 7 ; SSE2: shift2i16 8 ; SSE2: cost of 4 {{.*}} shl 9 ; SSE2-CODEGEN: shift2i16 10 ; SSE2-CODEGEN: psllq 19 ; SSE2: shift4i16 20 ; SSE2: cost of 10 {{.*}} shl 21 ; SSE2-CODEGEN: shift4i16 22 ; SSE2-CODEGEN: pmuludq [all …]
|
/external/swiftshader/third_party/llvm-7.0/llvm/test/Analysis/CostModel/X86/ |
D | testshiftlshr.ll | 1 ; RUN: llc -mtriple=x86_64-apple-darwin -mcpu=core2 < %s | FileCheck --check-prefix=SSE2-CODEGEN %s 2 …triple=x86_64-apple-darwin -mcpu=core2 -cost-model -analyze < %s | FileCheck --check-prefix=SSE2 %s 7 ; SSE2: shift2i16 8 ; SSE2: cost of 4 {{.*}} lshr 9 ; SSE2-CODEGEN: shift2i16 10 ; SSE2-CODEGEN: psrlq 19 ; SSE2: shift4i16 20 ; SSE2: cost of 16 {{.*}} lshr 21 ; SSE2-CODEGEN: shift4i16 22 ; SSE2-CODEGEN: psrld [all …]
|
D | testshiftashr.ll | 1 ; RUN: llc -mtriple=x86_64-apple-darwin -mcpu=core2 < %s | FileCheck --check-prefix=SSE2-CODEGEN %s 2 …triple=x86_64-apple-darwin -mcpu=core2 -cost-model -analyze < %s | FileCheck --check-prefix=SSE2 %s 7 ; SSE2: shift2i16 8 ; SSE2: cost of 12 {{.*}} ashr 9 ; SSE2-CODEGEN: shift2i16 10 ; SSE2-CODEGEN: psrlq 19 ; SSE2: shift4i16 20 ; SSE2: cost of 16 {{.*}} ashr 21 ; SSE2-CODEGEN: shift4i16 22 ; SSE2-CODEGEN: psrad [all …]
|
D | testshiftshl.ll | 1 ; RUN: llc -mtriple=x86_64-apple-darwin -mcpu=core2 < %s | FileCheck --check-prefix=SSE2-CODEGEN %s 2 …triple=x86_64-apple-darwin -mcpu=core2 -cost-model -analyze < %s | FileCheck --check-prefix=SSE2 %s 7 ; SSE2: shift2i16 8 ; SSE2: cost of 4 {{.*}} shl 9 ; SSE2-CODEGEN: shift2i16 10 ; SSE2-CODEGEN: psllq 19 ; SSE2: shift4i16 20 ; SSE2: cost of 10 {{.*}} shl 21 ; SSE2-CODEGEN: shift4i16 22 ; SSE2-CODEGEN: pmuludq [all …]
|
/external/llvm/test/CodeGen/X86/ |
D | vselect-minmax.ll | 2 … -mtriple=x86_64-unknown-unknown -mattr=+sse2 | FileCheck %s --check-prefix=SSE --check-prefix=SSE2 10 ; SSE2-LABEL: test1: 11 ; SSE2: # BB#0: # %entry 12 ; SSE2-NEXT: movdqa %xmm1, %xmm2 13 ; SSE2-NEXT: pcmpgtb %xmm0, %xmm2 14 ; SSE2-NEXT: pand %xmm2, %xmm0 15 ; SSE2-NEXT: pandn %xmm1, %xmm2 16 ; SSE2-NEXT: por %xmm2, %xmm0 17 ; SSE2-NEXT: retq 35 ; SSE2-LABEL: test2: [all …]
|
D | widen_conv-4.ll | 2 …c < %s -mtriple=i686-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X86 --check-prefix=X86-SSE2 4 …< %s -mtriple=x86_64-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X64 --check-prefix=X64-SSE2 10 ; X86-SSE2-LABEL: convert_v7i16_v7f32: 11 ; X86-SSE2: # BB#0: # %entry 12 ; X86-SSE2-NEXT: movl {{[0-9]+}}(%esp), %eax 13 ; X86-SSE2-NEXT: pxor %xmm1, %xmm1 14 ; X86-SSE2-NEXT: movdqa %xmm0, %xmm2 15 ; X86-SSE2-NEXT: punpckhwd {{.*#+}} xmm2 = xmm2[4],xmm1[4],xmm2[5],xmm1[5],xmm2[6],xmm1[6],xmm2[… 16 ; X86-SSE2-NEXT: cvtdq2ps %xmm2, %xmm2 17 ; X86-SSE2-NEXT: punpcklwd {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1],xmm0[2],xmm1[2],xmm0[… [all …]
|
D | widen_conv-3.ll | 2 …c < %s -mtriple=i686-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X86 --check-prefix=X86-SSE2 4 …< %s -mtriple=x86_64-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X64 --check-prefix=X64-SSE2 10 ; X86-SSE2-LABEL: convert_v2i16_to_v2f32: 11 ; X86-SSE2: # BB#0: # %entry 12 ; X86-SSE2-NEXT: movl {{[0-9]+}}(%esp), %eax 13 ; X86-SSE2-NEXT: psllq $48, %xmm0 14 ; X86-SSE2-NEXT: psrad $16, %xmm0 15 ; X86-SSE2-NEXT: pshufd {{.*#+}} xmm0 = xmm0[1,3,2,3] 16 ; X86-SSE2-NEXT: cvtdq2ps %xmm0, %xmm0 17 ; X86-SSE2-NEXT: movss %xmm0, (%eax) [all …]
|
D | vector-bitreverse.ll | 2 …known-unknown -mattr=+sse2 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE2 1022 ; SSE2-LABEL: test_bitreverse_v16i8: 1023 ; SSE2: # BB#0: 1024 ; SSE2-NEXT: movdqa %xmm0, %xmm2 1025 ; SSE2-NEXT: psrlw $7, %xmm2 1026 ; SSE2-NEXT: movdqa {{.*#+}} xmm1 = [1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1] 1027 ; SSE2-NEXT: pand %xmm1, %xmm1 1028 ; SSE2-NEXT: pand %xmm2, %xmm1 1029 ; SSE2-NEXT: movdqa %xmm0, %xmm2 1030 ; SSE2-NEXT: psllw $7, %xmm2 [all …]
|