; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=i686-unknown -mattr=+sse2,-sse4.1 | FileCheck %s --check-prefix=X32
; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+sse2,-sse4.1 | FileCheck %s --check-prefix=X64

; Checks the code llc emits for insertelement at a constant, non-zero lane
; when SSE2 is enabled and SSE4.1 is explicitly disabled. Both an i686 and an
; x86_64 triple are exercised; each has its own check prefix.

; Insert a scalar float into lane 3 of a <4 x float>. The expected output
; builds the result with a pair of shufps instructions on both targets.
define <4 x float> @t1(float %s, <4 x float> %tmp) nounwind {
; X32-LABEL: t1:
; X32:       # BB#0:
; X32-NEXT:    movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
; X32-NEXT:    shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,0]
; X32-NEXT:    shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,0]
; X32-NEXT:    retl
;
; X64-LABEL: t1:
; X64:       # BB#0:
; X64-NEXT:    shufps {{.*#+}} xmm0 = xmm0[0,0],xmm1[2,0]
; X64-NEXT:    shufps {{.*#+}} xmm1 = xmm1[0,1],xmm0[2,0]
; X64-NEXT:    movaps %xmm1, %xmm0
; X64-NEXT:    retq
  %tmp1 = insertelement <4 x float> %tmp, float %s, i32 3
  ret <4 x float> %tmp1
}

; Insert a scalar i32 into lane 3 of a <4 x i32>. The scalar is first moved
; into an XMM register with movd, then merged with the same shufps pair.
define <4 x i32> @t2(i32 %s, <4 x i32> %tmp) nounwind {
; X32-LABEL: t2:
; X32:       # BB#0:
; X32-NEXT:    movd {{.*#+}} xmm1 = mem[0],zero,zero,zero
; X32-NEXT:    shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,0]
; X32-NEXT:    shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,0]
; X32-NEXT:    retl
;
; X64-LABEL: t2:
; X64:       # BB#0:
; X64-NEXT:    movd %edi, %xmm1
; X64-NEXT:    shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,0]
; X64-NEXT:    shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,0]
; X64-NEXT:    retq
  %tmp1 = insertelement <4 x i32> %tmp, i32 %s, i32 3
  ret <4 x i32> %tmp1
}

; Insert a scalar double into lane 1 of a <2 x double>. Expected output is a
; single movhpd from memory on i686 and an unpcklpd plus a register copy on
; x86_64.
define <2 x double> @t3(double %s, <2 x double> %tmp) nounwind {
; X32-LABEL: t3:
; X32:       # BB#0:
; X32-NEXT:    movhpd {{.*#+}} xmm0 = xmm0[0],mem[0]
; X32-NEXT:    retl
;
; X64-LABEL: t3:
; X64:       # BB#0:
; X64-NEXT:    unpcklpd {{.*#+}} xmm1 = xmm1[0],xmm0[0]
; X64-NEXT:    movapd %xmm1, %xmm0
; X64-NEXT:    retq
  %tmp1 = insertelement <2 x double> %tmp, double %s, i32 1
  ret <2 x double> %tmp1
}

; Insert a scalar i16 into lane 5 of an <8 x i16>. Expected output is a single
; pinsrw with immediate 5 on both targets (stack operand on i686, %edi on
; x86_64).
define <8 x i16> @t4(i16 %s, <8 x i16> %tmp) nounwind {
; X32-LABEL: t4:
; X32:       # BB#0:
; X32-NEXT:    pinsrw $5, {{[0-9]+}}(%esp), %xmm0
; X32-NEXT:    retl
;
; X64-LABEL: t4:
; X64:       # BB#0:
; X64-NEXT:    pinsrw $5, %edi, %xmm0
; X64-NEXT:    retq
  %tmp1 = insertelement <8 x i16> %tmp, i16 %s, i32 5
  ret <8 x i16> %tmp1
}