; RUN: llc < %s -march=x86-64 | FileCheck %s

; Codegen tests for 64-bit-lane shuffles on x86-64. Each function is anchored
; on its own assembly label so that an instruction pattern can only be
; satisfied by the function it was written for.

; Splat of element 0 of a <2 x double> (mask <0, 0>).
define <2 x double> @ld(<2 x double> %p) nounwind optsize ssp {
; CHECK-LABEL: ld:
; CHECK: unpcklpd
  %shuffle = shufflevector <2 x double> %p, <2 x double> undef, <2 x i32> zeroinitializer
  ret <2 x double> %shuffle
}

; Splat of element 1 of a <2 x double> (mask <1, 1>).
define <2 x double> @hd(<2 x double> %p) nounwind optsize ssp {
; CHECK-LABEL: hd:
; CHECK: unpckhpd
  %shuffle = shufflevector <2 x double> %p, <2 x double> undef, <2 x i32> <i32 1, i32 1>
  ret <2 x double> %shuffle
}

; Splat of element 0 of a <2 x i64> (mask <0, 0>).
define <2 x i64> @ldi(<2 x i64> %p) nounwind optsize ssp {
; CHECK-LABEL: ldi:
; CHECK: punpcklqdq
  %shuffle = shufflevector <2 x i64> %p, <2 x i64> undef, <2 x i32> zeroinitializer
  ret <2 x i64> %shuffle
}

; Splat of element 1 of a <2 x i64> (mask <1, 1>).
define <2 x i64> @hdi(<2 x i64> %p) nounwind optsize ssp {
; CHECK-LABEL: hdi:
; CHECK: punpckhqdq
  %shuffle = shufflevector <2 x i64> %p, <2 x i64> undef, <2 x i32> <i32 1, i32 1>
  ret <2 x i64> %shuffle
}

; rdar://10050549
%struct.Float2 = type { float, float }

; Two adjacent scalar float loads are inserted into lanes 0 and 1 of a vector
; and then shuffled into the upper two lanes of %vecin1. The expected code is
; a single movhps with a memory operand, with no movq emitted before it.
define <4 x float> @loadhpi(%struct.Float2* %vPtr, <4 x float> %vecin1) nounwind readonly ssp {
entry:
; CHECK-LABEL: loadhpi:
; CHECK-NOT: movq
; CHECK: movhps (
  %tmp1 = bitcast %struct.Float2* %vPtr to <1 x i64>*
  %addptr7 = getelementptr inbounds <1 x i64>* %tmp1, i64 0
  %tmp2 = bitcast <1 x i64>* %addptr7 to float*
  %tmp3 = load float* %tmp2, align 4
  %vec = insertelement <4 x float> undef, float %tmp3, i32 0
  %addptr.i12 = getelementptr inbounds float* %tmp2, i64 1
  %tmp4 = load float* %addptr.i12, align 4
  %vecin2 = insertelement <4 x float> %vec, float %tmp4, i32 1
  %shuffle = shufflevector <4 x float> %vecin1, <4 x float> %vecin2, <4 x i32> <i32 0, i32 1, i32 4, i32 5>
  ret <4 x float> %shuffle
}

; rdar://10119696
; A double loaded with align 1 is placed in lane 0 of a <2 x double>, bitcast
; to <4 x float>, and shuffled over the lower two lanes of %x. The expected
; code is a movsd from memory immediately followed by a movsd from a register.
; CHECK-LABEL: f:
define <4 x float> @f(<4 x float> %x, double* nocapture %y) nounwind uwtable readonly ssp {
entry:
  ; CHECK: movsd (%
  ; CHECK-NEXT: movsd %xmm
  %u110.i = load double* %y, align 1
  %tmp8.i = insertelement <2 x double> undef, double %u110.i, i32 0
  %tmp9.i = bitcast <2 x double> %tmp8.i to <4 x float>
  %shuffle.i = shufflevector <4 x float> %x, <4 x float> %tmp9.i, <4 x i32> <i32 4, i32 5, i32 2, i32 3>
  ret <4 x float> %shuffle.i
}