Lines Matching refs:SSE1
9 …llc < %s -mtriple=i686-unknown-unknown -mattr=+sse | FileCheck %s --check-prefixes=X86-SSE,X86-SSE1
23 ; X86-SSE1-LABEL: merge_2f64_f64_23:
24 ; X86-SSE1: # %bb.0:
25 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
26 ; X86-SSE1-NEXT: fldl 16(%eax)
27 ; X86-SSE1-NEXT: fldl 24(%eax)
28 ; X86-SSE1-NEXT: fxch %st(1)
29 ; X86-SSE1-NEXT: retl
56 ; X86-SSE1-LABEL: merge_2i64_i64_12:
57 ; X86-SSE1: # %bb.0:
58 ; X86-SSE1-NEXT: pushl %edi
59 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
60 ; X86-SSE1-NEXT: pushl %esi
61 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 12
62 ; X86-SSE1-NEXT: .cfi_offset %esi, -12
63 ; X86-SSE1-NEXT: .cfi_offset %edi, -8
64 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
65 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
66 ; X86-SSE1-NEXT: movl 8(%ecx), %edx
67 ; X86-SSE1-NEXT: movl 12(%ecx), %esi
68 ; X86-SSE1-NEXT: movl 16(%ecx), %edi
69 ; X86-SSE1-NEXT: movl 20(%ecx), %ecx
70 ; X86-SSE1-NEXT: movl %ecx, 12(%eax)
71 ; X86-SSE1-NEXT: movl %edi, 8(%eax)
72 ; X86-SSE1-NEXT: movl %esi, 4(%eax)
73 ; X86-SSE1-NEXT: movl %edx, (%eax)
74 ; X86-SSE1-NEXT: popl %esi
75 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
76 ; X86-SSE1-NEXT: popl %edi
77 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 4
78 ; X86-SSE1-NEXT: retl $4
159 ; X86-SSE1-LABEL: merge_4f32_f32_34uu:
160 ; X86-SSE1: # %bb.0:
161 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
162 ; X86-SSE1-NEXT: xorps %xmm0, %xmm0
163 ; X86-SSE1-NEXT: movlps {{.*#+}} xmm0 = mem[0,1],xmm0[2,3]
164 ; X86-SSE1-NEXT: retl
202 ; X86-SSE1-LABEL: merge_4f32_f32_34z6:
203 ; X86-SSE1: # %bb.0:
204 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
205 ; X86-SSE1-NEXT: movups 12(%eax), %xmm0
206 ; X86-SSE1-NEXT: xorps %xmm1, %xmm1
207 ; X86-SSE1-NEXT: shufps {{.*#+}} xmm1 = xmm1[2,0],xmm0[3,0]
208 ; X86-SSE1-NEXT: shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[0,2]
209 ; X86-SSE1-NEXT: retl
241 ; X86-SSE1-LABEL: merge_4f32_f32_45zz:
242 ; X86-SSE1: # %bb.0:
243 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
244 ; X86-SSE1-NEXT: xorps %xmm0, %xmm0
245 ; X86-SSE1-NEXT: movlps {{.*#+}} xmm0 = mem[0,1],xmm0[2,3]
246 ; X86-SSE1-NEXT: retl
282 ; X86-SSE1-LABEL: merge_4f32_f32_012u:
283 ; X86-SSE1: # %bb.0:
284 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
285 ; X86-SSE1-NEXT: xorps %xmm0, %xmm0
286 ; X86-SSE1-NEXT: movlps {{.*#+}} xmm0 = mem[0,1],xmm0[2,3]
287 ; X86-SSE1-NEXT: movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
288 ; X86-SSE1-NEXT: movlhps {{.*#+}} xmm0 = xmm0[0],xmm1[0]
289 ; X86-SSE1-NEXT: retl
330 ; X86-SSE1-LABEL: merge_4f32_f32_019u:
331 ; X86-SSE1: # %bb.0:
332 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
333 ; X86-SSE1-NEXT: xorps %xmm0, %xmm0
334 ; X86-SSE1-NEXT: movlps {{.*#+}} xmm0 = mem[0,1],xmm0[2,3]
335 ; X86-SSE1-NEXT: movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
336 ; X86-SSE1-NEXT: movlhps {{.*#+}} xmm0 = xmm0[0],xmm1[0]
337 ; X86-SSE1-NEXT: retl
369 ; X86-SSE1-LABEL: merge_4i32_i32_23u5:
370 ; X86-SSE1: # %bb.0:
371 ; X86-SSE1-NEXT: pushl %esi
372 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
373 ; X86-SSE1-NEXT: .cfi_offset %esi, -8
374 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
375 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
376 ; X86-SSE1-NEXT: movl 8(%ecx), %edx
377 ; X86-SSE1-NEXT: movl 12(%ecx), %esi
378 ; X86-SSE1-NEXT: movl 20(%ecx), %ecx
379 ; X86-SSE1-NEXT: movl %esi, 4(%eax)
380 ; X86-SSE1-NEXT: movl %edx, (%eax)
381 ; X86-SSE1-NEXT: movl %ecx, 12(%eax)
382 ; X86-SSE1-NEXT: popl %esi
383 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 4
384 ; X86-SSE1-NEXT: retl $4
416 ; X86-SSE1-LABEL: merge_4i32_i32_23u5_inc2:
417 ; X86-SSE1: # %bb.0:
418 ; X86-SSE1-NEXT: pushl %edi
419 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
420 ; X86-SSE1-NEXT: pushl %esi
421 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 12
422 ; X86-SSE1-NEXT: .cfi_offset %esi, -12
423 ; X86-SSE1-NEXT: .cfi_offset %edi, -8
424 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
425 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
426 ; X86-SSE1-NEXT: movl 8(%ecx), %edx
427 ; X86-SSE1-NEXT: movl 12(%ecx), %esi
428 ; X86-SSE1-NEXT: leal 1(%edx), %edi
429 ; X86-SSE1-NEXT: movl %edi, 8(%ecx)
430 ; X86-SSE1-NEXT: movl 20(%ecx), %ecx
431 ; X86-SSE1-NEXT: movl %esi, 4(%eax)
432 ; X86-SSE1-NEXT: movl %edx, (%eax)
433 ; X86-SSE1-NEXT: movl %ecx, 12(%eax)
434 ; X86-SSE1-NEXT: popl %esi
435 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
436 ; X86-SSE1-NEXT: popl %edi
437 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 4
438 ; X86-SSE1-NEXT: retl $4
473 ; X86-SSE1-LABEL: merge_4i32_i32_23u5_inc3:
474 ; X86-SSE1: # %bb.0:
475 ; X86-SSE1-NEXT: pushl %edi
476 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
477 ; X86-SSE1-NEXT: pushl %esi
478 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 12
479 ; X86-SSE1-NEXT: .cfi_offset %esi, -12
480 ; X86-SSE1-NEXT: .cfi_offset %edi, -8
481 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
482 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
483 ; X86-SSE1-NEXT: movl 8(%ecx), %edx
484 ; X86-SSE1-NEXT: movl 12(%ecx), %esi
485 ; X86-SSE1-NEXT: leal 1(%esi), %edi
486 ; X86-SSE1-NEXT: movl %edi, 12(%ecx)
487 ; X86-SSE1-NEXT: movl 20(%ecx), %ecx
488 ; X86-SSE1-NEXT: movl %esi, 4(%eax)
489 ; X86-SSE1-NEXT: movl %edx, (%eax)
490 ; X86-SSE1-NEXT: movl %ecx, 12(%eax)
491 ; X86-SSE1-NEXT: popl %esi
492 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
493 ; X86-SSE1-NEXT: popl %edi
494 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 4
495 ; X86-SSE1-NEXT: retl $4
528 ; X86-SSE1-LABEL: merge_4i32_i32_3zuu:
529 ; X86-SSE1: # %bb.0:
530 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
531 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
532 ; X86-SSE1-NEXT: movl 12(%ecx), %ecx
533 ; X86-SSE1-NEXT: movl %ecx, (%eax)
534 ; X86-SSE1-NEXT: movl $0, 4(%eax)
535 ; X86-SSE1-NEXT: retl $4
560 ; X86-SSE1-LABEL: merge_4i32_i32_34uu:
561 ; X86-SSE1: # %bb.0:
562 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
563 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
564 ; X86-SSE1-NEXT: movl 12(%ecx), %edx
565 ; X86-SSE1-NEXT: movl 16(%ecx), %ecx
566 ; X86-SSE1-NEXT: movl %ecx, 4(%eax)
567 ; X86-SSE1-NEXT: movl %edx, (%eax)
568 ; X86-SSE1-NEXT: retl $4
595 ; X86-SSE1-LABEL: merge_4i32_i32_45zz:
596 ; X86-SSE1: # %bb.0:
597 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
598 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
599 ; X86-SSE1-NEXT: movl 16(%ecx), %edx
600 ; X86-SSE1-NEXT: movl 20(%ecx), %ecx
601 ; X86-SSE1-NEXT: movl %ecx, 4(%eax)
602 ; X86-SSE1-NEXT: movl %edx, (%eax)
603 ; X86-SSE1-NEXT: movl $0, 12(%eax)
604 ; X86-SSE1-NEXT: movl $0, 8(%eax)
605 ; X86-SSE1-NEXT: retl $4
634 ; X86-SSE1-LABEL: merge_4i32_i32_45zz_inc4:
635 ; X86-SSE1: # %bb.0:
636 ; X86-SSE1-NEXT: pushl %edi
637 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
638 ; X86-SSE1-NEXT: pushl %esi
639 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 12
640 ; X86-SSE1-NEXT: .cfi_offset %esi, -12
641 ; X86-SSE1-NEXT: .cfi_offset %edi, -8
642 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
643 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
644 ; X86-SSE1-NEXT: movl 16(%ecx), %edx
645 ; X86-SSE1-NEXT: movl 20(%ecx), %esi
646 ; X86-SSE1-NEXT: leal 1(%edx), %edi
647 ; X86-SSE1-NEXT: movl %edi, 16(%ecx)
648 ; X86-SSE1-NEXT: movl %esi, 4(%eax)
649 ; X86-SSE1-NEXT: movl %edx, (%eax)
650 ; X86-SSE1-NEXT: movl $0, 12(%eax)
651 ; X86-SSE1-NEXT: movl $0, 8(%eax)
652 ; X86-SSE1-NEXT: popl %esi
653 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
654 ; X86-SSE1-NEXT: popl %edi
655 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 4
656 ; X86-SSE1-NEXT: retl $4
688 ; X86-SSE1-LABEL: merge_4i32_i32_45zz_inc5:
689 ; X86-SSE1: # %bb.0:
690 ; X86-SSE1-NEXT: pushl %edi
691 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
692 ; X86-SSE1-NEXT: pushl %esi
693 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 12
694 ; X86-SSE1-NEXT: .cfi_offset %esi, -12
695 ; X86-SSE1-NEXT: .cfi_offset %edi, -8
696 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
697 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
698 ; X86-SSE1-NEXT: movl 16(%ecx), %edx
699 ; X86-SSE1-NEXT: movl 20(%ecx), %esi
700 ; X86-SSE1-NEXT: leal 1(%esi), %edi
701 ; X86-SSE1-NEXT: movl %edi, 20(%ecx)
702 ; X86-SSE1-NEXT: movl %esi, 4(%eax)
703 ; X86-SSE1-NEXT: movl %edx, (%eax)
704 ; X86-SSE1-NEXT: movl $0, 12(%eax)
705 ; X86-SSE1-NEXT: movl $0, 8(%eax)
706 ; X86-SSE1-NEXT: popl %esi
707 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
708 ; X86-SSE1-NEXT: popl %edi
709 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 4
710 ; X86-SSE1-NEXT: retl $4
740 ; X86-SSE1-LABEL: merge_8i16_i16_23u567u9:
741 ; X86-SSE1: # %bb.0:
742 ; X86-SSE1-NEXT: pushl %edi
743 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
744 ; X86-SSE1-NEXT: pushl %esi
745 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 12
746 ; X86-SSE1-NEXT: .cfi_offset %esi, -12
747 ; X86-SSE1-NEXT: .cfi_offset %edi, -8
748 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
749 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
750 ; X86-SSE1-NEXT: movl 4(%ecx), %edx
751 ; X86-SSE1-NEXT: movl 10(%ecx), %esi
752 ; X86-SSE1-NEXT: movzwl 14(%ecx), %edi
753 ; X86-SSE1-NEXT: movzwl 18(%ecx), %ecx
754 ; X86-SSE1-NEXT: movw %di, 10(%eax)
755 ; X86-SSE1-NEXT: movw %cx, 14(%eax)
756 ; X86-SSE1-NEXT: movl %esi, 6(%eax)
757 ; X86-SSE1-NEXT: movl %edx, (%eax)
758 ; X86-SSE1-NEXT: popl %esi
759 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
760 ; X86-SSE1-NEXT: popl %edi
761 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 4
762 ; X86-SSE1-NEXT: retl $4
801 ; X86-SSE1-LABEL: merge_8i16_i16_34uuuuuu:
802 ; X86-SSE1: # %bb.0:
803 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
804 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
805 ; X86-SSE1-NEXT: movl 6(%ecx), %ecx
806 ; X86-SSE1-NEXT: movl %ecx, (%eax)
807 ; X86-SSE1-NEXT: retl $4
834 ; X86-SSE1-LABEL: merge_8i16_i16_45u7zzzz:
835 ; X86-SSE1: # %bb.0:
836 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
837 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
838 ; X86-SSE1-NEXT: movl 8(%ecx), %edx
839 ; X86-SSE1-NEXT: movzwl 14(%ecx), %ecx
840 ; X86-SSE1-NEXT: movw %cx, 6(%eax)
841 ; X86-SSE1-NEXT: movl %edx, (%eax)
842 ; X86-SSE1-NEXT: movl $0, 12(%eax)
843 ; X86-SSE1-NEXT: movl $0, 8(%eax)
844 ; X86-SSE1-NEXT: retl $4
878 ; X86-SSE1-LABEL: merge_16i8_i8_01u3456789ABCDuF:
879 ; X86-SSE1: # %bb.0:
880 ; X86-SSE1-NEXT: pushl %ebp
881 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
882 ; X86-SSE1-NEXT: pushl %ebx
883 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 12
884 ; X86-SSE1-NEXT: pushl %edi
885 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 16
886 ; X86-SSE1-NEXT: pushl %esi
887 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 20
888 ; X86-SSE1-NEXT: .cfi_offset %esi, -20
889 ; X86-SSE1-NEXT: .cfi_offset %edi, -16
890 ; X86-SSE1-NEXT: .cfi_offset %ebx, -12
891 ; X86-SSE1-NEXT: .cfi_offset %ebp, -8
892 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
893 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
894 ; X86-SSE1-NEXT: movzwl (%ecx), %ebp
895 ; X86-SSE1-NEXT: movl 3(%ecx), %esi
896 ; X86-SSE1-NEXT: movl 7(%ecx), %edi
897 ; X86-SSE1-NEXT: movzwl 11(%ecx), %ebx
898 ; X86-SSE1-NEXT: movb 13(%ecx), %dl
899 ; X86-SSE1-NEXT: movb 15(%ecx), %cl
900 ; X86-SSE1-NEXT: movb %dl, 13(%eax)
901 ; X86-SSE1-NEXT: movb %cl, 15(%eax)
902 ; X86-SSE1-NEXT: movw %bx, 11(%eax)
903 ; X86-SSE1-NEXT: movl %edi, 7(%eax)
904 ; X86-SSE1-NEXT: movl %esi, 3(%eax)
905 ; X86-SSE1-NEXT: movw %bp, (%eax)
906 ; X86-SSE1-NEXT: popl %esi
907 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 16
908 ; X86-SSE1-NEXT: popl %edi
909 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 12
910 ; X86-SSE1-NEXT: popl %ebx
911 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
912 ; X86-SSE1-NEXT: popl %ebp
913 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 4
914 ; X86-SSE1-NEXT: retl $4
977 ; X86-SSE1-LABEL: merge_16i8_i8_01u3uuzzuuuuuzzz:
978 ; X86-SSE1: # %bb.0:
979 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
980 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
981 ; X86-SSE1-NEXT: movzwl (%ecx), %edx
982 ; X86-SSE1-NEXT: movb 3(%ecx), %cl
983 ; X86-SSE1-NEXT: movb %cl, 3(%eax)
984 ; X86-SSE1-NEXT: movw %dx, (%eax)
985 ; X86-SSE1-NEXT: movb $0, 15(%eax)
986 ; X86-SSE1-NEXT: movw $0, 13(%eax)
987 ; X86-SSE1-NEXT: movw $0, 6(%eax)
988 ; X86-SSE1-NEXT: retl $4
1023 ; X86-SSE1-LABEL: merge_16i8_i8_0123uu67uuuuuzzz:
1024 ; X86-SSE1: # %bb.0:
1025 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
1026 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
1027 ; X86-SSE1-NEXT: movl (%ecx), %edx
1028 ; X86-SSE1-NEXT: movzwl 6(%ecx), %ecx
1029 ; X86-SSE1-NEXT: movw %cx, 6(%eax)
1030 ; X86-SSE1-NEXT: movl %edx, (%eax)
1031 ; X86-SSE1-NEXT: movb $0, 15(%eax)
1032 ; X86-SSE1-NEXT: movw $0, 13(%eax)
1033 ; X86-SSE1-NEXT: retl $4
1077 ; X86-SSE1-LABEL: merge_4i32_i32_combine:
1078 ; X86-SSE1: # %bb.0:
1079 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
1080 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
1081 ; X86-SSE1-NEXT: movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
1082 ; X86-SSE1-NEXT: movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
1083 ; X86-SSE1-NEXT: andps %xmm0, %xmm1
1084 ; X86-SSE1-NEXT: movaps %xmm1, (%eax)
1085 ; X86-SSE1-NEXT: retl
1123 ; X86-SSE1-LABEL: merge_2i64_i64_12_volatile:
1124 ; X86-SSE1: # %bb.0:
1125 ; X86-SSE1-NEXT: pushl %edi
1126 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
1127 ; X86-SSE1-NEXT: pushl %esi
1128 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 12
1129 ; X86-SSE1-NEXT: .cfi_offset %esi, -12
1130 ; X86-SSE1-NEXT: .cfi_offset %edi, -8
1131 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
1132 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
1133 ; X86-SSE1-NEXT: movl 8(%ecx), %edx
1134 ; X86-SSE1-NEXT: movl 12(%ecx), %esi
1135 ; X86-SSE1-NEXT: movl 16(%ecx), %edi
1136 ; X86-SSE1-NEXT: movl 20(%ecx), %ecx
1137 ; X86-SSE1-NEXT: movl %ecx, 12(%eax)
1138 ; X86-SSE1-NEXT: movl %edi, 8(%eax)
1139 ; X86-SSE1-NEXT: movl %esi, 4(%eax)
1140 ; X86-SSE1-NEXT: movl %edx, (%eax)
1141 ; X86-SSE1-NEXT: popl %esi
1142 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 8
1143 ; X86-SSE1-NEXT: popl %edi
1144 ; X86-SSE1-NEXT: .cfi_def_cfa_offset 4
1145 ; X86-SSE1-NEXT: retl $4
1189 ; X86-SSE1-LABEL: merge_4f32_f32_2345_volatile:
1190 ; X86-SSE1: # %bb.0:
1191 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
1192 ; X86-SSE1-NEXT: movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
1193 ; X86-SSE1-NEXT: movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
1194 ; X86-SSE1-NEXT: unpcklps {{.*#+}} xmm0 = xmm0[0],xmm1[0],xmm0[1],xmm1[1]
1195 ; X86-SSE1-NEXT: movhps {{.*#+}} xmm0 = xmm0[0,1],mem[0,1]
1196 ; X86-SSE1-NEXT: retl
1273 ; X86-SSE1-LABEL: load_i32_zext_i128_v4i32:
1274 ; X86-SSE1: # %bb.0:
1275 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %eax
1276 ; X86-SSE1-NEXT: movl {{[0-9]+}}(%esp), %ecx
1277 ; X86-SSE1-NEXT: movl (%ecx), %ecx
1278 ; X86-SSE1-NEXT: movl %ecx, (%eax)
1279 ; X86-SSE1-NEXT: movl $0, 12(%eax)
1280 ; X86-SSE1-NEXT: movl $0, 8(%eax)
1281 ; X86-SSE1-NEXT: movl $0, 4(%eax)
1282 ; X86-SSE1-NEXT: retl $4