• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
2; RUN: opt -loop-idiom -S %s | FileCheck %s
3
; Nested-loop case: the outer loop (loop.0) loads a float* from %ptr and then,
; depending on %c, runs one of two 100-iteration inner loops that store 0.0
; through that pointer.
; The assertions below expect loop.1's store to be replaced by a memset of
; length 400 in loop.1.preheader, whose destination is an i8* bitcast placed
; right after the load in loop.0. loop.2, which additionally reloads %ptr and
; reads through the reloaded pointer, is expected to keep its store.
4define void @reuse_cast_1(float** %ptr, i1 %c) {
5; CHECK-LABEL: @reuse_cast_1(
6; CHECK-NEXT:  entry:
7; CHECK-NEXT:    br label [[LOOP_0:%.*]]
8; CHECK:       loop.0:
9; CHECK-NEXT:    [[TMP:%.*]] = load float*, float** [[PTR:%.*]], align 8
10; CHECK-NEXT:    [[TMP2:%.*]] = bitcast float* [[TMP]] to i8*
11; CHECK-NEXT:    br i1 [[C:%.*]], label [[LOOP_2_PREHEADER:%.*]], label [[LOOP_1_PREHEADER:%.*]]
12; CHECK:       loop.1.preheader:
13; CHECK-NEXT:    call void @llvm.memset.p0i8.i64(i8* align 4 [[TMP2]], i8 0, i64 400, i1 false)
14; CHECK-NEXT:    br label [[LOOP_1:%.*]]
15; CHECK:       loop.2.preheader:
16; CHECK-NEXT:    br label [[LOOP_2:%.*]]
17; CHECK:       loop.1:
18; CHECK-NEXT:    [[IV_1:%.*]] = phi i64 [ [[IV_1_NEXT:%.*]], [[LOOP_1]] ], [ 0, [[LOOP_1_PREHEADER]] ]
19; CHECK-NEXT:    [[TMP4:%.*]] = getelementptr inbounds float, float* [[TMP]], i64 [[IV_1]]
20; CHECK-NEXT:    [[IV_1_NEXT]] = add nuw nsw i64 [[IV_1]], 1
21; CHECK-NEXT:    [[C_1:%.*]] = icmp ne i64 [[IV_1_NEXT]], 100
22; CHECK-NEXT:    br i1 [[C_1]], label [[LOOP_1]], label [[LOOP_0_LATCH_LOOPEXIT1:%.*]]
23; CHECK:       loop.2:
24; CHECK-NEXT:    [[IV_2:%.*]] = phi i64 [ [[IV_2_NEXT:%.*]], [[LOOP_2]] ], [ 0, [[LOOP_2_PREHEADER]] ]
25; CHECK-NEXT:    [[TMP10:%.*]] = getelementptr inbounds float, float* [[TMP]], i64 [[IV_2]]
26; CHECK-NEXT:    store float 0.000000e+00, float* [[TMP10]], align 4
27; CHECK-NEXT:    [[TMP11:%.*]] = load float*, float** [[PTR]], align 8
28; CHECK-NEXT:    [[TMP12:%.*]] = getelementptr inbounds float, float* [[TMP11]], i64 [[IV_2]]
29; CHECK-NEXT:    [[TMP13:%.*]] = load float, float* [[TMP12]], align 4
30; CHECK-NEXT:    [[IV_2_NEXT]] = add nuw nsw i64 [[IV_2]], 1
31; CHECK-NEXT:    [[C_2:%.*]] = icmp ne i64 [[IV_2_NEXT]], 100
32; CHECK-NEXT:    br i1 [[C_2]], label [[LOOP_2]], label [[LOOP_0_LATCH_LOOPEXIT:%.*]]
33; CHECK:       loop.0.latch.loopexit:
34; CHECK-NEXT:    br label [[LOOP_0_LATCH:%.*]]
35; CHECK:       loop.0.latch.loopexit1:
36; CHECK-NEXT:    br label [[LOOP_0_LATCH]]
37; CHECK:       loop.0.latch:
38; CHECK-NEXT:    [[C_0:%.*]] = call i1 @cond()
39; CHECK-NEXT:    br i1 [[C_0]], label [[LOOP_0]], label [[END:%.*]]
40; CHECK:       end:
41; CHECK-NEXT:    ret void
42;
43entry:
44  br label %loop.0
45
  ; Outer loop header: %tmp is the base pointer shared by both inner loops.
46loop.0:                                           ; preds = %loop.0.latch, %entry
47  %tmp = load float*, float** %ptr, align 8
48  br i1 %c, label %loop.2, label %loop.1
49
  ; Inner loop 1: stores 0.0 to %tmp[0..99] and does nothing else; this is the
  ; store the expected output replaces with the memset.
50loop.1:                                           ; preds = %loop.1, %loop.0
51  %iv.1 = phi i64 [ %iv.1.next, %loop.1 ], [ 0, %loop.0 ]
52  %tmp4 = getelementptr inbounds float, float* %tmp, i64 %iv.1
53  store float 0.000000e+00, float* %tmp4, align 4
54  %iv.1.next = add nuw nsw i64 %iv.1, 1
55  %c.1 = icmp ne i64 %iv.1.next, 100
56  br i1 %c.1, label %loop.1, label %loop.0.latch
57
  ; Inner loop 2: same zero store, followed by a reload of %ptr and a float
  ; load through the reloaded pointer at the same index. The expected output
  ; leaves this loop's store in place.
  ; NOTE(review): presumably the in-loop loads are what prevent the memset
  ; transformation here -- confirm against the pass.
58loop.2:                                           ; preds = %loop.2, %loop.0
59  %iv.2 = phi i64 [ %iv.2.next, %loop.2 ], [ 0, %loop.0 ]
60  %tmp10 = getelementptr inbounds float, float* %tmp, i64 %iv.2
61  store float 0.000000e+00, float* %tmp10, align 4
62  %tmp11 = load float*, float** %ptr, align 8
63  %tmp12 = getelementptr inbounds float, float* %tmp11, i64 %iv.2
64  %tmp13 = load float, float* %tmp12, align 4
65  %iv.2.next = add nuw nsw i64 %iv.2, 1
66  %c.2 = icmp ne i64 %iv.2.next, 100
67  br i1 %c.2, label %loop.2, label %loop.0.latch
68
  ; Outer loop latch: repeats the outer loop while @cond() returns true.
69loop.0.latch:                                     ; preds = %loop.2, %loop.1
70  %c.0 = call i1 @cond()
71  br i1 %c.0, label %loop.0, label %end
72
73end:                                              ; preds = %loop.0.latch
74  ret void
75}
76
; External declaration; called in loop.0.latch of @reuse_cast_1 to decide
; whether the outer loop runs again.
77declare i1 @cond()
78
; External declaration; called in the entry block of @reuse_cast_2 with
; %cast.to.reuse.
79declare void @use.i8(i8*)
80
; External declaration; called in the exit block of @reuse_cast_2 with %c.0.
81declare void @use.i1(i1)
82
; Copy loop from %ptr.1.start into a [2 x i32] stack array that already has an
; i8* bitcast (%cast.to.reuse) in the entry block. The loop body runs for
; %iv = 0 and %iv = 1, i.e. it copies two i32 values.
; The assertions below expect the load/store pair to become a memcpy of length
; 8 placed before the branch into the loop. Its destination is a new bitcast
; ([[STACK1]]) inserted directly after the alloca and its source is a new
; bitcast of %ptr.1.start at the top of entry; the pre-existing %cast.to.reuse
; is kept but is not the memcpy operand. The load remains in the loop and the
; store is gone.
83define void @reuse_cast_2(i32 %x, i32* %ptr.1.start) {
84; CHECK-LABEL: @reuse_cast_2(
85; CHECK-NEXT:  entry:
86; CHECK-NEXT:    [[PTR_1_START2:%.*]] = bitcast i32* [[PTR_1_START:%.*]] to i8*
87; CHECK-NEXT:    [[STACK:%.*]] = alloca [2 x i32], align 4
88; CHECK-NEXT:    [[STACK1:%.*]] = bitcast [2 x i32]* [[STACK]] to i8*
89; CHECK-NEXT:    [[C_0:%.*]] = icmp sgt i32 [[X:%.*]], 0
90; CHECK-NEXT:    [[CAST_TO_REUSE:%.*]] = bitcast [2 x i32]* [[STACK]] to i8*
91; CHECK-NEXT:    [[PTR_2_START:%.*]] = getelementptr inbounds [2 x i32], [2 x i32]* [[STACK]], i64 0, i64 0
92; CHECK-NEXT:    call void @use.i8(i8* [[CAST_TO_REUSE]])
93; CHECK-NEXT:    call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 4 [[STACK1]], i8* align 4 [[PTR_1_START2]], i64 8, i1 false)
94; CHECK-NEXT:    br label [[LOOP:%.*]]
95; CHECK:       loop:
96; CHECK-NEXT:    [[IV:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[IV_NEXT:%.*]], [[LOOP]] ]
97; CHECK-NEXT:    [[PTR_1:%.*]] = phi i32* [ [[PTR_1_START]], [[ENTRY]] ], [ [[PTR_1_NEXT:%.*]], [[LOOP]] ]
98; CHECK-NEXT:    [[PTR_2:%.*]] = phi i32* [ [[PTR_2_START]], [[ENTRY]] ], [ [[PTR_2_NEXT:%.*]], [[LOOP]] ]
99; CHECK-NEXT:    [[PTR_1_NEXT]] = getelementptr inbounds i32, i32* [[PTR_1]], i64 1
100; CHECK-NEXT:    [[LV:%.*]] = load i32, i32* [[PTR_1]], align 4
101; CHECK-NEXT:    [[PTR_2_NEXT]] = getelementptr inbounds i32, i32* [[PTR_2]], i64 1
102; CHECK-NEXT:    [[IV_NEXT]] = add nuw nsw i32 [[IV]], 1
103; CHECK-NEXT:    [[C_1:%.*]] = icmp eq i32 [[IV]], 0
104; CHECK-NEXT:    br i1 [[C_1]], label [[LOOP]], label [[EXIT:%.*]]
105; CHECK:       exit:
106; CHECK-NEXT:    call void @use.i1(i1 [[C_0]])
107; CHECK-NEXT:    ret void
108;
  ; Entry: %cast.to.reuse is an existing i8* view of %stack that sits after the
  ; unrelated %c.0 compare; it is passed to @use.i8 before the loop.
109entry:
110  %stack = alloca [2 x i32], align 4
111  %c.0 = icmp sgt i32 %x, 0
112  %cast.to.reuse = bitcast [2 x i32]* %stack to i8*
113  %ptr.2.start = getelementptr inbounds [2 x i32], [2 x i32]* %stack, i64 0, i64 0
114  call void @use.i8(i8* %cast.to.reuse)
115  br label %loop
116
  ; Loop: copies *%ptr.1 to *%ptr.2 and advances both pointers by one i32.
  ; The back edge is taken only while %iv == 0, so the body executes twice.
117loop:                                             ; preds = %loop, %entry
118  %iv = phi i32 [ 0, %entry ], [ %iv.next, %loop ]
119  %ptr.1 = phi i32* [ %ptr.1.start, %entry ], [ %ptr.1.next, %loop ]
120  %ptr.2 = phi i32* [ %ptr.2.start, %entry ], [ %ptr.2.next, %loop ]
121  %ptr.1.next = getelementptr inbounds i32, i32* %ptr.1, i64 1
122  %lv = load i32, i32* %ptr.1, align 4
123  %ptr.2.next = getelementptr inbounds i32, i32* %ptr.2, i64 1
124  store i32 %lv, i32* %ptr.2, align 4
125  %iv.next = add nuw nsw i32 %iv, 1
126  %c.1 = icmp eq i32 %iv, 0
127  br i1 %c.1, label %loop, label %exit
128
  ; Exit: uses %c.0 so the compare in entry stays live.
129exit:                                             ; preds = %loop
130  call void @use.i1(i1 %c.0)
131  ret void
132}
133