; ModuleID = '<stdin>'
; Three 1536x1536 float matrices (@A, @B, @C) with:
;   @init_array  - fills @A and @B,
;   @print_array - dumps @C to stdout,
;   @main        - zeroes @C, then accumulates A*B into it with a 64-step
;                  blocked loop nest whose inner body works on <4 x float>.
source_filename = "matmul.c"
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
target triple = "x86_64-unknown-linux-gnu"

%struct._IO_FILE = type { i32, i8*, i8*, i8*, i8*, i8*, i8*, i8*, i8*, i8*, i8*, i8*, %struct._IO_marker*, %struct._IO_FILE*, i32, i32, i64, i16, i8, [1 x i8], i8*, i64, i8*, i8*, i8*, i8*, i64, i32, [20 x i8] }
%struct._IO_marker = type { %struct._IO_marker*, %struct._IO_FILE*, i32 }

@A = common dso_local local_unnamed_addr global [1536 x [1536 x float]] zeroinitializer, align 16
@B = common dso_local local_unnamed_addr global [1536 x [1536 x float]] zeroinitializer, align 16
@stdout = external dso_local local_unnamed_addr global %struct._IO_FILE*, align 8
@.str = private unnamed_addr constant [5 x i8] c"%lf \00", align 1
@C = common dso_local local_unnamed_addr global [1536 x [1536 x float]] zeroinitializer, align 16

; init_array: writes the same value to @A[i][j] and @B[i][j] for every
; i, j in [0, 1536). The inner (column) loop is unrolled by two:
;   even j: value = float(double(((i*j) & 1022) | 1) * 0.5)
;   odd  j: value = float(double(((i*j) & 1023) + 1) * 0.5)
; Takes no arguments and returns nothing.
; Function Attrs: noinline norecurse nounwind uwtable writeonly
define dso_local void @init_array() local_unnamed_addr #0 {
entry:
  br label %polly.loop_header

polly.exiting:                                    ; preds = %polly.loop_exit3
  ret void

; Outer loop over the row index i (%polly.indvar), 0..1535.
polly.loop_header:                                ; preds = %polly.loop_exit3, %entry
  %polly.indvar = phi i64 [ 0, %entry ], [ %polly.indvar_next, %polly.loop_exit3 ]
  %0 = trunc i64 %polly.indvar to i32
  br label %polly.loop_header1

polly.loop_exit3:                                 ; preds = %polly.loop_header1
  %polly.indvar_next = add nuw nsw i64 %polly.indvar, 1
  %exitcond1 = icmp eq i64 %polly.indvar_next, 1536
  br i1 %exitcond1, label %polly.exiting, label %polly.loop_header

; Inner loop over the column index j (%polly.indvar4), stepping by 2.
polly.loop_header1:                               ; preds = %polly.loop_header1, %polly.loop_header
  %polly.indvar4 = phi i64 [ 0, %polly.loop_header ], [ %polly.indvar_next5.1, %polly.loop_header1 ]
  ; First half of the unrolled body: column j (always even, starts at 0 and steps by 2).
  %1 = trunc i64 %polly.indvar4 to i32
  %2 = mul nuw nsw i32 %1, %0
  %3 = and i32 %2, 1022
  %4 = or i32 %3, 1
  %p_conv = sitofp i32 %4 to double
  %p_div = fmul double %p_conv, 5.000000e-01
  %p_conv4 = fptrunc double %p_div to float
  %scevgep7 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @A, i64 0, i64 %polly.indvar, i64 %polly.indvar4
  store float %p_conv4, float* %scevgep7, align 8, !alias.scope !2, !noalias !4
  %scevgep9 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar, i64 %polly.indvar4
  store float %p_conv4, float* %scevgep9, align 8, !alias.scope !5, !noalias !6
  ; Second half: column j|1. Because j is even, the `or` yields j+1.
  %polly.indvar_next5 = or i64 %polly.indvar4, 1
  %5 = trunc i64 %polly.indvar_next5 to i32
  %6 = mul nuw nsw i32 %5, %0
  %7 = and i32 %6, 1023
  %8 = add nuw nsw i32 %7, 1
  %p_conv.1 = sitofp i32 %8 to double
  %p_div.1 = fmul double %p_conv.1, 5.000000e-01
  %p_conv4.1 = fptrunc double %p_div.1 to float
  %scevgep7.1 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @A, i64 0, i64 %polly.indvar, i64 %polly.indvar_next5
  store float %p_conv4.1, float* %scevgep7.1, align 4, !alias.scope !2, !noalias !4
  %scevgep9.1 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar, i64 %polly.indvar_next5
  store float %p_conv4.1, float* %scevgep9.1, align 4, !alias.scope !5, !noalias !6
  %polly.indvar_next5.1 = add nuw nsw i64 %polly.indvar4, 2
  %exitcond.1 = icmp eq i64 %polly.indvar_next5.1, 1536
  br i1 %exitcond.1, label %polly.loop_exit3, label %polly.loop_header1
}

; print_array: for each row of @C, prints every element with the "%lf "
; format to the stream loaded from @stdout. A newline character (10) is
; written after every column whose index modulo 80 equals 79, and once
; more at the end of each row. Takes no arguments and returns nothing.
; Function Attrs: noinline nounwind uwtable
define dso_local void @print_array() local_unnamed_addr #1 {
entry:
  br label %for.cond1.preheader

; Row loop (%indvars.iv6), 0..1535.
for.cond1.preheader:                              ; preds = %for.end, %entry
  %indvars.iv6 = phi i64 [ 0, %entry ], [ %indvars.iv.next7, %for.end ]
  %0 = load %struct._IO_FILE*, %struct._IO_FILE** @stdout, align 8
  br label %for.body3

; Column loop (%indvars.iv), 0..1535. %1 carries the most recently loaded @stdout value.
for.body3:                                        ; preds = %for.inc, %for.cond1.preheader
  %indvars.iv = phi i64 [ 0, %for.cond1.preheader ], [ %indvars.iv.next, %for.inc ]
  %1 = phi %struct._IO_FILE* [ %0, %for.cond1.preheader ], [ %5, %for.inc ]
  %arrayidx5 = getelementptr inbounds [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %indvars.iv6, i64 %indvars.iv
  %2 = load float, float* %arrayidx5, align 4
  %conv = fpext float %2 to double
  %call = tail call i32 (%struct._IO_FILE*, i8*, ...) @fprintf(%struct._IO_FILE* %1, i8* getelementptr inbounds ([5 x i8], [5 x i8]* @.str, i64 0, i64 0), double %conv) #4
  %3 = trunc i64 %indvars.iv to i32
  %rem = urem i32 %3, 80
  %cmp6 = icmp eq i32 %rem, 79
  br i1 %cmp6, label %if.then, label %for.inc

; Line break after every 80th column.
if.then:                                          ; preds = %for.body3
  %4 = load %struct._IO_FILE*, %struct._IO_FILE** @stdout, align 8
  %fputc3 = tail call i32 @fputc(i32 10, %struct._IO_FILE* %4)
  br label %for.inc

for.inc:                                          ; preds = %if.then, %for.body3
  %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
  %5 = load %struct._IO_FILE*, %struct._IO_FILE** @stdout, align 8
  %exitcond = icmp eq i64 %indvars.iv.next, 1536
  br i1 %exitcond, label %for.end, label %for.body3

; End of row: emit a newline and advance to the next row.
for.end:                                          ; preds = %for.inc
  %fputc = tail call i32 @fputc(i32 10, %struct._IO_FILE* %5)
  %indvars.iv.next7 = add nuw nsw i64 %indvars.iv6, 1
  %exitcond8 = icmp eq i64 %indvars.iv.next7, 1536
  br i1 %exitcond8, label %for.end12, label %for.cond1.preheader

for.end12:                                        ; preds = %for.end
  ret void
}

; Function Attrs: nounwind
declare dso_local i32 @fprintf(%struct._IO_FILE* nocapture, i8* nocapture readonly, ...) local_unnamed_addr #2

; main: calls @init_array, zeroes all 9437184 bytes (1536*1536*4) of @C,
; then accumulates C[i][j] += A[i][k] * B[k][j] using five nested loops:
;   %polly.indvar11 - first row of the current 64-row block      (step 64)
;   %polly.indvar17 - first column of the current 64-col block   (step 64)
;   %polly.indvar23 - first k of the current 64-wide k block     (step 64)
;   %polly.indvar29 - row i inside the row block                 (step 1)
;   %polly.indvar35 - k inside the k block                       (step 1)
; The 64 columns of a block are handled as sixteen <4 x float> accumulators
; kept in SSA values across the innermost loop. Always returns 0.
; This function does not call @print_array.
; Function Attrs: noinline norecurse nounwind uwtable
define dso_local i32 @main() local_unnamed_addr #3 {
entry:
  tail call void @init_array()
  call void @llvm.memset.p0i8.i64(i8* align 16 bitcast ([1536 x [1536 x float]]* @C to i8*), i8 0, i64 9437184, i1 false)
  br label %polly.loop_header8

polly.exiting:                                    ; preds = %polly.loop_exit16
  ret i32 0

; Row-block loop. %indvars.iv4 is the exclusive upper row bound (block start + 64).
polly.loop_header8:                               ; preds = %entry, %polly.loop_exit16
  %indvars.iv4 = phi i64 [ 64, %entry ], [ %indvars.iv.next5, %polly.loop_exit16 ]
  %polly.indvar11 = phi i64 [ 0, %entry ], [ %polly.indvar_next12, %polly.loop_exit16 ]
  br label %polly.loop_header14

polly.loop_exit16:                                ; preds = %polly.loop_exit22
  %polly.indvar_next12 = add nuw nsw i64 %polly.indvar11, 64
  %polly.loop_cond13 = icmp ult i64 %polly.indvar_next12, 1536
  %indvars.iv.next5 = add nuw nsw i64 %indvars.iv4, 64
  br i1 %polly.loop_cond13, label %polly.loop_header8, label %polly.exiting

; Column-block loop. %polly.indvar17 starts at 0 and steps by 64, so each
; `or` with 4, 8, ..., 60 below yields block start + that offset.
polly.loop_header14:                              ; preds = %polly.loop_header8, %polly.loop_exit22
  %polly.indvar17 = phi i64 [ 0, %polly.loop_header8 ], [ %polly.indvar_next18, %polly.loop_exit22 ]
  %offset.idx.1 = or i64 %polly.indvar17, 4
  %offset.idx.2 = or i64 %polly.indvar17, 8
  %offset.idx.3 = or i64 %polly.indvar17, 12
  %offset.idx.4 = or i64 %polly.indvar17, 16
  %offset.idx.5 = or i64 %polly.indvar17, 20
  %offset.idx.6 = or i64 %polly.indvar17, 24
  %offset.idx.7 = or i64 %polly.indvar17, 28
  %offset.idx.8 = or i64 %polly.indvar17, 32
  %offset.idx.9 = or i64 %polly.indvar17, 36
  %offset.idx.10 = or i64 %polly.indvar17, 40
  %offset.idx.11 = or i64 %polly.indvar17, 44
  %offset.idx.12 = or i64 %polly.indvar17, 48
  %offset.idx.13 = or i64 %polly.indvar17, 52
  %offset.idx.14 = or i64 %polly.indvar17, 56
  %offset.idx.15 = or i64 %polly.indvar17, 60
  br label %polly.loop_header20

polly.loop_exit22:                                ; preds = %polly.loop_exit28
  %polly.indvar_next18 = add nuw nsw i64 %polly.indvar17, 64
  %polly.loop_cond19 = icmp ult i64 %polly.indvar_next18, 1536
  br i1 %polly.loop_cond19, label %polly.loop_header14, label %polly.loop_exit16

; k-block loop. %indvars.iv1 is the exclusive upper k bound (block start + 64).
polly.loop_header20:                              ; preds = %polly.loop_header14, %polly.loop_exit28
  %indvars.iv1 = phi i64 [ 64, %polly.loop_header14 ], [ %indvars.iv.next2, %polly.loop_exit28 ]
  %polly.indvar23 = phi i64 [ 0, %polly.loop_header14 ], [ %polly.indvar_next24, %polly.loop_exit28 ]
  br label %polly.loop_header26

polly.loop_exit28:                                ; preds = %polly.loop_exit34
  %polly.indvar_next24 = add nuw nsw i64 %polly.indvar23, 64
  %polly.loop_cond25 = icmp ult i64 %polly.indvar_next24, 1536
  %indvars.iv.next2 = add nuw nsw i64 %indvars.iv1, 64
  br i1 %polly.loop_cond25, label %polly.loop_header20, label %polly.loop_exit22

; Row loop inside the row block. Computes the sixteen vector addresses
; covering C[i][col .. col+63] and loads them as the initial accumulators.
polly.loop_header26:                              ; preds = %polly.loop_exit34, %polly.loop_header20
  %polly.indvar29 = phi i64 [ %polly.indvar11, %polly.loop_header20 ], [ %polly.indvar_next30, %polly.loop_exit34 ]
  %0 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %polly.indvar17
  %1 = bitcast float* %0 to <4 x float>*
  %2 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %offset.idx.1
  %3 = bitcast float* %2 to <4 x float>*
  %4 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %offset.idx.2
  %5 = bitcast float* %4 to <4 x float>*
  %6 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %offset.idx.3
  %7 = bitcast float* %6 to <4 x float>*
  %8 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %offset.idx.4
  %9 = bitcast float* %8 to <4 x float>*
  %10 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %offset.idx.5
  %11 = bitcast float* %10 to <4 x float>*
  %12 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %offset.idx.6
  %13 = bitcast float* %12 to <4 x float>*
  %14 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %offset.idx.7
  %15 = bitcast float* %14 to <4 x float>*
  %16 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %offset.idx.8
  %17 = bitcast float* %16 to <4 x float>*
  %18 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %offset.idx.9
  %19 = bitcast float* %18 to <4 x float>*
  %20 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %offset.idx.10
  %21 = bitcast float* %20 to <4 x float>*
  %22 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %offset.idx.11
  %23 = bitcast float* %22 to <4 x float>*
  %24 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %offset.idx.12
  %25 = bitcast float* %24 to <4 x float>*
  %26 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %offset.idx.13
  %27 = bitcast float* %26 to <4 x float>*
  %28 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %offset.idx.14
  %29 = bitcast float* %28 to <4 x float>*
  %30 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @C, i64 0, i64 %polly.indvar29, i64 %offset.idx.15
  %31 = bitcast float* %30 to <4 x float>*
  %.promoted = load <4 x float>, <4 x float>* %1, align 16, !alias.scope !7, !noalias !9
  %.promoted14 = load <4 x float>, <4 x float>* %3, align 16, !alias.scope !7, !noalias !9
  %.promoted17 = load <4 x float>, <4 x float>* %5, align 16, !alias.scope !7, !noalias !9
  %.promoted20 = load <4 x float>, <4 x float>* %7, align 16, !alias.scope !7, !noalias !9
  %.promoted23 = load <4 x float>, <4 x float>* %9, align 16, !alias.scope !7, !noalias !9
  %.promoted26 = load <4 x float>, <4 x float>* %11, align 16, !alias.scope !7, !noalias !9
  %.promoted29 = load <4 x float>, <4 x float>* %13, align 16, !alias.scope !7, !noalias !9
  %.promoted32 = load <4 x float>, <4 x float>* %15, align 16, !alias.scope !7, !noalias !9
  %.promoted35 = load <4 x float>, <4 x float>* %17, align 16, !alias.scope !7, !noalias !9
  %.promoted38 = load <4 x float>, <4 x float>* %19, align 16, !alias.scope !7, !noalias !9
  %.promoted41 = load <4 x float>, <4 x float>* %21, align 16, !alias.scope !7, !noalias !9
  %.promoted44 = load <4 x float>, <4 x float>* %23, align 16, !alias.scope !7, !noalias !9
  %.promoted47 = load <4 x float>, <4 x float>* %25, align 16, !alias.scope !7, !noalias !9
  %.promoted50 = load <4 x float>, <4 x float>* %27, align 16, !alias.scope !7, !noalias !9
  %.promoted53 = load <4 x float>, <4 x float>* %29, align 16, !alias.scope !7, !noalias !9
  %.promoted56 = load <4 x float>, <4 x float>* %31, align 16, !alias.scope !7, !noalias !9
  br label %vector.ph

; After the k loop: write the sixteen accumulators back to row i of @C,
; then advance to the next row of the row block.
polly.loop_exit34:                                ; preds = %vector.ph
  store <4 x float> %35, <4 x float>* %1, align 16, !alias.scope !7, !noalias !9
  store <4 x float> %39, <4 x float>* %3, align 16, !alias.scope !7, !noalias !9
  store <4 x float> %43, <4 x float>* %5, align 16, !alias.scope !7, !noalias !9
  store <4 x float> %47, <4 x float>* %7, align 16, !alias.scope !7, !noalias !9
  store <4 x float> %51, <4 x float>* %9, align 16, !alias.scope !7, !noalias !9
  store <4 x float> %55, <4 x float>* %11, align 16, !alias.scope !7, !noalias !9
  store <4 x float> %59, <4 x float>* %13, align 16, !alias.scope !7, !noalias !9
  store <4 x float> %63, <4 x float>* %15, align 16, !alias.scope !7, !noalias !9
  store <4 x float> %67, <4 x float>* %17, align 16, !alias.scope !7, !noalias !9
  store <4 x float> %71, <4 x float>* %19, align 16, !alias.scope !7, !noalias !9
  store <4 x float> %75, <4 x float>* %21, align 16, !alias.scope !7, !noalias !9
  store <4 x float> %79, <4 x float>* %23, align 16, !alias.scope !7, !noalias !9
  store <4 x float> %83, <4 x float>* %25, align 16, !alias.scope !7, !noalias !9
  store <4 x float> %87, <4 x float>* %27, align 16, !alias.scope !7, !noalias !9
  store <4 x float> %91, <4 x float>* %29, align 16, !alias.scope !7, !noalias !9
  store <4 x float> %95, <4 x float>* %31, align 16, !alias.scope !7, !noalias !9
  %polly.indvar_next30 = add nuw nsw i64 %polly.indvar29, 1
  %exitcond6 = icmp eq i64 %polly.indvar_next30, %indvars.iv4
  br i1 %exitcond6, label %polly.loop_exit28, label %polly.loop_header26

; Innermost k loop. Each iteration loads the scalar A[i][k], splats it
; across a <4 x float>, and for each of the sixteen column groups computes
; accumulator += splat * B[k][group]. The phis carry the accumulators.
vector.ph:                                        ; preds = %polly.loop_header26, %vector.ph
  %wide.load.1557 = phi <4 x float> [ %.promoted56, %polly.loop_header26 ], [ %95, %vector.ph ]
  %wide.load.1454 = phi <4 x float> [ %.promoted53, %polly.loop_header26 ], [ %91, %vector.ph ]
  %wide.load.1351 = phi <4 x float> [ %.promoted50, %polly.loop_header26 ], [ %87, %vector.ph ]
  %wide.load.1248 = phi <4 x float> [ %.promoted47, %polly.loop_header26 ], [ %83, %vector.ph ]
  %wide.load.1145 = phi <4 x float> [ %.promoted44, %polly.loop_header26 ], [ %79, %vector.ph ]
  %wide.load.1042 = phi <4 x float> [ %.promoted41, %polly.loop_header26 ], [ %75, %vector.ph ]
  %wide.load.939 = phi <4 x float> [ %.promoted38, %polly.loop_header26 ], [ %71, %vector.ph ]
  %wide.load.836 = phi <4 x float> [ %.promoted35, %polly.loop_header26 ], [ %67, %vector.ph ]
  %wide.load.733 = phi <4 x float> [ %.promoted32, %polly.loop_header26 ], [ %63, %vector.ph ]
  %wide.load.630 = phi <4 x float> [ %.promoted29, %polly.loop_header26 ], [ %59, %vector.ph ]
  %wide.load.527 = phi <4 x float> [ %.promoted26, %polly.loop_header26 ], [ %55, %vector.ph ]
  %wide.load.424 = phi <4 x float> [ %.promoted23, %polly.loop_header26 ], [ %51, %vector.ph ]
  %wide.load.321 = phi <4 x float> [ %.promoted20, %polly.loop_header26 ], [ %47, %vector.ph ]
  %wide.load.218 = phi <4 x float> [ %.promoted17, %polly.loop_header26 ], [ %43, %vector.ph ]
  %wide.load.115 = phi <4 x float> [ %.promoted14, %polly.loop_header26 ], [ %39, %vector.ph ]
  %wide.load13 = phi <4 x float> [ %.promoted, %polly.loop_header26 ], [ %35, %vector.ph ]
  %polly.indvar35 = phi i64 [ %polly.indvar23, %polly.loop_header26 ], [ %polly.indvar_next36, %vector.ph ]
  ; Load A[i][k] and broadcast it to all four lanes.
  %scevgep47 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @A, i64 0, i64 %polly.indvar29, i64 %polly.indvar35
  %_p_scalar_48 = load float, float* %scevgep47, align 4, !alias.scope !10, !noalias !12
  %broadcast.splatinsert11 = insertelement <4 x float> undef, float %_p_scalar_48, i32 0
  %broadcast.splat12 = shufflevector <4 x float> %broadcast.splatinsert11, <4 x float> undef, <4 x i32> zeroinitializer
  ; Sixteen multiply-accumulate steps, one per 4-column group of B[k][...].
  %32 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %polly.indvar17
  %33 = bitcast float* %32 to <4 x float>*
  %wide.load10 = load <4 x float>, <4 x float>* %33, align 16, !alias.scope !11, !noalias !13
  %34 = fmul <4 x float> %broadcast.splat12, %wide.load10
  %35 = fadd <4 x float> %wide.load13, %34
  %36 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %offset.idx.1
  %37 = bitcast float* %36 to <4 x float>*
  %wide.load10.1 = load <4 x float>, <4 x float>* %37, align 16, !alias.scope !11, !noalias !13
  %38 = fmul <4 x float> %broadcast.splat12, %wide.load10.1
  %39 = fadd <4 x float> %wide.load.115, %38
  %40 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %offset.idx.2
  %41 = bitcast float* %40 to <4 x float>*
  %wide.load10.2 = load <4 x float>, <4 x float>* %41, align 16, !alias.scope !11, !noalias !13
  %42 = fmul <4 x float> %broadcast.splat12, %wide.load10.2
  %43 = fadd <4 x float> %wide.load.218, %42
  %44 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %offset.idx.3
  %45 = bitcast float* %44 to <4 x float>*
  %wide.load10.3 = load <4 x float>, <4 x float>* %45, align 16, !alias.scope !11, !noalias !13
  %46 = fmul <4 x float> %broadcast.splat12, %wide.load10.3
  %47 = fadd <4 x float> %wide.load.321, %46
  %48 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %offset.idx.4
  %49 = bitcast float* %48 to <4 x float>*
  %wide.load10.4 = load <4 x float>, <4 x float>* %49, align 16, !alias.scope !11, !noalias !13
  %50 = fmul <4 x float> %broadcast.splat12, %wide.load10.4
  %51 = fadd <4 x float> %wide.load.424, %50
  %52 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %offset.idx.5
  %53 = bitcast float* %52 to <4 x float>*
  %wide.load10.5 = load <4 x float>, <4 x float>* %53, align 16, !alias.scope !11, !noalias !13
  %54 = fmul <4 x float> %broadcast.splat12, %wide.load10.5
  %55 = fadd <4 x float> %wide.load.527, %54
  %56 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %offset.idx.6
  %57 = bitcast float* %56 to <4 x float>*
  %wide.load10.6 = load <4 x float>, <4 x float>* %57, align 16, !alias.scope !11, !noalias !13
  %58 = fmul <4 x float> %broadcast.splat12, %wide.load10.6
  %59 = fadd <4 x float> %wide.load.630, %58
  %60 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %offset.idx.7
  %61 = bitcast float* %60 to <4 x float>*
  %wide.load10.7 = load <4 x float>, <4 x float>* %61, align 16, !alias.scope !11, !noalias !13
  %62 = fmul <4 x float> %broadcast.splat12, %wide.load10.7
  %63 = fadd <4 x float> %wide.load.733, %62
  %64 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %offset.idx.8
  %65 = bitcast float* %64 to <4 x float>*
  %wide.load10.8 = load <4 x float>, <4 x float>* %65, align 16, !alias.scope !11, !noalias !13
  %66 = fmul <4 x float> %broadcast.splat12, %wide.load10.8
  %67 = fadd <4 x float> %wide.load.836, %66
  %68 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %offset.idx.9
  %69 = bitcast float* %68 to <4 x float>*
  %wide.load10.9 = load <4 x float>, <4 x float>* %69, align 16, !alias.scope !11, !noalias !13
  %70 = fmul <4 x float> %broadcast.splat12, %wide.load10.9
  %71 = fadd <4 x float> %wide.load.939, %70
  %72 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %offset.idx.10
  %73 = bitcast float* %72 to <4 x float>*
  %wide.load10.10 = load <4 x float>, <4 x float>* %73, align 16, !alias.scope !11, !noalias !13
  %74 = fmul <4 x float> %broadcast.splat12, %wide.load10.10
  %75 = fadd <4 x float> %wide.load.1042, %74
  %76 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %offset.idx.11
  %77 = bitcast float* %76 to <4 x float>*
  %wide.load10.11 = load <4 x float>, <4 x float>* %77, align 16, !alias.scope !11, !noalias !13
  %78 = fmul <4 x float> %broadcast.splat12, %wide.load10.11
  %79 = fadd <4 x float> %wide.load.1145, %78
  %80 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %offset.idx.12
  %81 = bitcast float* %80 to <4 x float>*
  %wide.load10.12 = load <4 x float>, <4 x float>* %81, align 16, !alias.scope !11, !noalias !13
  %82 = fmul <4 x float> %broadcast.splat12, %wide.load10.12
  %83 = fadd <4 x float> %wide.load.1248, %82
  %84 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %offset.idx.13
  %85 = bitcast float* %84 to <4 x float>*
  %wide.load10.13 = load <4 x float>, <4 x float>* %85, align 16, !alias.scope !11, !noalias !13
  %86 = fmul <4 x float> %broadcast.splat12, %wide.load10.13
  %87 = fadd <4 x float> %wide.load.1351, %86
  %88 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %offset.idx.14
  %89 = bitcast float* %88 to <4 x float>*
  %wide.load10.14 = load <4 x float>, <4 x float>* %89, align 16, !alias.scope !11, !noalias !13
  %90 = fmul <4 x float> %broadcast.splat12, %wide.load10.14
  %91 = fadd <4 x float> %wide.load.1454, %90
  %92 = getelementptr [1536 x [1536 x float]], [1536 x [1536 x float]]* @B, i64 0, i64 %polly.indvar35, i64 %offset.idx.15
  %93 = bitcast float* %92 to <4 x float>*
  %wide.load10.15 = load <4 x float>, <4 x float>* %93, align 16, !alias.scope !11, !noalias !13
  %94 = fmul <4 x float> %broadcast.splat12, %wide.load10.15
  %95 = fadd <4 x float> %wide.load.1557, %94
  %polly.indvar_next36 = add nuw nsw i64 %polly.indvar35, 1
  %exitcond3 = icmp eq i64 %polly.indvar_next36, %indvars.iv1
  br i1 %exitcond3, label %polly.loop_exit34, label %vector.ph
}

; Function Attrs: nounwind
declare i32 @fputc(i32, %struct._IO_FILE* nocapture) local_unnamed_addr #4

; Function Attrs: argmemonly nounwind
declare void @llvm.memset.p0i8.i64(i8* nocapture writeonly, i8, i64, i1) #5

; Attribute groups: #0 @init_array, #1 @print_array, #2 @fprintf, #3 @main,
; #4 @fputc and the @fprintf call site, #5 @llvm.memset.
attributes #0 = { noinline norecurse nounwind uwtable writeonly "correctly-rounded-divide-sqrt-fp-math"="false" "disable-tail-calls"="false" "less-precise-fpmad"="false" "frame-pointer"="all" "no-infs-fp-math"="false" "no-jump-tables"="false" "no-nans-fp-math"="false" "no-signed-zeros-fp-math"="false" "no-trapping-math"="false" "polly-optimized" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+fxsr,+mmx,+sse,+sse2,+x87" "unsafe-fp-math"="false" "use-soft-float"="false" }
attributes #1 = { noinline nounwind uwtable "correctly-rounded-divide-sqrt-fp-math"="false" "disable-tail-calls"="false" "less-precise-fpmad"="false" "frame-pointer"="all" "no-infs-fp-math"="false" "no-jump-tables"="false" "no-nans-fp-math"="false" "no-signed-zeros-fp-math"="false" "no-trapping-math"="false" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+fxsr,+mmx,+sse,+sse2,+x87" "unsafe-fp-math"="false" "use-soft-float"="false" }
attributes #2 = { nounwind "correctly-rounded-divide-sqrt-fp-math"="false" "disable-tail-calls"="false" "less-precise-fpmad"="false" "frame-pointer"="all" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "no-signed-zeros-fp-math"="false" "no-trapping-math"="false" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+fxsr,+mmx,+sse,+sse2,+x87" "unsafe-fp-math"="false" "use-soft-float"="false" }
attributes #3 = { noinline norecurse nounwind uwtable "correctly-rounded-divide-sqrt-fp-math"="false" "disable-tail-calls"="false" "less-precise-fpmad"="false" "frame-pointer"="all" "no-infs-fp-math"="false" "no-jump-tables"="false" "no-nans-fp-math"="false" "no-signed-zeros-fp-math"="false" "no-trapping-math"="false" "polly-optimized" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+fxsr,+mmx,+sse,+sse2,+x87" "unsafe-fp-math"="false" "use-soft-float"="false" }
attributes #4 = { nounwind }
attributes #5 = { argmemonly nounwind }

!llvm.module.flags = !{!0}
!llvm.ident = !{!1}

; !2-!6 are the alias scopes used by @init_array (domain !3);
; !7-!13 are the alias scopes used by @main (domain !8).
!0 = !{i32 1, !"wchar_size", i32 4}
!1 = !{!"clang version 8.0.0 (trunk 342834) (llvm/trunk 342856)"}
!2 = distinct !{!2, !3, !"polly.alias.scope.MemRef_A"}
!3 = distinct !{!3, !"polly.alias.scope.domain"}
!4 = !{!5}
!5 = distinct !{!5, !3, !"polly.alias.scope.MemRef_B"}
!6 = !{!2}
!7 = distinct !{!7, !8, !"polly.alias.scope.MemRef_C"}
!8 = distinct !{!8, !"polly.alias.scope.domain"}
!9 = !{!10, !11}
!10 = distinct !{!10, !8, !"polly.alias.scope.MemRef_A"}
!11 = distinct !{!11, !8, !"polly.alias.scope.MemRef_B"}
!12 = !{!7, !11}
!13 = !{!7, !10}