Lines Matching refs:KERNEL
5 ; RUN: -polly-acc-dump-kernel-ir < %s | FileCheck %s -check-prefix=KERNEL-IR
44 ; KERNEL-IR: define ptx_kernel void @FUNC_foo_SCOP_0_KERNEL_0(i8 addrspace(1)* %MemRef_A, i64 %c0)
45 ; KERNEL-IR-LABEL: entry:
46 ; KERNEL-IR-NEXT: %0 = call i32 @llvm.nvvm.read.ptx.sreg.ctaid.x()
47 ; KERNEL-IR-NEXT: %b0 = zext i32 %0 to i64
48 ; KERNEL-IR-NEXT: %1 = call i32 @llvm.nvvm.read.ptx.sreg.tid.x()
49 ; KERNEL-IR-NEXT: %t0 = zext i32 %1 to i64
50 ; KERNEL-IR-NEXT: br label %polly.cond
52 ; KERNEL-IR-LABEL: polly.cond: ; preds = %entry
53 ; KERNEL-IR-NEXT: %2 = mul nsw i64 32, %b0
54 ; KERNEL-IR-NEXT: %3 = add nsw i64 %2, %t0
55 ; KERNEL-IR-NEXT: %4 = icmp sle i64 %3, 97
56 ; KERNEL-IR-NEXT: br i1 %4, label %polly.then, label %polly.else
58 ; KERNEL-IR-LABEL: polly.merge: ; preds = %polly.else, %polly.…
59 ; KERNEL-IR-NEXT: ret void
61 ; KERNEL-IR-LABEL: polly.then: ; preds = %polly.cond
62 ; KERNEL-IR-NEXT: %5 = mul nsw i64 32, %b0
63 ; KERNEL-IR-NEXT: %6 = add nsw i64 %5, %t0
64 ; KERNEL-IR-NEXT: br label %polly.stmt.for.body3
66 ; KERNEL-IR-LABEL: polly.stmt.for.body3: ; preds = %polly.then
67 ; KERNEL-IR-NEXT: %polly.access.cast.MemRef_A = bitcast i8 addrspace(1)* %MemRef_A to float addrs…
68 ; KERNEL-IR-NEXT: %pexp.pdiv_r = urem i64 %c0, 2
69 ; KERNEL-IR-NEXT: %polly.access.mul.MemRef_A = mul nsw i64 %pexp.pdiv_r, 100
70 ; KERNEL-IR-NEXT: %7 = mul nsw i64 32, %b0
71 ; KERNEL-IR-NEXT: %8 = add nsw i64 %7, %t0
72 ; KERNEL-IR-NEXT: %polly.access.add.MemRef_A = add nsw i64 %polly.access.mul.MemRef_A, %8
73 ; KERNEL-IR-NEXT: %polly.access.MemRef_A = getelementptr float, float addrspace(1)* %polly.access…
74 ; KERNEL-IR-NEXT: %tmp_p_scalar_ = load float, float addrspace(1)* %polly.access.MemRef_A, align 4
75 ; KERNEL-IR-NEXT: %polly.access.cast.MemRef_A1 = bitcast i8 addrspace(1)* %MemRef_A to float addr…
76 ; KERNEL-IR-NEXT: %pexp.pdiv_r2 = urem i64 %c0, 2
77 ; KERNEL-IR-NEXT: %polly.access.mul.MemRef_A3 = mul nsw i64 %pexp.pdiv_r2, 100
78 ; KERNEL-IR-NEXT: %9 = mul nsw i64 32, %b0
79 ; KERNEL-IR-NEXT: %10 = add nsw i64 %9, %t0
80 ; KERNEL-IR-NEXT: %11 = add nsw i64 %10, 1
81 ; KERNEL-IR-NEXT: %polly.access.add.MemRef_A4 = add nsw i64 %polly.access.mul.MemRef_A3, %11
82 ; KERNEL-IR-NEXT: %polly.access.MemRef_A5 = getelementptr float, float addrspace(1)* %polly.acces…
83 ; KERNEL-IR-NEXT: %tmp2_p_scalar_ = load float, float addrspace(1)* %polly.access.MemRef_A5, alig…
84 ; KERNEL-IR-NEXT: %p_add = fadd float %tmp_p_scalar_, %tmp2_p_scalar_
85 ; KERNEL-IR-NEXT: %polly.access.cast.MemRef_A6 = bitcast i8 addrspace(1)* %MemRef_A to float addr…
86 ; KERNEL-IR-NEXT: %pexp.pdiv_r7 = urem i64 %c0, 2
87 ; KERNEL-IR-NEXT: %polly.access.mul.MemRef_A8 = mul nsw i64 %pexp.pdiv_r7, 100
88 ; KERNEL-IR-NEXT: %12 = mul nsw i64 32, %b0
89 ; KERNEL-IR-NEXT: %13 = add nsw i64 %12, %t0
90 ; KERNEL-IR-NEXT: %14 = add nsw i64 %13, 2
91 ; KERNEL-IR-NEXT: %polly.access.add.MemRef_A9 = add nsw i64 %polly.access.mul.MemRef_A8, %14
92 ; KERNEL-IR-NEXT: %polly.access.MemRef_A10 = getelementptr float, float addrspace(1)* %polly.acce…
93 ; KERNEL-IR-NEXT: %tmp3_p_scalar_ = load float, float addrspace(1)* %polly.access.MemRef_A10, ali…
94 ; KERNEL-IR-NEXT: %p_add12 = fadd float %p_add, %tmp3_p_scalar_
95 ; KERNEL-IR-NEXT: %polly.access.cast.MemRef_A11 = bitcast i8 addrspace(1)* %MemRef_A to float add…
96 ; KERNEL-IR-NEXT: %15 = add nsw i64 %c0, 1
97 ; KERNEL-IR-NEXT: %pexp.pdiv_r12 = urem i64 %15, 2
98 ; KERNEL-IR-NEXT: %polly.access.mul.MemRef_A13 = mul nsw i64 %pexp.pdiv_r12, 100
99 ; KERNEL-IR-NEXT: %16 = mul nsw i64 32, %b0
100 ; KERNEL-IR-NEXT: %17 = add nsw i64 %16, %t0
101 ; KERNEL-IR-NEXT: %18 = add nsw i64 %17, 1
102 ; KERNEL-IR-NEXT: %polly.access.add.MemRef_A14 = add nsw i64 %polly.access.mul.MemRef_A13, %18
103 ; KERNEL-IR-NEXT: %polly.access.MemRef_A15 = getelementptr float, float addrspace(1)* %polly.acce…
104 ; KERNEL-IR-NEXT: %tmp4_p_scalar_ = load float, float addrspace(1)* %polly.access.MemRef_A15, ali…
105 ; KERNEL-IR-NEXT: %p_add17 = fadd float %tmp4_p_scalar_, %p_add12
106 ; KERNEL-IR-NEXT: %polly.access.cast.MemRef_A16 = bitcast i8 addrspace(1)* %MemRef_A to float add…
107 ; KERNEL-IR-NEXT: %19 = add nsw i64 %c0, 1
108 ; KERNEL-IR-NEXT: %pexp.pdiv_r17 = urem i64 %19, 2
109 ; KERNEL-IR-NEXT: %polly.access.mul.MemRef_A18 = mul nsw i64 %pexp.pdiv_r17, 100
110 ; KERNEL-IR-NEXT: %20 = mul nsw i64 32, %b0
111 ; KERNEL-IR-NEXT: %21 = add nsw i64 %20, %t0
112 ; KERNEL-IR-NEXT: %22 = add nsw i64 %21, 1
113 ; KERNEL-IR-NEXT: %polly.access.add.MemRef_A19 = add nsw i64 %polly.access.mul.MemRef_A18, %22
114 ; KERNEL-IR-NEXT: %polly.access.MemRef_A20 = getelementptr float, float addrspace(1)* %polly.acce…
115 ; KERNEL-IR-NEXT: store float %p_add17, float addrspace(1)* %polly.access.MemRef_A20, align 4
116 ; KERNEL-IR-NEXT: br label %polly.merge
118 ; KERNEL-IR-LABEL: polly.else: ; preds = %polly.cond
119 ; KERNEL-IR-NEXT: br label %polly.merge
120 ; KERNEL-IR-NEXT: }