; RUN: llc -verify-machineinstrs -o - %s -mtriple=aarch64-none-linux-gnu | FileCheck %s
; RUN: llc -verify-machineinstrs < %s -mtriple=aarch64-none-linux-gnu -mattr=-fp-armv8 | FileCheck --check-prefix=CHECK-NOFP %s

; Register-offset addressing tests for AArch64 loads and stores.
;
; Every function below takes a base pointer, a 32-bit offset and a 64-bit
; offset, and forms addresses in several ways (getelementptr with a 32-bit or
; 64-bit index, or explicit ptrtoint/add/inttoptr arithmetic with a sign- or
; zero-extended and optionally shifted offset). After each access the expected
; instruction and its extend/shift operand are matched for the default run.
;
; The second run disables fp-armv8 and uses only negative patterns: no load or
; store through an S, D or Q register may be emitted in that configuration.
;
; All accesses are volatile so that each one is kept and emitted separately.

@var_8bit = global i8 0
@var_16bit = global i16 0
@var_32bit = global i32 0
@var_64bit = global i64 0

@var_float = global float 0.0
@var_double = global double 0.0

; Byte-sized accesses: the element size is 1, so no shift amount is expected.
define void @ldst_8bit(i8* %base, i32 %off32, i64 %off64) minsize {
; CHECK-LABEL: ldst_8bit:

  ; 32-bit GEP index, sign-extending load of the byte.
  %addr8_sxtw = getelementptr i8, i8* %base, i32 %off32
  %val8_sxtw = load volatile i8, i8* %addr8_sxtw
  %val32_signed = sext i8 %val8_sxtw to i32
  store volatile i32 %val32_signed, i32* @var_32bit
; CHECK: ldrsb {{w[0-9]+}}, [{{x[0-9]+}}, {{[wx][0-9]+}}, sxtw]

  ; 64-bit GEP index, zero-extending load of the byte.
  %addr_lsl = getelementptr i8, i8* %base, i64 %off64
  %val8_lsl = load volatile i8, i8* %addr_lsl
  %val32_unsigned = zext i8 %val8_lsl to i32
  store volatile i32 %val32_unsigned, i32* @var_32bit
; CHECK: ldrb {{w[0-9]+}}, [{{x[0-9]+}}, {{x[0-9]+}}]

  ; Zero-extended 32-bit offset added to the base as an integer.
  %addrint_uxtw = ptrtoint i8* %base to i64
  %offset_uxtw = zext i32 %off32 to i64
  %addrint1_uxtw = add i64 %addrint_uxtw, %offset_uxtw
  %addr_uxtw = inttoptr i64 %addrint1_uxtw to i8*
  %val8_uxtw = load volatile i8, i8* %addr_uxtw
  %newval8 = add i8 %val8_uxtw, 1
  store volatile i8 %newval8, i8* @var_8bit
; CHECK: ldrb {{w[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, uxtw]

  ret void
}


; Halfword accesses: scaled forms are expected to use a shift of 1.
define void @ldst_16bit(i16* %base, i32 %off32, i64 %off64) minsize {
; CHECK-LABEL: ldst_16bit:

  ; 32-bit GEP index (scaled by the element size), sign-extending load.
  %addr8_sxtwN = getelementptr i16, i16* %base, i32 %off32
  %val8_sxtwN = load volatile i16, i16* %addr8_sxtwN
  %val32_signed = sext i16 %val8_sxtwN to i32
  store volatile i32 %val32_signed, i32* @var_32bit
; CHECK: ldrsh {{w[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, sxtw #1]

  ; 64-bit GEP index (scaled by the element size), zero-extending load.
  %addr_lslN = getelementptr i16, i16* %base, i64 %off64
  %val8_lslN = load volatile i16, i16* %addr_lslN
  %val32_unsigned = zext i16 %val8_lslN to i32
  store volatile i32 %val32_unsigned, i32* @var_32bit
; CHECK: ldrh {{w[0-9]+}}, [{{x[0-9]+}}, {{x[0-9]+}}, lsl #1]

  ; Zero-extended 32-bit byte offset, not scaled.
  %addrint_uxtw = ptrtoint i16* %base to i64
  %offset_uxtw = zext i32 %off32 to i64
  %addrint1_uxtw = add i64 %addrint_uxtw, %offset_uxtw
  %addr_uxtw = inttoptr i64 %addrint1_uxtw to i16*
  %val8_uxtw = load volatile i16, i16* %addr_uxtw
  %newval8 = add i16 %val8_uxtw, 1
  store volatile i16 %newval8, i16* @var_16bit
; CHECK: ldrh {{w[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, uxtw]

  ; Sign-extended 32-bit byte offset, not scaled; result sign-extended to 64 bits.
  %base_sxtw = ptrtoint i16* %base to i64
  %offset_sxtw = sext i32 %off32 to i64
  %addrint_sxtw = add i64 %base_sxtw, %offset_sxtw
  %addr_sxtw = inttoptr i64 %addrint_sxtw to i16*
  %val16_sxtw = load volatile i16, i16* %addr_sxtw
  %val64_signed = sext i16 %val16_sxtw to i64
  store volatile i64 %val64_signed, i64* @var_64bit
; CHECK: ldrsh {{x[0-9]+}}, [{{x[0-9]+}}, {{[wx][0-9]+}}, sxtw]


  ; 64-bit byte offset, not scaled; result zero-extended to 64 bits.
  %base_lsl = ptrtoint i16* %base to i64
  %addrint_lsl = add i64 %base_lsl, %off64
  %addr_lsl = inttoptr i64 %addrint_lsl to i16*
  %val16_lsl = load volatile i16, i16* %addr_lsl
  %val64_unsigned = zext i16 %val16_lsl to i64
  store volatile i64 %val64_unsigned, i64* @var_64bit
; CHECK: ldrh {{w[0-9]+}}, [{{x[0-9]+}}, {{x[0-9]+}}]

  ; Zero-extended 32-bit offset shifted left by 1, used as a store address.
  %base_uxtwN = ptrtoint i16* %base to i64
  %offset_uxtwN = zext i32 %off32 to i64
  %offset2_uxtwN = shl i64 %offset_uxtwN, 1
  %addrint_uxtwN = add i64 %base_uxtwN, %offset2_uxtwN
  %addr_uxtwN = inttoptr i64 %addrint_uxtwN to i16*
  %val32 = load volatile i32, i32* @var_32bit
  %val16_trunc32 = trunc i32 %val32 to i16
  store volatile i16 %val16_trunc32, i16* %addr_uxtwN
; CHECK: strh {{w[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, uxtw #1]
  ret void
}

; Word accesses: scaled forms are expected to use a shift of 2.
define void @ldst_32bit(i32* %base, i32 %off32, i64 %off64) minsize {
; CHECK-LABEL: ldst_32bit:

  ; 32-bit GEP index (scaled by the element size).
  %addr_sxtwN = getelementptr i32, i32* %base, i32 %off32
  %val_sxtwN = load volatile i32, i32* %addr_sxtwN
  store volatile i32 %val_sxtwN, i32* @var_32bit
; CHECK: ldr {{w[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, sxtw #2]

  ; 64-bit GEP index (scaled by the element size).
  %addr_lslN = getelementptr i32, i32* %base, i64 %off64
  %val_lslN = load volatile i32, i32* %addr_lslN
  store volatile i32 %val_lslN, i32* @var_32bit
; CHECK: ldr {{w[0-9]+}}, [{{x[0-9]+}}, {{x[0-9]+}}, lsl #2]

  ; Zero-extended 32-bit byte offset, not scaled.
  %addrint_uxtw = ptrtoint i32* %base to i64
  %offset_uxtw = zext i32 %off32 to i64
  %addrint1_uxtw = add i64 %addrint_uxtw, %offset_uxtw
  %addr_uxtw = inttoptr i64 %addrint1_uxtw to i32*
  %val_uxtw = load volatile i32, i32* %addr_uxtw
  %newval8 = add i32 %val_uxtw, 1
  store volatile i32 %newval8, i32* @var_32bit
; CHECK: ldr {{w[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, uxtw]


  ; Sign-extended 32-bit byte offset, not scaled; result sign-extended to 64 bits.
  %base_sxtw = ptrtoint i32* %base to i64
  %offset_sxtw = sext i32 %off32 to i64
  %addrint_sxtw = add i64 %base_sxtw, %offset_sxtw
  %addr_sxtw = inttoptr i64 %addrint_sxtw to i32*
  %val16_sxtw = load volatile i32, i32* %addr_sxtw
  %val64_signed = sext i32 %val16_sxtw to i64
  store volatile i64 %val64_signed, i64* @var_64bit
; CHECK: ldrsw {{x[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, sxtw]


  ; 64-bit byte offset, not scaled; result zero-extended to 64 bits.
  %base_lsl = ptrtoint i32* %base to i64
  %addrint_lsl = add i64 %base_lsl, %off64
  %addr_lsl = inttoptr i64 %addrint_lsl to i32*
  %val16_lsl = load volatile i32, i32* %addr_lsl
  %val64_unsigned = zext i32 %val16_lsl to i64
  store volatile i64 %val64_unsigned, i64* @var_64bit
; CHECK: ldr {{w[0-9]+}}, [{{x[0-9]+}}, {{x[0-9]+}}]

  ; Zero-extended 32-bit offset shifted left by 2, used as a store address.
  %base_uxtwN = ptrtoint i32* %base to i64
  %offset_uxtwN = zext i32 %off32 to i64
  %offset2_uxtwN = shl i64 %offset_uxtwN, 2
  %addrint_uxtwN = add i64 %base_uxtwN, %offset2_uxtwN
  %addr_uxtwN = inttoptr i64 %addrint_uxtwN to i32*
  %val32 = load volatile i32, i32* @var_32bit
  store volatile i32 %val32, i32* %addr_uxtwN
; CHECK: str {{w[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, uxtw #2]
  ret void
}

; Doubleword accesses: scaled forms are expected to use a shift of 3.
define void @ldst_64bit(i64* %base, i32 %off32, i64 %off64) minsize {
; CHECK-LABEL: ldst_64bit:

  ; 32-bit GEP index (scaled by the element size).
  %addr_sxtwN = getelementptr i64, i64* %base, i32 %off32
  %val_sxtwN = load volatile i64, i64* %addr_sxtwN
  store volatile i64 %val_sxtwN, i64* @var_64bit
; CHECK: ldr {{x[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, sxtw #3]

  ; 64-bit GEP index (scaled by the element size).
  %addr_lslN = getelementptr i64, i64* %base, i64 %off64
  %val_lslN = load volatile i64, i64* %addr_lslN
  store volatile i64 %val_lslN, i64* @var_64bit
; CHECK: ldr {{x[0-9]+}}, [{{x[0-9]+}}, {{x[0-9]+}}, lsl #3]

  ; Zero-extended 32-bit byte offset, not scaled.
  %addrint_uxtw = ptrtoint i64* %base to i64
  %offset_uxtw = zext i32 %off32 to i64
  %addrint1_uxtw = add i64 %addrint_uxtw, %offset_uxtw
  %addr_uxtw = inttoptr i64 %addrint1_uxtw to i64*
  %val8_uxtw = load volatile i64, i64* %addr_uxtw
  %newval8 = add i64 %val8_uxtw, 1
  store volatile i64 %newval8, i64* @var_64bit
; CHECK: ldr {{x[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, uxtw]

  ; Sign-extended 32-bit byte offset, not scaled.
  %base_sxtw = ptrtoint i64* %base to i64
  %offset_sxtw = sext i32 %off32 to i64
  %addrint_sxtw = add i64 %base_sxtw, %offset_sxtw
  %addr_sxtw = inttoptr i64 %addrint_sxtw to i64*
  %val64_sxtw = load volatile i64, i64* %addr_sxtw
  store volatile i64 %val64_sxtw, i64* @var_64bit
; CHECK: ldr {{x[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, sxtw]

  ; 64-bit byte offset, not scaled.
  %base_lsl = ptrtoint i64* %base to i64
  %addrint_lsl = add i64 %base_lsl, %off64
  %addr_lsl = inttoptr i64 %addrint_lsl to i64*
  %val64_lsl = load volatile i64, i64* %addr_lsl
  store volatile i64 %val64_lsl, i64* @var_64bit
; CHECK: ldr {{x[0-9]+}}, [{{x[0-9]+}}, {{x[0-9]+}}]

  ; Zero-extended 32-bit offset shifted left by 3, used as a store address.
  %base_uxtwN = ptrtoint i64* %base to i64
  %offset_uxtwN = zext i32 %off32 to i64
  %offset2_uxtwN = shl i64 %offset_uxtwN, 3
  %addrint_uxtwN = add i64 %base_uxtwN, %offset2_uxtwN
  %addr_uxtwN = inttoptr i64 %addrint_uxtwN to i64*
  %val64 = load volatile i64, i64* @var_64bit
  store volatile i64 %val64, i64* %addr_uxtwN
; CHECK: str {{x[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, uxtw #3]
  ret void
}

; Single-precision accesses: S registers with FP enabled, none without it.
define void @ldst_float(float* %base, i32 %off32, i64 %off64) minsize {
; CHECK-LABEL: ldst_float:

  ; 32-bit GEP index (scaled by the element size).
  %addr_sxtwN = getelementptr float, float* %base, i32 %off32
  %val_sxtwN = load volatile float, float* %addr_sxtwN
  store volatile float %val_sxtwN, float* @var_float
; CHECK: ldr {{s[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, sxtw #2]
; CHECK-NOFP-NOT: ldr {{s[0-9]+}},

  ; 64-bit GEP index (scaled by the element size).
  %addr_lslN = getelementptr float, float* %base, i64 %off64
  %val_lslN = load volatile float, float* %addr_lslN
  store volatile float %val_lslN, float* @var_float
; CHECK: ldr {{s[0-9]+}}, [{{x[0-9]+}}, {{x[0-9]+}}, lsl #2]
; CHECK-NOFP-NOT: ldr {{s[0-9]+}},

  ; Zero-extended 32-bit byte offset, not scaled.
  %addrint_uxtw = ptrtoint float* %base to i64
  %offset_uxtw = zext i32 %off32 to i64
  %addrint1_uxtw = add i64 %addrint_uxtw, %offset_uxtw
  %addr_uxtw = inttoptr i64 %addrint1_uxtw to float*
  %val_uxtw = load volatile float, float* %addr_uxtw
  store volatile float %val_uxtw, float* @var_float
; CHECK: ldr {{s[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, uxtw]
; CHECK-NOFP-NOT: ldr {{s[0-9]+}},

  ; Sign-extended 32-bit byte offset, not scaled.
  %base_sxtw = ptrtoint float* %base to i64
  %offset_sxtw = sext i32 %off32 to i64
  %addrint_sxtw = add i64 %base_sxtw, %offset_sxtw
  %addr_sxtw = inttoptr i64 %addrint_sxtw to float*
  %val64_sxtw = load volatile float, float* %addr_sxtw
  store volatile float %val64_sxtw, float* @var_float
; CHECK: ldr {{s[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, sxtw]
; CHECK-NOFP-NOT: ldr {{s[0-9]+}},

  ; 64-bit byte offset, not scaled.
  %base_lsl = ptrtoint float* %base to i64
  %addrint_lsl = add i64 %base_lsl, %off64
  %addr_lsl = inttoptr i64 %addrint_lsl to float*
  %val64_lsl = load volatile float, float* %addr_lsl
  store volatile float %val64_lsl, float* @var_float
; CHECK: ldr {{s[0-9]+}}, [{{x[0-9]+}}, {{x[0-9]+}}]
; CHECK-NOFP-NOT: ldr {{s[0-9]+}},

  ; Zero-extended 32-bit offset shifted left by 2, used as a store address.
  ; The negative pattern names the store here; S-register loads are already
  ; rejected by the patterns above.
  %base_uxtwN = ptrtoint float* %base to i64
  %offset_uxtwN = zext i32 %off32 to i64
  %offset2_uxtwN = shl i64 %offset_uxtwN, 2
  %addrint_uxtwN = add i64 %base_uxtwN, %offset2_uxtwN
  %addr_uxtwN = inttoptr i64 %addrint_uxtwN to float*
  %val64 = load volatile float, float* @var_float
  store volatile float %val64, float* %addr_uxtwN
; CHECK: str {{s[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, uxtw #2]
; CHECK-NOFP-NOT: str {{s[0-9]+}},
  ret void
}

; Double-precision accesses: D registers with FP enabled, none without it.
define void @ldst_double(double* %base, i32 %off32, i64 %off64) minsize {
; CHECK-LABEL: ldst_double:

  ; 32-bit GEP index (scaled by the element size).
  %addr_sxtwN = getelementptr double, double* %base, i32 %off32
  %val_sxtwN = load volatile double, double* %addr_sxtwN
  store volatile double %val_sxtwN, double* @var_double
; CHECK: ldr {{d[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, sxtw #3]
; CHECK-NOFP-NOT: ldr {{d[0-9]+}},

  ; 64-bit GEP index (scaled by the element size).
  %addr_lslN = getelementptr double, double* %base, i64 %off64
  %val_lslN = load volatile double, double* %addr_lslN
  store volatile double %val_lslN, double* @var_double
; CHECK: ldr {{d[0-9]+}}, [{{x[0-9]+}}, {{x[0-9]+}}, lsl #3]
; CHECK-NOFP-NOT: ldr {{d[0-9]+}},

  ; Zero-extended 32-bit byte offset, not scaled.
  %addrint_uxtw = ptrtoint double* %base to i64
  %offset_uxtw = zext i32 %off32 to i64
  %addrint1_uxtw = add i64 %addrint_uxtw, %offset_uxtw
  %addr_uxtw = inttoptr i64 %addrint1_uxtw to double*
  %val_uxtw = load volatile double, double* %addr_uxtw
  store volatile double %val_uxtw, double* @var_double
; CHECK: ldr {{d[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, uxtw]
; CHECK-NOFP-NOT: ldr {{d[0-9]+}},

  ; Sign-extended 32-bit byte offset, not scaled.
  %base_sxtw = ptrtoint double* %base to i64
  %offset_sxtw = sext i32 %off32 to i64
  %addrint_sxtw = add i64 %base_sxtw, %offset_sxtw
  %addr_sxtw = inttoptr i64 %addrint_sxtw to double*
  %val64_sxtw = load volatile double, double* %addr_sxtw
  store volatile double %val64_sxtw, double* @var_double
; CHECK: ldr {{d[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, sxtw]
; CHECK-NOFP-NOT: ldr {{d[0-9]+}},

  ; 64-bit byte offset, not scaled.
  %base_lsl = ptrtoint double* %base to i64
  %addrint_lsl = add i64 %base_lsl, %off64
  %addr_lsl = inttoptr i64 %addrint_lsl to double*
  %val64_lsl = load volatile double, double* %addr_lsl
  store volatile double %val64_lsl, double* @var_double
; CHECK: ldr {{d[0-9]+}}, [{{x[0-9]+}}, {{x[0-9]+}}]
; CHECK-NOFP-NOT: ldr {{d[0-9]+}},

  ; Zero-extended 32-bit offset shifted left by 3, used as a store address.
  ; The negative pattern names the store here; D-register loads are already
  ; rejected by the patterns above.
  %base_uxtwN = ptrtoint double* %base to i64
  %offset_uxtwN = zext i32 %off32 to i64
  %offset2_uxtwN = shl i64 %offset_uxtwN, 3
  %addrint_uxtwN = add i64 %base_uxtwN, %offset2_uxtwN
  %addr_uxtwN = inttoptr i64 %addrint_uxtwN to double*
  %val64 = load volatile double, double* @var_double
  store volatile double %val64, double* %addr_uxtwN
; CHECK: str {{d[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, uxtw #3]
; CHECK-NOFP-NOT: str {{d[0-9]+}},
  ret void
}


; 128-bit accesses: Q registers with FP enabled, none without it. The negative
; patterns are deliberately independent of the addressing mode so that every
; Q-register form is rejected, matching the float and double tests.
define void @ldst_128bit(fp128* %base, i32 %off32, i64 %off64) minsize {
; CHECK-LABEL: ldst_128bit:

  ; 32-bit GEP index (scaled by the element size).
  %addr_sxtwN = getelementptr fp128, fp128* %base, i32 %off32
  %val_sxtwN = load volatile fp128, fp128* %addr_sxtwN
  store volatile fp128 %val_sxtwN, fp128* %base
; CHECK: ldr {{q[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, sxtw #4]
; CHECK-NOFP-NOT: ldr {{q[0-9]+}},

  ; 64-bit GEP index (scaled by the element size).
  %addr_lslN = getelementptr fp128, fp128* %base, i64 %off64
  %val_lslN = load volatile fp128, fp128* %addr_lslN
  store volatile fp128 %val_lslN, fp128* %base
; CHECK: ldr {{q[0-9]+}}, [{{x[0-9]+}}, {{x[0-9]+}}, lsl #4]
; CHECK-NOFP-NOT: ldr {{q[0-9]+}},

  ; Zero-extended 32-bit byte offset, not scaled.
  %addrint_uxtw = ptrtoint fp128* %base to i64
  %offset_uxtw = zext i32 %off32 to i64
  %addrint1_uxtw = add i64 %addrint_uxtw, %offset_uxtw
  %addr_uxtw = inttoptr i64 %addrint1_uxtw to fp128*
  %val_uxtw = load volatile fp128, fp128* %addr_uxtw
  store volatile fp128 %val_uxtw, fp128* %base
; CHECK: ldr {{q[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, uxtw]
; CHECK-NOFP-NOT: ldr {{q[0-9]+}},

  ; Sign-extended 32-bit byte offset, not scaled.
  %base_sxtw = ptrtoint fp128* %base to i64
  %offset_sxtw = sext i32 %off32 to i64
  %addrint_sxtw = add i64 %base_sxtw, %offset_sxtw
  %addr_sxtw = inttoptr i64 %addrint_sxtw to fp128*
  %val64_sxtw = load volatile fp128, fp128* %addr_sxtw
  store volatile fp128 %val64_sxtw, fp128* %base
; CHECK: ldr {{q[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, sxtw]
; CHECK-NOFP-NOT: ldr {{q[0-9]+}},

  ; 64-bit byte offset, not scaled.
  %base_lsl = ptrtoint fp128* %base to i64
  %addrint_lsl = add i64 %base_lsl, %off64
  %addr_lsl = inttoptr i64 %addrint_lsl to fp128*
  %val64_lsl = load volatile fp128, fp128* %addr_lsl
  store volatile fp128 %val64_lsl, fp128* %base
; CHECK: ldr {{q[0-9]+}}, [{{x[0-9]+}}, {{x[0-9]+}}]
; CHECK-NOFP-NOT: ldr {{q[0-9]+}},

  ; Zero-extended 32-bit offset shifted left by 4, used as a store address.
  ; The negative pattern names the store here; Q-register loads are already
  ; rejected by the patterns above.
  %base_uxtwN = ptrtoint fp128* %base to i64
  %offset_uxtwN = zext i32 %off32 to i64
  %offset2_uxtwN = shl i64 %offset_uxtwN, 4
  %addrint_uxtwN = add i64 %base_uxtwN, %offset2_uxtwN
  %addr_uxtwN = inttoptr i64 %addrint_uxtwN to fp128*
  %val64 = load volatile fp128, fp128* %base
  store volatile fp128 %val64, fp128* %addr_uxtwN
; CHECK: str {{q[0-9]+}}, [{{x[0-9]+}}, {{[xw][0-9]+}}, uxtw #4]
; CHECK-NOFP-NOT: str {{q[0-9]+}},
  ret void
}