1; RUN: llc -mtriple=armv8-none-linux-gnu -verify-machineinstrs < %s | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-LE --check-prefix=CHECK-ARM --check-prefix=CHECK-ARM-LE 2; RUN: llc -mtriple=armebv8-none-linux-gnu -verify-machineinstrs < %s | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-BE --check-prefix=CHECK-ARM --check-prefix=CHECK-ARM-BE 3; RUN: llc -mtriple=thumbv8-none-linux-gnu -verify-machineinstrs < %s | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-LE --check-prefix=CHECK-THUMB --check-prefix=CHECK-THUMB-LE 4; RUN: llc -mtriple=thumbebv8-none-linux-gnu -verify-machineinstrs < %s | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-BE --check-prefix=CHECK-THUMB --check-prefix=CHECK-THUMB-BE 5 6@var8 = global i8 0 7@var16 = global i16 0 8@var32 = global i32 0 9@var64 = global i64 0 10 11define i8 @test_atomic_load_add_i8(i8 %offset) nounwind { 12; CHECK-LABEL: test_atomic_load_add_i8: 13 %old = atomicrmw add i8* @var8, i8 %offset seq_cst 14; CHECK-NOT: dmb 15; CHECK-NOT: mcr 16; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var8 17; CHECK: movt r[[ADDR]], :upper16:var8 18 19; CHECK: .LBB{{[0-9]+}}_1: 20; CHECK: ldaexb r[[OLD:[0-9]+]], [r[[ADDR]]] 21 ; r0 below is a reasonable guess but could change: it certainly comes into the 22 ; function there. 23; CHECK-NEXT: add{{s?}} [[NEW:r[0-9]+]], r[[OLD]], r0 24; CHECK-NEXT: stlexb [[STATUS:r[0-9]+]], [[NEW]], [r[[ADDR]]] 25; CHECK-NEXT: cmp [[STATUS]], #0 26; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 27; CHECK-NOT: dmb 28; CHECK-NOT: mcr 29 30; CHECK: mov r0, r[[OLD]] 31 ret i8 %old 32} 33 34define i16 @test_atomic_load_add_i16(i16 %offset) nounwind { 35; CHECK-LABEL: test_atomic_load_add_i16: 36 %old = atomicrmw add i16* @var16, i16 %offset acquire 37; CHECK-NOT: dmb 38; CHECK-NOT: mcr 39; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var16 40; CHECK: movt r[[ADDR]], :upper16:var16 41 42; CHECK: .LBB{{[0-9]+}}_1: 43; CHECK: ldaexh r[[OLD:[0-9]+]], [r[[ADDR]]] 44 ; r0 below is a reasonable guess but could change: it certainly comes into the 45 ; function there. 46; CHECK-NEXT: add{{s?}} [[NEW:r[0-9]+]], r[[OLD]], r0 47; CHECK-NEXT: strexh [[STATUS:r[0-9]+]], [[NEW]], [r[[ADDR]]] 48; CHECK-NEXT: cmp [[STATUS]], #0 49; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 50; CHECK-NOT: dmb 51; CHECK-NOT: mcr 52 53; CHECK: mov r0, r[[OLD]] 54 ret i16 %old 55} 56 57define i32 @test_atomic_load_add_i32(i32 %offset) nounwind { 58; CHECK-LABEL: test_atomic_load_add_i32: 59 %old = atomicrmw add i32* @var32, i32 %offset release 60; CHECK-NOT: dmb 61; CHECK-NOT: mcr 62; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var32 63; CHECK: movt r[[ADDR]], :upper16:var32 64 65; CHECK: .LBB{{[0-9]+}}_1: 66; CHECK: ldrex r[[OLD:[0-9]+]], [r[[ADDR]]] 67 ; r0 below is a reasonable guess but could change: it certainly comes into the 68 ; function there. 69; CHECK-NEXT: add{{s?}} [[NEW:r[0-9]+]], r[[OLD]], r0 70; CHECK-NEXT: stlex [[STATUS:r[0-9]+]], [[NEW]], [r[[ADDR]]] 71; CHECK-NEXT: cmp [[STATUS]], #0 72; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 73; CHECK-NOT: dmb 74; CHECK-NOT: mcr 75 76; CHECK: mov r0, r[[OLD]] 77 ret i32 %old 78} 79 80define void @test_atomic_load_add_i64(i64 %offset) nounwind { 81; CHECK-LABEL: test_atomic_load_add_i64: 82 %old = atomicrmw add i64* @var64, i64 %offset monotonic 83; CHECK-NOT: dmb 84; CHECK-NOT: mcr 85; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var64 86; CHECK: movt r[[ADDR]], :upper16:var64 87 88; CHECK: .LBB{{[0-9]+}}_1: 89; CHECK: ldrexd r[[OLD1:[0-9]+]], r[[OLD2:[0-9]+]], [r[[ADDR]]] 90 ; r0, r1 below is a reasonable guess but could change: it certainly comes into the 91 ; function there. 92; CHECK-LE-NEXT: adds{{(\.w)?}} [[NEW1:r[0-9]+|lr]], r[[OLD1]], r0 93; CHECK-LE-NEXT: adc{{(\.w)?}} [[NEW2:r[0-9]+]], r[[OLD2]], r1 94; CHECK-BE-NEXT: adds{{(\.w)?}} [[NEW2:r[0-9]+|lr]], r[[OLD2]], r1 95; CHECK-BE-NEXT: adc{{(\.w)?}} [[NEW1:r[0-9]+]], r[[OLD1]], r0 96; CHECK-NEXT: strexd [[STATUS:r[0-9]+]], [[NEW1]], [[NEW2]], [r[[ADDR]]] 97; CHECK-NEXT: cmp [[STATUS]], #0 98; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 99; CHECK-NOT: dmb 100; CHECK-NOT: mcr 101 102; CHECK: strd r[[OLD1]], r[[OLD2]], [r[[ADDR]]] 103 store i64 %old, i64* @var64 104 ret void 105} 106 107define i8 @test_atomic_load_sub_i8(i8 %offset) nounwind { 108; CHECK-LABEL: test_atomic_load_sub_i8: 109 %old = atomicrmw sub i8* @var8, i8 %offset monotonic 110; CHECK-NOT: dmb 111; CHECK-NOT: mcr 112; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var8 113; CHECK: movt r[[ADDR]], :upper16:var8 114 115; CHECK: .LBB{{[0-9]+}}_1: 116; CHECK: ldrexb r[[OLD:[0-9]+]], [r[[ADDR]]] 117 ; r0 below is a reasonable guess but could change: it certainly comes into the 118 ; function there. 119; CHECK-NEXT: sub{{s?}} [[NEW:r[0-9]+]], r[[OLD]], r0 120; CHECK-NEXT: strexb [[STATUS:r[0-9]+]], [[NEW]], [r[[ADDR]]] 121; CHECK-NEXT: cmp [[STATUS]], #0 122; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 123; CHECK-NOT: dmb 124; CHECK-NOT: mcr 125 126; CHECK: mov r0, r[[OLD]] 127 ret i8 %old 128} 129 130define i16 @test_atomic_load_sub_i16(i16 %offset) nounwind { 131; CHECK-LABEL: test_atomic_load_sub_i16: 132 %old = atomicrmw sub i16* @var16, i16 %offset release 133; CHECK-NOT: dmb 134; CHECK-NOT: mcr 135; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var16 136; CHECK: movt r[[ADDR]], :upper16:var16 137 138; CHECK: .LBB{{[0-9]+}}_1: 139; CHECK: ldrexh r[[OLD:[0-9]+]], [r[[ADDR]]] 140 ; r0 below is a reasonable guess but could change: it certainly comes into the 141 ; function there. 142; CHECK-NEXT: sub{{s?}} [[NEW:r[0-9]+]], r[[OLD]], r0 143; CHECK-NEXT: stlexh [[STATUS:r[0-9]+]], [[NEW]], [r[[ADDR]]] 144; CHECK-NEXT: cmp [[STATUS]], #0 145; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 146; CHECK-NOT: dmb 147; CHECK-NOT: mcr 148 149; CHECK: mov r0, r[[OLD]] 150 ret i16 %old 151} 152 153define i32 @test_atomic_load_sub_i32(i32 %offset) nounwind { 154; CHECK-LABEL: test_atomic_load_sub_i32: 155 %old = atomicrmw sub i32* @var32, i32 %offset acquire 156; CHECK-NOT: dmb 157; CHECK-NOT: mcr 158; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var32 159; CHECK: movt r[[ADDR]], :upper16:var32 160 161; CHECK: .LBB{{[0-9]+}}_1: 162; CHECK: ldaex r[[OLD:[0-9]+]], [r[[ADDR]]] 163 ; r0 below is a reasonable guess but could change: it certainly comes into the 164 ; function there. 165; CHECK-NEXT: sub{{s?}} [[NEW:r[0-9]+]], r[[OLD]], r0 166; CHECK-NEXT: strex [[STATUS:r[0-9]+]], [[NEW]], [r[[ADDR]]] 167; CHECK-NEXT: cmp [[STATUS]], #0 168; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 169; CHECK-NOT: dmb 170; CHECK-NOT: mcr 171 172; CHECK: mov r0, r[[OLD]] 173 ret i32 %old 174} 175 176define void @test_atomic_load_sub_i64(i64 %offset) nounwind { 177; CHECK-LABEL: test_atomic_load_sub_i64: 178 %old = atomicrmw sub i64* @var64, i64 %offset seq_cst 179; CHECK-NOT: dmb 180; CHECK-NOT: mcr 181; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var64 182; CHECK: movt r[[ADDR]], :upper16:var64 183 184; CHECK: .LBB{{[0-9]+}}_1: 185; CHECK: ldaexd r[[OLD1:[0-9]+]], r[[OLD2:[0-9]+]], [r[[ADDR]]] 186 ; r0, r1 below is a reasonable guess but could change: it certainly comes into the 187 ; function there. 188; CHECK-LE-NEXT: subs{{(\.w)?}} [[NEW1:r[0-9]+|lr]], r[[OLD1]], r0 189; CHECK-LE-NEXT: sbc{{(\.w)?}} [[NEW2:r[0-9]+]], r[[OLD2]], r1 190; CHECK-BE-NEXT: subs{{(\.w)?}} [[NEW2:r[0-9]+|lr]], r[[OLD2]], r1 191; CHECK-BE-NEXT: sbc{{(\.w)?}} [[NEW1:r[0-9]+]], r[[OLD1]], r0 192; CHECK-NEXT: stlexd [[STATUS:r[0-9]+]], [[NEW1]], [[NEW2]], [r[[ADDR]]] 193; CHECK-NEXT: cmp [[STATUS]], #0 194; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 195; CHECK-NOT: dmb 196; CHECK-NOT: mcr 197 198; CHECK: strd r[[OLD1]], r[[OLD2]], [r[[ADDR]]] 199 store i64 %old, i64* @var64 200 ret void 201} 202 203define i8 @test_atomic_load_and_i8(i8 %offset) nounwind { 204; CHECK-LABEL: test_atomic_load_and_i8: 205 %old = atomicrmw and i8* @var8, i8 %offset release 206; CHECK-NOT: dmb 207; CHECK-NOT: mcr 208; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var8 209; CHECK: movt r[[ADDR]], :upper16:var8 210 211; CHECK: .LBB{{[0-9]+}}_1: 212; CHECK: ldrexb r[[OLD:[0-9]+]], [r[[ADDR]]] 213 ; r0 below is a reasonable guess but could change: it certainly comes into the 214 ; function there. 215; CHECK-NEXT: and{{(\.w)?}} [[NEW:r[0-9]+]], r[[OLD]], r0 216; CHECK-NEXT: stlexb [[STATUS:r[0-9]+]], [[NEW]], [r[[ADDR]]] 217; CHECK-NEXT: cmp [[STATUS]], #0 218; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 219; CHECK-NOT: dmb 220; CHECK-NOT: mcr 221 222; CHECK: mov r0, r[[OLD]] 223 ret i8 %old 224} 225 226define i16 @test_atomic_load_and_i16(i16 %offset) nounwind { 227; CHECK-LABEL: test_atomic_load_and_i16: 228 %old = atomicrmw and i16* @var16, i16 %offset monotonic 229; CHECK-NOT: dmb 230; CHECK-NOT: mcr 231; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var16 232; CHECK: movt r[[ADDR]], :upper16:var16 233 234; CHECK: .LBB{{[0-9]+}}_1: 235; CHECK: ldrexh r[[OLD:[0-9]+]], [r[[ADDR]]] 236 ; r0 below is a reasonable guess but could change: it certainly comes into the 237 ; function there. 238; CHECK-NEXT: and{{(\.w)?}} [[NEW:r[0-9]+]], r[[OLD]], r0 239; CHECK-NEXT: strexh [[STATUS:r[0-9]+]], [[NEW]], [r[[ADDR]]] 240; CHECK-NEXT: cmp [[STATUS]], #0 241; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 242; CHECK-NOT: dmb 243; CHECK-NOT: mcr 244 245; CHECK: mov r0, r[[OLD]] 246 ret i16 %old 247} 248 249define i32 @test_atomic_load_and_i32(i32 %offset) nounwind { 250; CHECK-LABEL: test_atomic_load_and_i32: 251 %old = atomicrmw and i32* @var32, i32 %offset seq_cst 252; CHECK-NOT: dmb 253; CHECK-NOT: mcr 254; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var32 255; CHECK: movt r[[ADDR]], :upper16:var32 256 257; CHECK: .LBB{{[0-9]+}}_1: 258; CHECK: ldaex r[[OLD:[0-9]+]], [r[[ADDR]]] 259 ; r0 below is a reasonable guess but could change: it certainly comes into the 260 ; function there. 261; CHECK-NEXT: and{{(\.w)?}} [[NEW:r[0-9]+]], r[[OLD]], r0 262; CHECK-NEXT: stlex [[STATUS:r[0-9]+]], [[NEW]], [r[[ADDR]]] 263; CHECK-NEXT: cmp [[STATUS]], #0 264; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 265; CHECK-NOT: dmb 266; CHECK-NOT: mcr 267 268; CHECK: mov r0, r[[OLD]] 269 ret i32 %old 270} 271 272define void @test_atomic_load_and_i64(i64 %offset) nounwind { 273; CHECK-LABEL: test_atomic_load_and_i64: 274 %old = atomicrmw and i64* @var64, i64 %offset acquire 275; CHECK-NOT: dmb 276; CHECK-NOT: mcr 277; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var64 278; CHECK: movt r[[ADDR]], :upper16:var64 279 280; CHECK: .LBB{{[0-9]+}}_1: 281; CHECK: ldaexd r[[OLD1:[0-9]+]], r[[OLD2:[0-9]+]], [r[[ADDR]]] 282 ; r0, r1 below is a reasonable guess but could change: it certainly comes into the 283 ; function there. 284; CHECK-LE-DAG: and{{(\.w)?}} [[NEW1:r[0-9]+|lr]], r[[OLD1]], r0 285; CHECK-LE-DAG: and{{(\.w)?}} [[NEW2:r[0-9]+|lr]], r[[OLD2]], r1 286; CHECK-BE-DAG: and{{(\.w)?}} [[NEW2:r[0-9]+|lr]], r[[OLD2]], r1 287; CHECK-BE-DAG: and{{(\.w)?}} [[NEW1:r[0-9]+|lr]], r[[OLD1]], r0 288; CHECK: strexd [[STATUS:r[0-9]+]], [[NEW1]], [[NEW2]], [r[[ADDR]]] 289; CHECK-NEXT: cmp [[STATUS]], #0 290; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 291; CHECK-NOT: dmb 292; CHECK-NOT: mcr 293 294; CHECK: strd r[[OLD1]], r[[OLD2]], [r[[ADDR]]] 295 store i64 %old, i64* @var64 296 ret void 297} 298 299define i8 @test_atomic_load_or_i8(i8 %offset) nounwind { 300; CHECK-LABEL: test_atomic_load_or_i8: 301 %old = atomicrmw or i8* @var8, i8 %offset seq_cst 302; CHECK-NOT: dmb 303; CHECK-NOT: mcr 304; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var8 305; CHECK: movt r[[ADDR]], :upper16:var8 306 307; CHECK: .LBB{{[0-9]+}}_1: 308; CHECK: ldaexb r[[OLD:[0-9]+]], [r[[ADDR]]] 309 ; r0 below is a reasonable guess but could change: it certainly comes into the 310 ; function there. 311; CHECK-NEXT: orr{{(\.w)?}} [[NEW:r[0-9]+]], r[[OLD]], r0 312; CHECK-NEXT: stlexb [[STATUS:r[0-9]+]], [[NEW]], [r[[ADDR]]] 313; CHECK-NEXT: cmp [[STATUS]], #0 314; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 315; CHECK-NOT: dmb 316; CHECK-NOT: mcr 317 318; CHECK: mov r0, r[[OLD]] 319 ret i8 %old 320} 321 322define i16 @test_atomic_load_or_i16(i16 %offset) nounwind { 323; CHECK-LABEL: test_atomic_load_or_i16: 324 %old = atomicrmw or i16* @var16, i16 %offset monotonic 325; CHECK-NOT: dmb 326; CHECK-NOT: mcr 327; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var16 328; CHECK: movt r[[ADDR]], :upper16:var16 329 330; CHECK: .LBB{{[0-9]+}}_1: 331; CHECK: ldrexh r[[OLD:[0-9]+]], [r[[ADDR]]] 332 ; r0 below is a reasonable guess but could change: it certainly comes into the 333 ; function there. 334; CHECK-NEXT: orr{{(\.w)?}} [[NEW:r[0-9]+]], r[[OLD]], r0 335; CHECK-NEXT: strexh [[STATUS:r[0-9]+]], [[NEW]], [r[[ADDR]]] 336; CHECK-NEXT: cmp [[STATUS]], #0 337; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 338; CHECK-NOT: dmb 339; CHECK-NOT: mcr 340 341; CHECK: mov r0, r[[OLD]] 342 ret i16 %old 343} 344 345define i32 @test_atomic_load_or_i32(i32 %offset) nounwind { 346; CHECK-LABEL: test_atomic_load_or_i32: 347 %old = atomicrmw or i32* @var32, i32 %offset acquire 348; CHECK-NOT: dmb 349; CHECK-NOT: mcr 350; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var32 351; CHECK: movt r[[ADDR]], :upper16:var32 352 353; CHECK: .LBB{{[0-9]+}}_1: 354; CHECK: ldaex r[[OLD:[0-9]+]], [r[[ADDR]]] 355 ; r0 below is a reasonable guess but could change: it certainly comes into the 356 ; function there. 357; CHECK-NEXT: orr{{(\.w)?}} [[NEW:r[0-9]+]], r[[OLD]], r0 358; CHECK-NEXT: strex [[STATUS:r[0-9]+]], [[NEW]], [r[[ADDR]]] 359; CHECK-NEXT: cmp [[STATUS]], #0 360; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 361; CHECK-NOT: dmb 362; CHECK-NOT: mcr 363 364; CHECK: mov r0, r[[OLD]] 365 ret i32 %old 366} 367 368define void @test_atomic_load_or_i64(i64 %offset) nounwind { 369; CHECK-LABEL: test_atomic_load_or_i64: 370 %old = atomicrmw or i64* @var64, i64 %offset release 371; CHECK-NOT: dmb 372; CHECK-NOT: mcr 373; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var64 374; CHECK: movt r[[ADDR]], :upper16:var64 375 376; CHECK: .LBB{{[0-9]+}}_1: 377; CHECK: ldrexd r[[OLD1:[0-9]+]], r[[OLD2:[0-9]+]], [r[[ADDR]]] 378 ; r0, r1 below is a reasonable guess but could change: it certainly comes into the 379 ; function there. 380; CHECK-LE-DAG: orr{{(\.w)?}} [[NEW1:r[0-9]+|lr]], r[[OLD1]], r0 381; CHECK-LE-DAG: orr{{(\.w)?}} [[NEW2:r[0-9]+|lr]], r[[OLD2]], r1 382; CHECK-BE-DAG: orr{{(\.w)?}} [[NEW2:r[0-9]+|lr]], r[[OLD2]], r1 383; CHECK-BE-DAG: orr{{(\.w)?}} [[NEW1:r[0-9]+|lr]], r[[OLD1]], r0 384; CHECK: stlexd [[STATUS:r[0-9]+]], [[NEW1]], [[NEW2]], [r[[ADDR]]] 385; CHECK-NEXT: cmp [[STATUS]], #0 386; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 387; CHECK-NOT: dmb 388; CHECK-NOT: mcr 389 390; CHECK: strd r[[OLD1]], r[[OLD2]], [r[[ADDR]]] 391 store i64 %old, i64* @var64 392 ret void 393} 394 395define i8 @test_atomic_load_xor_i8(i8 %offset) nounwind { 396; CHECK-LABEL: test_atomic_load_xor_i8: 397 %old = atomicrmw xor i8* @var8, i8 %offset acquire 398; CHECK-NOT: dmb 399; CHECK-NOT: mcr 400; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var8 401; CHECK: movt r[[ADDR]], :upper16:var8 402 403; CHECK: .LBB{{[0-9]+}}_1: 404; CHECK: ldaexb r[[OLD:[0-9]+]], [r[[ADDR]]] 405 ; r0 below is a reasonable guess but could change: it certainly comes into the 406 ; function there. 407; CHECK-NEXT: eor{{(\.w)?}} [[NEW:r[0-9]+]], r[[OLD]], r0 408; CHECK-NEXT: strexb [[STATUS:r[0-9]+]], [[NEW]], [r[[ADDR]]] 409; CHECK-NEXT: cmp [[STATUS]], #0 410; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 411; CHECK-NOT: dmb 412; CHECK-NOT: mcr 413 414; CHECK: mov r0, r[[OLD]] 415 ret i8 %old 416} 417 418define i16 @test_atomic_load_xor_i16(i16 %offset) nounwind { 419; CHECK-LABEL: test_atomic_load_xor_i16: 420 %old = atomicrmw xor i16* @var16, i16 %offset release 421; CHECK-NOT: dmb 422; CHECK-NOT: mcr 423; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var16 424; CHECK: movt r[[ADDR]], :upper16:var16 425 426; CHECK: .LBB{{[0-9]+}}_1: 427; CHECK: ldrexh r[[OLD:[0-9]+]], [r[[ADDR]]] 428 ; r0 below is a reasonable guess but could change: it certainly comes into the 429 ; function there. 430; CHECK-NEXT: eor{{(\.w)?}} [[NEW:r[0-9]+]], r[[OLD]], r0 431; CHECK-NEXT: stlexh [[STATUS:r[0-9]+]], [[NEW]], [r[[ADDR]]] 432; CHECK-NEXT: cmp [[STATUS]], #0 433; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 434; CHECK-NOT: dmb 435; CHECK-NOT: mcr 436 437; CHECK: mov r0, r[[OLD]] 438 ret i16 %old 439} 440 441define i32 @test_atomic_load_xor_i32(i32 %offset) nounwind { 442; CHECK-LABEL: test_atomic_load_xor_i32: 443 %old = atomicrmw xor i32* @var32, i32 %offset seq_cst 444; CHECK-NOT: dmb 445; CHECK-NOT: mcr 446; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var32 447; CHECK: movt r[[ADDR]], :upper16:var32 448 449; CHECK: .LBB{{[0-9]+}}_1: 450; CHECK: ldaex r[[OLD:[0-9]+]], [r[[ADDR]]] 451 ; r0 below is a reasonable guess but could change: it certainly comes into the 452 ; function there. 453; CHECK-NEXT: eor{{(\.w)?}} [[NEW:r[0-9]+]], r[[OLD]], r0 454; CHECK-NEXT: stlex [[STATUS:r[0-9]+]], [[NEW]], [r[[ADDR]]] 455; CHECK-NEXT: cmp [[STATUS]], #0 456; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 457; CHECK-NOT: dmb 458; CHECK-NOT: mcr 459 460; CHECK: mov r0, r[[OLD]] 461 ret i32 %old 462} 463 464define void @test_atomic_load_xor_i64(i64 %offset) nounwind { 465; CHECK-LABEL: test_atomic_load_xor_i64: 466 %old = atomicrmw xor i64* @var64, i64 %offset monotonic 467; CHECK-NOT: dmb 468; CHECK-NOT: mcr 469; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var64 470; CHECK: movt r[[ADDR]], :upper16:var64 471 472; CHECK: .LBB{{[0-9]+}}_1: 473; CHECK: ldrexd r[[OLD1:[0-9]+]], r[[OLD2:[0-9]+]], [r[[ADDR]]] 474 ; r0, r1 below is a reasonable guess but could change: it certainly comes into the 475 ; function there. 476; CHECK-LE-DAG: eor{{(\.w)?}} [[NEW1:r[0-9]+|lr]], r[[OLD1]], r0 477; CHECK-LE-DAG: eor{{(\.w)?}} [[NEW2:r[0-9]+|lr]], r[[OLD2]], r1 478; CHECK-BE-DAG: eor{{(\.w)?}} [[NEW2:r[0-9]+|lr]], r[[OLD2]], r1 479; CHECK-BE-DAG: eor{{(\.w)?}} [[NEW1:r[0-9]+|lr]], r[[OLD1]], r0 480; CHECK: strexd [[STATUS:r[0-9]+]], [[NEW1]], [[NEW2]], [r[[ADDR]]] 481; CHECK-NEXT: cmp [[STATUS]], #0 482; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 483; CHECK-NOT: dmb 484; CHECK-NOT: mcr 485 486; CHECK: strd r[[OLD1]], r[[OLD2]], [r[[ADDR]]] 487 store i64 %old, i64* @var64 488 ret void 489} 490 491define i8 @test_atomic_load_xchg_i8(i8 %offset) nounwind { 492; CHECK-LABEL: test_atomic_load_xchg_i8: 493 %old = atomicrmw xchg i8* @var8, i8 %offset monotonic 494; CHECK-NOT: dmb 495; CHECK-NOT: mcr 496; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var8 497; CHECK: movt r[[ADDR]], :upper16:var8 498 499; CHECK: .LBB{{[0-9]+}}_1: 500; CHECK: ldrexb r[[OLD:[0-9]+]], [r[[ADDR]]] 501 ; r0 below is a reasonable guess but could change: it certainly comes into the 502 ; function there. 503; CHECK-NEXT: strexb [[STATUS:r[0-9]+]], r0, [r[[ADDR]]] 504; CHECK-NEXT: cmp [[STATUS]], #0 505; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 506; CHECK-NOT: dmb 507; CHECK-NOT: mcr 508 509; CHECK: mov r0, r[[OLD]] 510 ret i8 %old 511} 512 513define i16 @test_atomic_load_xchg_i16(i16 %offset) nounwind { 514; CHECK-LABEL: test_atomic_load_xchg_i16: 515 %old = atomicrmw xchg i16* @var16, i16 %offset seq_cst 516; CHECK-NOT: dmb 517; CHECK-NOT: mcr 518; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var16 519; CHECK: movt r[[ADDR]], :upper16:var16 520 521; CHECK: .LBB{{[0-9]+}}_1: 522; CHECK: ldaexh r[[OLD:[0-9]+]], [r[[ADDR]]] 523 ; r0 below is a reasonable guess but could change: it certainly comes into the 524 ; function there. 525; CHECK-NEXT: stlexh [[STATUS:r[0-9]+]], r0, [r[[ADDR]]] 526; CHECK-NEXT: cmp [[STATUS]], #0 527; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 528; CHECK-NOT: dmb 529; CHECK-NOT: mcr 530 531; CHECK: mov r0, r[[OLD]] 532 ret i16 %old 533} 534 535define i32 @test_atomic_load_xchg_i32(i32 %offset) nounwind { 536; CHECK-LABEL: test_atomic_load_xchg_i32: 537 %old = atomicrmw xchg i32* @var32, i32 %offset release 538; CHECK-NOT: dmb 539; CHECK-NOT: mcr 540; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var32 541; CHECK: movt r[[ADDR]], :upper16:var32 542 543; CHECK: .LBB{{[0-9]+}}_1: 544; CHECK: ldrex r[[OLD:[0-9]+]], [r[[ADDR]]] 545 ; r0 below is a reasonable guess but could change: it certainly comes into the 546 ; function there. 547; CHECK-NEXT: stlex [[STATUS:r[0-9]+]], r0, [r[[ADDR]]] 548; CHECK-NEXT: cmp [[STATUS]], #0 549; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 550; CHECK-NOT: dmb 551; CHECK-NOT: mcr 552 553; CHECK: mov r0, r[[OLD]] 554 ret i32 %old 555} 556 557define void @test_atomic_load_xchg_i64(i64 %offset) nounwind { 558; CHECK-LABEL: test_atomic_load_xchg_i64: 559 %old = atomicrmw xchg i64* @var64, i64 %offset acquire 560; CHECK-NOT: dmb 561; CHECK-NOT: mcr 562; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var64 563; CHECK: movt r[[ADDR]], :upper16:var64 564 565; CHECK: .LBB{{[0-9]+}}_1: 566; CHECK: ldaexd [[OLD1:r[0-9]+]], [[OLD2:r[0-9]+|lr]], [r[[ADDR]]] 567 ; r0, r1 below is a reasonable guess but could change: it certainly comes into the 568 ; function there. 569; CHECK-NEXT: strexd [[STATUS:r[0-9]+]], r0, r1, [r[[ADDR]]] 570; CHECK-NEXT: cmp [[STATUS]], #0 571; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 572; CHECK-NOT: dmb 573; CHECK-NOT: mcr 574 575; CHECK: strd [[OLD1]], [[OLD2]], [r[[ADDR]]] 576 store i64 %old, i64* @var64 577 ret void 578} 579 580define i8 @test_atomic_load_min_i8(i8 signext %offset) nounwind { 581; CHECK-LABEL: test_atomic_load_min_i8: 582 %old = atomicrmw min i8* @var8, i8 %offset acquire 583; CHECK-NOT: dmb 584; CHECK-NOT: mcr 585; CHECK-DAG: movw [[ADDR:r[0-9]+|lr]], :lower16:var8 586; CHECK-DAG: movt [[ADDR]], :upper16:var8 587 588; CHECK: .LBB{{[0-9]+}}_1: 589; CHECK: ldaexb r[[OLD:[0-9]+]], {{.*}}[[ADDR]] 590; CHECK-NEXT: sxtb r[[OLDX:[0-9]+]], r[[OLD]] 591 ; r0 below is a reasonable guess but could change: it certainly comes into the 592 ; function there. 593; CHECK-NEXT: cmp r[[OLDX]], r0 594; Thumb mode: it le 595; CHECK: movle r[[OLDX]], r[[OLD]] 596; CHECK-NEXT: strexb [[STATUS:r[0-9]+]], r[[OLDX]], {{.*}}[[ADDR]]] 597; CHECK-NEXT: cmp [[STATUS]], #0 598; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 599; CHECK-NOT: dmb 600; CHECK-NOT: mcr 601 602; CHECK: mov r0, r[[OLD]] 603 ret i8 %old 604} 605 606define i16 @test_atomic_load_min_i16(i16 signext %offset) nounwind { 607; CHECK-LABEL: test_atomic_load_min_i16: 608 %old = atomicrmw min i16* @var16, i16 %offset release 609; CHECK-NOT: dmb 610; CHECK-NOT: mcr 611; CHECK: movw [[ADDR:r[0-9]+|lr]], :lower16:var16 612; CHECK: movt [[ADDR]], :upper16:var16 613 614; CHECK: .LBB{{[0-9]+}}_1: 615; CHECK: ldrexh r[[OLD:[0-9]+]], {{.*}}[[ADDR]] 616; CHECK-NEXT: sxth r[[OLDX:[0-9]+]], r[[OLD]] 617 ; r0 below is a reasonable guess but could change: it certainly comes into the 618 ; function there. 619; CHECK-NEXT: cmp r[[OLDX]], r0 620; Thumb mode: it le 621; CHECK: movle r[[OLDX]], r[[OLD]] 622; CHECK-NEXT: stlexh [[STATUS:r[0-9]+]], r[[OLDX]], {{.*}}[[ADDR]] 623; CHECK-NEXT: cmp [[STATUS]], #0 624; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 625; CHECK-NOT: dmb 626; CHECK-NOT: mcr 627 628; CHECK: mov r0, r[[OLD]] 629 ret i16 %old 630} 631 632define i32 @test_atomic_load_min_i32(i32 %offset) nounwind { 633; CHECK-LABEL: test_atomic_load_min_i32: 634 %old = atomicrmw min i32* @var32, i32 %offset monotonic 635; CHECK-NOT: dmb 636; CHECK-NOT: mcr 637; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var32 638; CHECK: movt r[[ADDR]], :upper16:var32 639 640; CHECK: .LBB{{[0-9]+}}_1: 641; CHECK: ldrex r[[OLD:[0-9]+]], [r[[ADDR]]] 642 ; r0 below is a reasonable guess but could change: it certainly comes into the 643 ; function there. 644; CHECK-NEXT: mov r[[NEW:[0-9]+]], r0 645; CHECK-NEXT: cmp r[[OLD]], r0 646; Thumb mode: it le 647; CHECK: movle r[[NEW]], r[[OLD]] 648; CHECK-NEXT: strex [[STATUS:r[0-9]+]], r[[NEW]], [r[[ADDR]]] 649; CHECK-NEXT: cmp [[STATUS]], #0 650; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 651; CHECK-NOT: dmb 652; CHECK-NOT: mcr 653 654; CHECK: mov r0, r[[OLD]] 655 ret i32 %old 656} 657 658define void @test_atomic_load_min_i64(i64 %offset) nounwind { 659; CHECK-LABEL: test_atomic_load_min_i64: 660 %old = atomicrmw min i64* @var64, i64 %offset seq_cst 661; CHECK-NOT: dmb 662; CHECK-NOT: mcr 663; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var64 664; CHECK: movt r[[ADDR]], :upper16:var64 665 666; CHECK: .LBB{{[0-9]+}}_1: 667; CHECK: ldaexd [[OLD1:r[0-9]+|lr]], [[OLD2:r[0-9]+|lr]], [r[[ADDR]]] 668 ; r0, r1 below is a reasonable guess but could change: it certainly comes into the 669 ; function there. 670; CHECK-ARM: mov [[MINHI:r[0-9]+]], r1 671; CHECK-ARM-LE: subs {{[^,]+}}, r0, [[OLD1]] 672; CHECK-ARM-LE: sbcs {{[^,]+}}, r1, [[OLD2]] 673; CHECK-ARM-BE: subs {{[^,]+}}, r1, [[OLD2]] 674; CHECK-ARM-BE: sbcs {{[^,]+}}, r0, [[OLD1]] 675; CHECK-ARM: mov [[CMP:r[0-9]+|lr]], #0 676; CHECK-ARM: movwge [[CMP:r[0-9]+|lr]], #1 677; CHECK-ARM: cmp [[CMP:r[0-9]+|lr]], #0 678; CHECK-ARM: movne [[MINHI]], [[OLD2]] 679; CHECK-ARM: mov [[MINLO:r[0-9]+]], r0 680; CHECK-ARM: movne [[MINLO]], [[OLD1]] 681; CHECK-ARM: stlexd [[STATUS:r[0-9]+]], [[MINLO]], [[MINHI]], [r[[ADDR]]] 682; CHECK-THUMB: stlexd [[STATUS:r[0-9]+]], {{r[0-9]+}}, {{r[0-9]+}}, [r[[ADDR]]] 683; CHECK-NEXT: cmp [[STATUS]], #0 684; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 685; CHECK-NOT: dmb 686; CHECK-NOT: mcr 687 688; CHECK-ARM: strd [[OLD1]], [[OLD2]], [r[[ADDR]]] 689 store i64 %old, i64* @var64 690 ret void 691} 692 693define i8 @test_atomic_load_max_i8(i8 signext %offset) nounwind { 694; CHECK-LABEL: test_atomic_load_max_i8: 695 %old = atomicrmw max i8* @var8, i8 %offset seq_cst 696; CHECK-NOT: dmb 697; CHECK-NOT: mcr 698; CHECK: movw [[ADDR:r[0-9]+|lr]], :lower16:var8 699; CHECK: movt [[ADDR]], :upper16:var8 700 701; CHECK: .LBB{{[0-9]+}}_1: 702; CHECK: ldaexb r[[OLD:[0-9]+]], {{.*}}[[ADDR]] 703; CHECK-NEXT: sxtb r[[OLDX:[0-9]+]], r[[OLD]] 704 ; r0 below is a reasonable guess but could change: it certainly comes into the 705 ; function there. 706; CHECK-NEXT: cmp r[[OLDX]], r0 707; Thumb mode: it gt 708; CHECK: movgt r[[OLDX]], r[[OLD]] 709; CHECK-NEXT: stlexb [[STATUS:r[0-9]+]], r[[OLDX]], {{.*}}[[ADDR]] 710; CHECK-NEXT: cmp [[STATUS]], #0 711; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 712; CHECK-NOT: dmb 713; CHECK-NOT: mcr 714 715; CHECK: mov r0, r[[OLD]] 716 ret i8 %old 717} 718 719define i16 @test_atomic_load_max_i16(i16 signext %offset) nounwind { 720; CHECK-LABEL: test_atomic_load_max_i16: 721 %old = atomicrmw max i16* @var16, i16 %offset acquire 722; CHECK-NOT: dmb 723; CHECK-NOT: mcr 724; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var16 725; CHECK: movt r[[ADDR]], :upper16:var16 726 727; CHECK: .LBB{{[0-9]+}}_1: 728; CHECK: ldaexh r[[OLD:[0-9]+]], [r[[ADDR]]] 729; CHECK-NEXT: sxth r[[OLDX:[0-9]+]], r[[OLD]] 730 ; r0 below is a reasonable guess but could change: it certainly comes into the 731 ; function there. 732; CHECK-NEXT: cmp r[[OLDX]], r0 733; Thumb mode: it gt 734; CHECK: movgt r[[OLDX]], r[[OLD]] 735; CHECK-NEXT: strexh [[STATUS:r[0-9]+]], r[[OLDX]], [r[[ADDR]]] 736; CHECK-NEXT: cmp [[STATUS]], #0 737; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 738; CHECK-NOT: dmb 739; CHECK-NOT: mcr 740 741; CHECK: mov r0, r[[OLD]] 742 ret i16 %old 743} 744 745define i32 @test_atomic_load_max_i32(i32 %offset) nounwind { 746; CHECK-LABEL: test_atomic_load_max_i32: 747 %old = atomicrmw max i32* @var32, i32 %offset release 748; CHECK-NOT: dmb 749; CHECK-NOT: mcr 750; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var32 751; CHECK: movt r[[ADDR]], :upper16:var32 752 753; CHECK: .LBB{{[0-9]+}}_1: 754; CHECK: ldrex r[[OLD:[0-9]+]], [r[[ADDR]]] 755 ; r0 below is a reasonable guess but could change: it certainly comes into the 756 ; function there. 757; CHECK-NEXT: mov r[[NEW:[0-9]+]], r0 758; CHECK-NEXT: cmp r[[OLD]], r0 759; Thumb mode: it gt 760; CHECK: movgt r[[NEW]], r[[OLD]] 761; CHECK-NEXT: stlex [[STATUS:r[0-9]+]], r[[NEW]], [r[[ADDR]]] 762; CHECK-NEXT: cmp [[STATUS]], #0 763; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 764; CHECK-NOT: dmb 765; CHECK-NOT: mcr 766 767; CHECK: mov r0, r[[OLD]] 768 ret i32 %old 769} 770 771define void @test_atomic_load_max_i64(i64 %offset) nounwind { 772; CHECK-LABEL: test_atomic_load_max_i64: 773 %old = atomicrmw max i64* @var64, i64 %offset monotonic 774; CHECK-NOT: dmb 775; CHECK-NOT: mcr 776; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var64 777; CHECK: movt r[[ADDR]], :upper16:var64 778 779; CHECK: .LBB{{[0-9]+}}_1: 780; CHECK: ldrexd [[OLD1:r[0-9]+]], [[OLD2:r[0-9]+|lr]], [r[[ADDR]]] 781 ; r0, r1 below is a reasonable guess but could change: it certainly comes into the 782 ; function there. 783; CHECK-ARM: mov [[MINHI:r[0-9]+]], r1 784; CHECK-ARM-LE: subs {{[^,]+}}, r0, [[OLD1]] 785; CHECK-ARM-LE: sbcs {{[^,]+}}, r1, [[OLD2]] 786; CHECK-ARM-BE: subs {{[^,]+}}, r1, [[OLD2]] 787; CHECK-ARM-BE: sbcs {{[^,]+}}, r0, [[OLD1]] 788; CHECK-ARM: mov [[CMP:r[0-9]+|lr]], #0 789; CHECK-ARM: movwlt [[CMP:r[0-9]+|lr]], #1 790; CHECK-ARM: cmp [[CMP:r[0-9]+|lr]], #0 791; CHECK-ARM: movne [[MINHI]], [[OLD2]] 792; CHECK-ARM: mov [[MINLO:r[0-9]+]], r0 793; CHECK-ARM: movne [[MINLO]], [[OLD1]] 794; CHECK-ARM: strexd [[STATUS:r[0-9]+]], [[MINLO]], [[MINHI]], [r[[ADDR]]] 795; CHECK-THUMB: strexd [[STATUS:r[0-9]+]], {{r[0-9]+}}, {{r[0-9]+}}, [r[[ADDR]]] 796; CHECK-NEXT: cmp [[STATUS]], #0 797; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 798; CHECK-NOT: dmb 799; CHECK-NOT: mcr 800 801; CHECK-ARM: strd [[OLD1]], [[OLD2]], [r[[ADDR]]] 802 store i64 %old, i64* @var64 803 ret void 804} 805 806define i8 @test_atomic_load_umin_i8(i8 zeroext %offset) nounwind { 807; CHECK-LABEL: test_atomic_load_umin_i8: 808 %old = atomicrmw umin i8* @var8, i8 %offset monotonic 809; CHECK-NOT: dmb 810; CHECK-NOT: mcr 811; CHECK: movw [[ADDR:r[0-9]+|lr]], :lower16:var8 812; CHECK: movt [[ADDR]], :upper16:var8 813 814; CHECK: .LBB{{[0-9]+}}_1: 815; CHECK: ldrexb r[[OLD:[0-9]+]], {{.*}}[[ADDR]] 816 ; r0 below is a reasonable guess but could change: it certainly comes into the 817 ; function there. 818; CHECK-NEXT: mov r[[NEW:[0-9]+]], r0 819; CHECK-NEXT: cmp r[[OLD]], r0 820; Thumb mode: it ls 821; CHECK: movls r[[NEW]], r[[OLD]] 822; CHECK-NEXT: strexb [[STATUS:r[0-9]+]], r[[NEW]], {{.*}}[[ADDR]] 823; CHECK-NEXT: cmp [[STATUS]], #0 824; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 825; CHECK-NOT: dmb 826; CHECK-NOT: mcr 827 828; CHECK: mov r0, r[[OLD]] 829 ret i8 %old 830} 831 832define i16 @test_atomic_load_umin_i16(i16 zeroext %offset) nounwind { 833; CHECK-LABEL: test_atomic_load_umin_i16: 834 %old = atomicrmw umin i16* @var16, i16 %offset acquire 835; CHECK-NOT: dmb 836; CHECK-NOT: mcr 837; CHECK: movw [[ADDR:r[0-9]+|lr]], :lower16:var16 838; CHECK: movt [[ADDR]], :upper16:var16 839 840; CHECK: .LBB{{[0-9]+}}_1: 841; CHECK: ldaexh r[[OLD:[0-9]+]], {{.*}}[[ADDR]] 842 ; r0 below is a reasonable guess but could change: it certainly comes into the 843 ; function there. 844; CHECK-NEXT: mov r[[NEW:[0-9]+]], r0 845; CHECK-NEXT: cmp r[[OLD]], r0 846; Thumb mode: it ls 847; CHECK: movls r[[NEW]], r[[OLD]] 848; CHECK-NEXT: strexh [[STATUS:r[0-9]+]], r[[NEW]], {{.*}}[[ADDR]] 849; CHECK-NEXT: cmp [[STATUS]], #0 850; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 851; CHECK-NOT: dmb 852; CHECK-NOT: mcr 853 854; CHECK: mov r0, r[[OLD]] 855 ret i16 %old 856} 857 858define i32 @test_atomic_load_umin_i32(i32 %offset) nounwind { 859; CHECK-LABEL: test_atomic_load_umin_i32: 860 %old = atomicrmw umin i32* @var32, i32 %offset seq_cst 861; CHECK-NOT: dmb 862; CHECK-NOT: mcr 863; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var32 864; CHECK: movt r[[ADDR]], :upper16:var32 865 866; CHECK: .LBB{{[0-9]+}}_1: 867; CHECK: ldaex r[[OLD:[0-9]+]], [r[[ADDR]]] 868 ; r0 below is a reasonable guess but could change: it certainly comes into the 869 ; function there. 870; CHECK-NEXT: mov r[[NEW:[0-9]+]], r0 871; CHECK-NEXT: cmp r[[OLD]], r0 872; Thumb mode: it ls 873; CHECK: movls r[[NEW]], r[[OLD]] 874; CHECK-NEXT: stlex [[STATUS:r[0-9]+]], r[[NEW]], [r[[ADDR]]] 875; CHECK-NEXT: cmp [[STATUS]], #0 876; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 877; CHECK-NOT: dmb 878; CHECK-NOT: mcr 879 880; CHECK: mov r0, r[[OLD]] 881 ret i32 %old 882} 883 884define void @test_atomic_load_umin_i64(i64 %offset) nounwind { 885; CHECK-LABEL: test_atomic_load_umin_i64: 886 %old = atomicrmw umin i64* @var64, i64 %offset seq_cst 887; CHECK-NOT: dmb 888; CHECK-NOT: mcr 889; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var64 890; CHECK: movt r[[ADDR]], :upper16:var64 891 892; CHECK: .LBB{{[0-9]+}}_1: 893; CHECK: ldaexd [[OLD1:r[0-9]+|lr]], [[OLD2:r[0-9]+|lr]], [r[[ADDR]]] 894 ; r0, r1 below is a reasonable guess but could change: it certainly comes into the 895 ; function there. 896; CHECK-ARM: mov [[MINHI:r[0-9]+]], r1 897; CHECK-ARM-LE: subs {{[^,]+}}, r0, [[OLD1]] 898; CHECK-ARM-LE: sbcs {{[^,]+}}, r1, [[OLD2]] 899; CHECK-ARM-BE: subs {{[^,]+}}, r1, [[OLD2]] 900; CHECK-ARM-BE: sbcs {{[^,]+}}, r0, [[OLD1]] 901; CHECK-ARM: mov [[CMP:r[0-9]+|lr]], #0 902; CHECK-ARM: movwhs [[CMP:r[0-9]+|lr]], #1 903; CHECK-ARM: cmp [[CMP:r[0-9]+|lr]], #0 904; CHECK-ARM: movne [[MINHI]], [[OLD2]] 905; CHECK-ARM: mov [[MINLO:r[0-9]+]], r0 906; CHECK-ARM: movne [[MINLO]], [[OLD1]] 907; CHECK-ARM: stlexd [[STATUS:r[0-9]+]], [[MINLO]], [[MINHI]], [r[[ADDR]]] 908; CHECK-THUMB: stlexd [[STATUS:r[0-9]+]], {{r[0-9]+}}, {{r[0-9]+}}, [r[[ADDR]]] 909; CHECK-NEXT: cmp [[STATUS]], #0 910; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 911; CHECK-NOT: dmb 912; CHECK-NOT: mcr 913 914; CHECK-ARM: strd [[OLD1]], [[OLD2]], [r[[ADDR]]] 915 store i64 %old, i64* @var64 916 ret void 917} 918 919define i8 @test_atomic_load_umax_i8(i8 zeroext %offset) nounwind { 920; CHECK-LABEL: test_atomic_load_umax_i8: 921 %old = atomicrmw umax i8* @var8, i8 %offset acq_rel 922; CHECK-NOT: dmb 923; CHECK-NOT: mcr 924; CHECK: movw [[ADDR:r[0-9]+|lr]], :lower16:var8 925; CHECK: movt [[ADDR]], :upper16:var8 926 927; CHECK: .LBB{{[0-9]+}}_1: 928; CHECK: ldaexb r[[OLD:[0-9]+]], {{.*}}[[ADDR]] 929 ; r0 below is a reasonable guess but could change: it certainly comes into the 930 ; function there. 931; CHECK-NEXT: mov r[[NEW:[0-9]+]], r0 932; CHECK-NEXT: cmp r[[OLD]], r0 933; Thumb mode: it hi 934; CHECK: movhi r[[NEW]], r[[OLD]] 935; CHECK-NEXT: stlexb [[STATUS:r[0-9]+]], r[[NEW]], {{.*}}[[ADDR]] 936; CHECK-NEXT: cmp [[STATUS]], #0 937; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 938; CHECK-NOT: dmb 939; CHECK-NOT: mcr 940 941; CHECK: mov r0, r[[OLD]] 942 ret i8 %old 943} 944 945define i16 @test_atomic_load_umax_i16(i16 zeroext %offset) nounwind { 946; CHECK-LABEL: test_atomic_load_umax_i16: 947 %old = atomicrmw umax i16* @var16, i16 %offset monotonic 948; CHECK-NOT: dmb 949; CHECK-NOT: mcr 950; CHECK: movw [[ADDR:r[0-9]+|lr]], :lower16:var16 951; CHECK: movt [[ADDR]], :upper16:var16 952 953; CHECK: .LBB{{[0-9]+}}_1: 954; CHECK: ldrexh r[[OLD:[0-9]+]], {{.*}}[[ADDR]] 955 ; r0 below is a reasonable guess but could change: it certainly comes into the 956 ; function there. 957; CHECK-NEXT: mov r[[NEW:[0-9]+]], r0 958; CHECK-NEXT: cmp r[[OLD]], r0 959; Thumb mode: it hi 960; CHECK: movhi r[[NEW]], r[[OLD]] 961; CHECK-NEXT: strexh [[STATUS:r[0-9]+]], r[[NEW]], {{.*}}[[ADDR]] 962; CHECK-NEXT: cmp [[STATUS]], #0 963; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 964; CHECK-NOT: dmb 965; CHECK-NOT: mcr 966 967; CHECK: mov r0, r[[OLD]] 968 ret i16 %old 969} 970 971define i32 @test_atomic_load_umax_i32(i32 %offset) nounwind { 972; CHECK-LABEL: test_atomic_load_umax_i32: 973 %old = atomicrmw umax i32* @var32, i32 %offset seq_cst 974; CHECK-NOT: dmb 975; CHECK-NOT: mcr 976; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var32 977; CHECK: movt r[[ADDR]], :upper16:var32 978 979; CHECK: .LBB{{[0-9]+}}_1: 980; CHECK: ldaex r[[OLD:[0-9]+]], [r[[ADDR]]] 981 ; r0 below is a reasonable guess but could change: it certainly comes into the 982 ; function there. 983; CHECK-NEXT: mov r[[NEW:[0-9]+]], r0 984; CHECK-NEXT: cmp r[[OLD]], r0 985; Thumb mode: it hi 986; CHECK: movhi r[[NEW]], r[[OLD]] 987; CHECK-NEXT: stlex [[STATUS:r[0-9]+]], r[[NEW]], [r[[ADDR]]] 988; CHECK-NEXT: cmp [[STATUS]], #0 989; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 990; CHECK-NOT: dmb 991; CHECK-NOT: mcr 992 993; CHECK: mov r0, r[[OLD]] 994 ret i32 %old 995} 996 997define void @test_atomic_load_umax_i64(i64 %offset) nounwind { 998; CHECK-LABEL: test_atomic_load_umax_i64: 999 %old = atomicrmw umax i64* @var64, i64 %offset seq_cst 1000; CHECK-NOT: dmb 1001; CHECK-NOT: mcr 1002; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var64 1003; CHECK: movt r[[ADDR]], :upper16:var64 1004 1005; CHECK: .LBB{{[0-9]+}}_1: 1006; CHECK: ldaexd [[OLD1:r[0-9]+|lr]], [[OLD2:r[0-9]+|lr]], [r[[ADDR]]] 1007 ; r0, r1 below is a reasonable guess but could change: it certainly comes into the 1008 ; function there. 1009; CHECK-ARM: mov [[MINHI:r[0-9]+]], r1 1010; CHECK-ARM-LE: subs {{[^,]+}}, r0, [[OLD1]] 1011; CHECK-ARM-LE: sbcs {{[^,]+}}, r1, [[OLD2]] 1012; CHECK-ARM-BE: subs {{[^,]+}}, r1, [[OLD2]] 1013; CHECK-ARM-BE: sbcs {{[^,]+}}, r0, [[OLD1]] 1014; CHECK-ARM: mov [[CMP:r[0-9]+|lr]], #0 1015; CHECK-ARM: movwlo [[CMP:r[0-9]+|lr]], #1 1016; CHECK-ARM: cmp [[CMP:r[0-9]+|lr]], #0 1017; CHECK-ARM: movne [[MINHI]], [[OLD2]] 1018; CHECK-ARM: mov [[MINLO:r[0-9]+]], r0 1019; CHECK-ARM: movne [[MINLO]], [[OLD1]] 1020; CHECK-ARM: stlexd [[STATUS:r[0-9]+]], [[MINLO]], [[MINHI]], [r[[ADDR]]] 1021; CHECK-THUMB: stlexd [[STATUS:r[0-9]+]], {{r[0-9]+}}, {{r[0-9]+}}, [r[[ADDR]]] 1022; CHECK-NEXT: cmp [[STATUS]], #0 1023; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 1024; CHECK-NOT: dmb 1025; CHECK-NOT: mcr 1026 1027; CHECK-ARM: strd [[OLD1]], [[OLD2]], [r[[ADDR]]] 1028 store i64 %old, i64* @var64 1029 ret void 1030} 1031 1032define i8 @test_atomic_cmpxchg_i8(i8 zeroext %wanted, i8 zeroext %new) nounwind { 1033; CHECK-LABEL: test_atomic_cmpxchg_i8: 1034 %pair = cmpxchg i8* @var8, i8 %wanted, i8 %new acquire acquire 1035 %old = extractvalue { i8, i1 } %pair, 0 1036; CHECK-NOT: dmb 1037; CHECK-NOT: mcr 1038; CHECK-DAG: movw r[[ADDR:[0-9]+]], :lower16:var8 1039; CHECK-DAG: movt r[[ADDR]], :upper16:var8 1040; CHECK-THUMB-DAG: mov r[[WANTED:[0-9]+]], r0 1041 1042; CHECK: .LBB{{[0-9]+}}_1: 1043; CHECK: ldaexb r[[OLD:[0-9]+]], [r[[ADDR]]] 1044 ; r0 below is a reasonable guess but could change: it certainly comes into the 1045 ; function there. 1046; CHECK-ARM-NEXT: cmp r[[OLD]], r0 1047; CHECK-THUMB-NEXT: cmp r[[OLD]], r[[WANTED]] 1048; CHECK-NEXT: bne .LBB{{[0-9]+}}_4 1049; CHECK-NEXT: %bb.2: 1050 ; As above, r1 is a reasonable guess. 1051; CHECK: strexb [[STATUS:r[0-9]+]], r1, [r[[ADDR]]] 1052; CHECK-NEXT: cmp [[STATUS]], #0 1053; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 1054; CHECK-ARM: mov r0, r[[OLD]] 1055; CHECK: bx lr 1056; CHECK-NEXT: .LBB{{[0-9]+}}_4: 1057; CHECK-NEXT: clrex 1058; CHECK-NOT: dmb 1059; CHECK-NOT: mcr 1060 1061; CHECK-ARM: mov r0, r[[OLD]] 1062; CHECK-ARM-NEXT: bx lr 1063 ret i8 %old 1064} 1065 1066define i16 @test_atomic_cmpxchg_i16(i16 zeroext %wanted, i16 zeroext %new) nounwind { 1067; CHECK-LABEL: test_atomic_cmpxchg_i16: 1068 %pair = cmpxchg i16* @var16, i16 %wanted, i16 %new seq_cst seq_cst 1069 %old = extractvalue { i16, i1 } %pair, 0 1070; CHECK-NOT: dmb 1071; CHECK-NOT: mcr 1072; CHECK-DAG: movw r[[ADDR:[0-9]+]], :lower16:var16 1073; CHECK-DAG: movt r[[ADDR]], :upper16:var16 1074; CHECK-THUMB-DAG: mov r[[WANTED:[0-9]+]], r0 1075 1076; CHECK: .LBB{{[0-9]+}}_1: 1077; CHECK: ldaexh r[[OLD:[0-9]+]], [r[[ADDR]]] 1078 ; r0 below is a reasonable guess but could change: it certainly comes into the 1079 ; function there. 1080; CHECK-ARM-NEXT: cmp r[[OLD]], r0 1081; CHECK-THUMB-NEXT: cmp r[[OLD]], r[[WANTED]] 1082; CHECK-NEXT: bne .LBB{{[0-9]+}}_4 1083; CHECK-NEXT: %bb.2: 1084 ; As above, r1 is a reasonable guess. 1085; CHECK: stlexh [[STATUS:r[0-9]+]], r1, [r[[ADDR]]] 1086; CHECK-NEXT: cmp [[STATUS]], #0 1087; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 1088; CHECK-ARM: mov r0, r[[OLD]] 1089; CHECK: bx lr 1090; CHECK-NEXT: .LBB{{[0-9]+}}_4: 1091; CHECK-NEXT: clrex 1092; CHECK-NOT: dmb 1093; CHECK-NOT: mcr 1094 1095; CHECK-ARM: mov r0, r[[OLD]] 1096; CHECK-ARM-NEXT: bx lr 1097 ret i16 %old 1098} 1099 1100define void @test_atomic_cmpxchg_i32(i32 %wanted, i32 %new) nounwind { 1101; CHECK-LABEL: test_atomic_cmpxchg_i32: 1102 %pair = cmpxchg i32* @var32, i32 %wanted, i32 %new release monotonic 1103 %old = extractvalue { i32, i1 } %pair, 0 1104 store i32 %old, i32* @var32 1105; CHECK-NOT: dmb 1106; CHECK-NOT: mcr 1107; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var32 1108; CHECK: movt r[[ADDR]], :upper16:var32 1109 1110; CHECK: .LBB{{[0-9]+}}_1: 1111; CHECK: ldrex r[[OLD:[0-9]+]], [r[[ADDR]]] 1112 ; r0 below is a reasonable guess but could change: it certainly comes into the 1113 ; function there. 1114; CHECK-NEXT: cmp r[[OLD]], r0 1115; CHECK-NEXT: bne .LBB{{[0-9]+}}_4 1116; CHECK-NEXT: %bb.2: 1117 ; As above, r1 is a reasonable guess. 1118; CHECK: stlex [[STATUS:r[0-9]+]], r1, [r[[ADDR]]] 1119; CHECK-NEXT: cmp [[STATUS]], #0 1120; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 1121; CHECK: str{{(.w)?}} r[[OLD]], 1122; CHECK-NEXT: bx lr 1123; CHECK-NEXT: .LBB{{[0-9]+}}_4: 1124; CHECK-NEXT: clrex 1125; CHECK-NOT: dmb 1126; CHECK-NOT: mcr 1127 1128; CHECK: str{{(.w)?}} r[[OLD]], 1129; CHECK-ARM-NEXT: bx lr 1130 ret void 1131} 1132 1133define void @test_atomic_cmpxchg_i64(i64 %wanted, i64 %new) nounwind { 1134; CHECK-LABEL: test_atomic_cmpxchg_i64: 1135 %pair = cmpxchg i64* @var64, i64 %wanted, i64 %new monotonic monotonic 1136 %old = extractvalue { i64, i1 } %pair, 0 1137; CHECK-NOT: dmb 1138; CHECK-NOT: mcr 1139; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var64 1140; CHECK: movt r[[ADDR]], :upper16:var64 1141 1142; CHECK: .LBB{{[0-9]+}}_1: 1143; CHECK: ldrexd [[OLD1:r[0-9]+|lr]], [[OLD2:r[0-9]+|lr]], [r[[ADDR]]] 1144 ; r0, r1 below is a reasonable guess but could change: it certainly comes into the 1145 ; function there. 1146; CHECK-LE-DAG: eor{{(\.w)?}} [[MISMATCH_LO:r[0-9]+|lr]], [[OLD1]], r0 1147; CHECK-LE-DAG: eor{{(\.w)?}} [[MISMATCH_HI:r[0-9]+|lr]], [[OLD2]], r1 1148; CHECK-ARM-LE: orrs{{(\.w)?}} {{r[0-9]+}}, [[MISMATCH_LO]], [[MISMATCH_HI]] 1149; CHECK-THUMB-LE: orrs{{(\.w)?}} {{(r[0-9]+, )?}}[[MISMATCH_HI]], [[MISMATCH_LO]] 1150; CHECK-BE-DAG: eor{{(\.w)?}} [[MISMATCH_HI:r[0-9]+|lr]], [[OLD2]], r1 1151; CHECK-BE-DAG: eor{{(\.w)?}} [[MISMATCH_LO:r[0-9]+|lr]], [[OLD1]], r0 1152; CHECK-ARM-BE: orrs{{(\.w)?}} {{r[0-9]+}}, [[MISMATCH_HI]], [[MISMATCH_LO]] 1153; CHECK-THUMB-BE: orrs{{(\.w)?}} {{(r[0-9]+, )?}}[[MISMATCH_LO]], [[MISMATCH_HI]] 1154; CHECK-NEXT: bne .LBB{{[0-9]+}}_4 1155; CHECK-NEXT: %bb.2: 1156 ; As above, r2, r3 is a reasonable guess. 1157; CHECK: strexd [[STATUS:r[0-9]+]], r2, r3, [r[[ADDR]]] 1158; CHECK-NEXT: cmp [[STATUS]], #0 1159; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 1160; CHECK: strd [[OLD1]], [[OLD2]], [r[[ADDR]]] 1161; CHECK-NEXT: pop 1162; CHECK-NEXT: .LBB{{[0-9]+}}_4: 1163; CHECK-NEXT: clrex 1164; CHECK-NOT: dmb 1165; CHECK-NOT: mcr 1166 1167; CHECK-ARM: strd [[OLD1]], [[OLD2]], [r[[ADDR]]] 1168 store i64 %old, i64* @var64 1169 ret void 1170} 1171 1172define i8 @test_atomic_load_monotonic_i8() nounwind { 1173; CHECK-LABEL: test_atomic_load_monotonic_i8: 1174 %val = load atomic i8, i8* @var8 monotonic, align 1 1175; CHECK-NOT: dmb 1176; CHECK-NOT: mcr 1177; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var8 1178; CHECK: movt r[[ADDR]], :upper16:var8 1179; CHECK: ldrb r0, [r[[ADDR]]] 1180; CHECK-NOT: dmb 1181; CHECK-NOT: mcr 1182 1183 ret i8 %val 1184} 1185 1186define i8 @test_atomic_load_monotonic_regoff_i8(i64 %base, i64 %off) nounwind { 1187; CHECK-LABEL: test_atomic_load_monotonic_regoff_i8: 1188 %addr_int = add i64 %base, %off 1189 %addr = inttoptr i64 %addr_int to i8* 1190 1191 %val = load atomic i8, i8* %addr monotonic, align 1 1192; CHECK-NOT: dmb 1193; CHECK-NOT: mcr 1194; CHECK-LE: ldrb r0, [r0, r2] 1195; CHECK-BE: ldrb r0, [r1, r3] 1196; CHECK-NOT: dmb 1197; CHECK-NOT: mcr 1198 1199 ret i8 %val 1200} 1201 1202define i8 @test_atomic_load_acquire_i8() nounwind { 1203; CHECK-LABEL: test_atomic_load_acquire_i8: 1204 %val = load atomic i8, i8* @var8 acquire, align 1 1205; CHECK-NOT: dmb 1206; CHECK-NOT: mcr 1207; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var8 1208; CHECK-NOT: dmb 1209; CHECK-NOT: mcr 1210; CHECK: movt r[[ADDR]], :upper16:var8 1211; CHECK-NOT: dmb 1212; CHECK-NOT: mcr 1213; CHECK: ldab r0, [r[[ADDR]]] 1214; CHECK-NOT: dmb 1215; CHECK-NOT: mcr 1216 ret i8 %val 1217} 1218 1219define i8 @test_atomic_load_seq_cst_i8() nounwind { 1220; CHECK-LABEL: test_atomic_load_seq_cst_i8: 1221 %val = load atomic i8, i8* @var8 seq_cst, align 1 1222; CHECK-NOT: dmb 1223; CHECK-NOT: mcr 1224; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var8 1225; CHECK-NOT: dmb 1226; CHECK-NOT: mcr 1227; CHECK: movt r[[ADDR]], :upper16:var8 1228; CHECK-NOT: dmb 1229; CHECK-NOT: mcr 1230; CHECK: ldab r0, [r[[ADDR]]] 1231; CHECK-NOT: dmb 1232; CHECK-NOT: mcr 1233 ret i8 %val 1234} 1235 1236define i16 @test_atomic_load_monotonic_i16() nounwind { 1237; CHECK-LABEL: test_atomic_load_monotonic_i16: 1238 %val = load atomic i16, i16* @var16 monotonic, align 2 1239; CHECK-NOT: dmb 1240; CHECK-NOT: mcr 1241; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var16 1242; CHECK-NOT: dmb 1243; CHECK-NOT: mcr 1244; CHECK: movt r[[ADDR]], :upper16:var16 1245; CHECK-NOT: dmb 1246; CHECK-NOT: mcr 1247; CHECK: ldrh r0, [r[[ADDR]]] 1248; CHECK-NOT: dmb 1249; CHECK-NOT: mcr 1250 1251 ret i16 %val 1252} 1253 1254define i32 @test_atomic_load_monotonic_regoff_i32(i64 %base, i64 %off) nounwind { 1255; CHECK-LABEL: test_atomic_load_monotonic_regoff_i32: 1256 %addr_int = add i64 %base, %off 1257 %addr = inttoptr i64 %addr_int to i32* 1258 1259 %val = load atomic i32, i32* %addr monotonic, align 4 1260; CHECK-NOT: dmb 1261; CHECK-NOT: mcr 1262; CHECK-LE: ldr r0, [r0, r2] 1263; CHECK-BE: ldr r0, [r1, r3] 1264; CHECK-NOT: dmb 1265; CHECK-NOT: mcr 1266 1267 ret i32 %val 1268} 1269 1270define i64 @test_atomic_load_seq_cst_i64() nounwind { 1271; CHECK-LABEL: test_atomic_load_seq_cst_i64: 1272 %val = load atomic i64, i64* @var64 seq_cst, align 8 1273; CHECK-NOT: dmb 1274; CHECK-NOT: mcr 1275; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var64 1276; CHECK-NOT: dmb 1277; CHECK-NOT: mcr 1278; CHECK: movt r[[ADDR]], :upper16:var64 1279; CHECK-NOT: dmb 1280; CHECK-NOT: mcr 1281; CHECK: ldaexd r0, r1, [r[[ADDR]]] 1282; CHECK-NOT: dmb 1283; CHECK-NOT: mcr 1284 ret i64 %val 1285} 1286 1287define void @test_atomic_store_monotonic_i8(i8 %val) nounwind { 1288; CHECK-LABEL: test_atomic_store_monotonic_i8: 1289 store atomic i8 %val, i8* @var8 monotonic, align 1 1290; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var8 1291; CHECK: movt r[[ADDR]], :upper16:var8 1292; CHECK: strb r0, [r[[ADDR]]] 1293 1294 ret void 1295} 1296 1297define void @test_atomic_store_monotonic_regoff_i8(i64 %base, i64 %off, i8 %val) nounwind { 1298; CHECK-LABEL: test_atomic_store_monotonic_regoff_i8: 1299 1300 %addr_int = add i64 %base, %off 1301 %addr = inttoptr i64 %addr_int to i8* 1302 1303 store atomic i8 %val, i8* %addr monotonic, align 1 1304; CHECK-LE: ldr{{b?(\.w)?}} [[VAL:r[0-9]+]], [sp] 1305; CHECK-LE: strb [[VAL]], [r0, r2] 1306; CHECK-BE: ldrb{{(\.w)?}} [[VAL:r[0-9]+]], [sp, #3] 1307; CHECK-BE: strb [[VAL]], [r1, r3] 1308 1309 ret void 1310} 1311 1312define void @test_atomic_store_release_i8(i8 %val) nounwind { 1313; CHECK-LABEL: test_atomic_store_release_i8: 1314 store atomic i8 %val, i8* @var8 release, align 1 1315; CHECK-NOT: dmb 1316; CHECK-NOT: mcr 1317; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var8 1318; CHECK-NOT: dmb 1319; CHECK-NOT: mcr 1320; CHECK: movt r[[ADDR]], :upper16:var8 1321; CHECK-NOT: dmb 1322; CHECK-NOT: mcr 1323; CHECK: stlb r0, [r[[ADDR]]] 1324; CHECK-NOT: dmb 1325; CHECK-NOT: mcr 1326 ret void 1327} 1328 1329define void @test_atomic_store_seq_cst_i8(i8 %val) nounwind { 1330; CHECK-LABEL: test_atomic_store_seq_cst_i8: 1331 store atomic i8 %val, i8* @var8 seq_cst, align 1 1332; CHECK-NOT: dmb 1333; CHECK-NOT: mcr 1334; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var8 1335; CHECK-NOT: dmb 1336; CHECK-NOT: mcr 1337; CHECK: movt r[[ADDR]], :upper16:var8 1338; CHECK-NOT: dmb 1339; CHECK-NOT: mcr 1340; CHECK: stlb r0, [r[[ADDR]]] 1341; CHECK-NOT: dmb 1342; CHECK-NOT: mcr 1343 ret void 1344} 1345 1346define void @test_atomic_store_monotonic_i16(i16 %val) nounwind { 1347; CHECK-LABEL: test_atomic_store_monotonic_i16: 1348 store atomic i16 %val, i16* @var16 monotonic, align 2 1349; CHECK-NOT: dmb 1350; CHECK-NOT: mcr 1351; CHECK: movw r[[ADDR:[0-9]+]], :lower16:var16 1352; CHECK-NOT: dmb 1353; CHECK-NOT: mcr 1354; CHECK: movt r[[ADDR]], :upper16:var16 1355; CHECK-NOT: dmb 1356; CHECK-NOT: mcr 1357; CHECK: strh r0, [r[[ADDR]]] 1358; CHECK-NOT: dmb 1359; CHECK-NOT: mcr 1360 ret void 1361} 1362 1363define void @test_atomic_store_monotonic_regoff_i32(i64 %base, i64 %off, i32 %val) nounwind { 1364; CHECK-LABEL: test_atomic_store_monotonic_regoff_i32: 1365 1366 %addr_int = add i64 %base, %off 1367 %addr = inttoptr i64 %addr_int to i32* 1368 1369 store atomic i32 %val, i32* %addr monotonic, align 4 1370; CHECK-NOT: dmb 1371; CHECK-NOT: mcr 1372; CHECK: ldr [[VAL:r[0-9]+]], [sp] 1373; CHECK-NOT: dmb 1374; CHECK-NOT: mcr 1375; CHECK-LE: str [[VAL]], [r0, r2] 1376; CHECK-BE: str [[VAL]], [r1, r3] 1377; CHECK-NOT: dmb 1378; CHECK-NOT: mcr 1379 1380 ret void 1381} 1382 1383define void @test_atomic_store_release_i64(i64 %val) nounwind { 1384; CHECK-LABEL: test_atomic_store_release_i64: 1385 store atomic i64 %val, i64* @var64 release, align 8 1386; CHECK-NOT: dmb 1387; CHECK-NOT: mcr 1388; CHECK: movw [[ADDR:r[0-9]+|lr]], :lower16:var64 1389; CHECK: movt [[ADDR]], :upper16:var64 1390 1391; CHECK: .LBB{{[0-9]+}}_1: 1392 ; r0, r1 below is a reasonable guess but could change: it certainly comes into the 1393 ; function there. 1394; CHECK: stlexd [[STATUS:r[0-9]+]], r0, r1, {{.*}}[[ADDR]] 1395; CHECK-NEXT: cmp [[STATUS]], #0 1396; CHECK-NEXT: bne .LBB{{[0-9]+}}_1 1397; CHECK-NOT: dmb 1398; CHECK-NOT: mcr 1399 1400 ret void 1401} 1402 1403define i32 @not.barriers(i32* %var, i1 %cond) { 1404; CHECK-LABEL: not.barriers: 1405 br i1 %cond, label %atomic_ver, label %simple_ver 1406simple_ver: 1407 %oldval = load i32, i32* %var 1408 %newval = add nsw i32 %oldval, -1 1409 store i32 %newval, i32* %var 1410 br label %somewhere 1411atomic_ver: 1412 fence seq_cst 1413 %val = atomicrmw add i32* %var, i32 -1 monotonic 1414 fence seq_cst 1415 br label %somewhere 1416; CHECK: dmb 1417; CHECK: ldrex 1418; CHECK: dmb 1419 ; The key point here is that the second dmb isn't immediately followed by the 1420 ; simple_ver basic block, which LLVM attempted to do when DMB had been marked 1421 ; with isBarrier. For now, look for something that looks like "somewhere". 1422; CHECK-NEXT: {{mov|bx}} 1423somewhere: 1424 %combined = phi i32 [ %val, %atomic_ver ], [ %newval, %simple_ver] 1425 ret i32 %combined 1426} 1427