; RUN: opt -S -early-cse < %s | FileCheck %s ; RUN: opt < %s -S -basicaa -early-cse-memssa | FileCheck %s ; NOTE: This file is testing the current implementation. Some of ; the transforms used as negative tests below would be legal, but ; only if reached through a chain of logic which EarlyCSE is incapable ; of performing. To say it differently, this file tests a conservative ; version of the memory model. If we want to extend EarlyCSE to be more ; aggressive in the future, we may need to relax some of the negative tests. ; We can value forward across the fence since we can (semantically) ; reorder the following load before the fence. define i32 @test(i32* %addr.i) { ; CHECK-LABEL: @test ; CHECK: store ; CHECK: fence ; CHECK-NOT: load ; CHECK: ret store i32 5, i32* %addr.i, align 4 fence release %a = load i32, i32* %addr.i, align 4 ret i32 %a } ; Same as above define i32 @test2(i32* noalias %addr.i, i32* noalias %otheraddr) { ; CHECK-LABEL: @test2 ; CHECK: load ; CHECK: fence ; CHECK-NOT: load ; CHECK: ret %a = load i32, i32* %addr.i, align 4 fence release %a2 = load i32, i32* %addr.i, align 4 %res = sub i32 %a, %a2 ret i32 %a } ; We can not value forward across an acquire barrier since we might ; be syncronizing with another thread storing to the same variable ; followed by a release fence. If this thread observed the release ; had happened, we must present a consistent view of memory at the ; fence. Note that it would be legal to reorder '%a' after the fence ; and then remove '%a2'. The current implementation doesn't know how ; to do this, but if it learned, this test will need revised. define i32 @test3(i32* noalias %addr.i, i32* noalias %otheraddr) { ; CHECK-LABEL: @test3 ; CHECK: load ; CHECK: fence ; CHECK: load ; CHECK: sub ; CHECK: ret %a = load i32, i32* %addr.i, align 4 fence acquire %a2 = load i32, i32* %addr.i, align 4 %res = sub i32 %a, %a2 ret i32 %res } ; We can not dead store eliminate accross the fence. We could in ; principal reorder the second store above the fence and then DSE either ; store, but this is beyond the simple last-store DSE which EarlyCSE ; implements. define void @test4(i32* %addr.i) { ; CHECK-LABEL: @test4 ; CHECK: store ; CHECK: fence ; CHECK: store ; CHECK: ret store i32 5, i32* %addr.i, align 4 fence release store i32 5, i32* %addr.i, align 4 ret void } ; We *could* DSE across this fence, but don't. No other thread can ; observe the order of the acquire fence and the store. define void @test5(i32* %addr.i) { ; CHECK-LABEL: @test5 ; CHECK: store ; CHECK: fence ; CHECK: store ; CHECK: ret store i32 5, i32* %addr.i, align 4 fence acquire store i32 5, i32* %addr.i, align 4 ret void }