| ; RUN: opt -S -codegenprepare -disable-complex-addr-modes=false -addr-sink-new-phis=true -addr-sink-new-select=true %s | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-YES |
| ; RUN: opt -S -codegenprepare -disable-complex-addr-modes=false -addr-sink-new-phis=false -addr-sink-new-select=true %s | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-NO |
| target datalayout = |
| "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128" |
| target triple = "x86_64-unknown-linux-gnu" |
| |
| ; Can we sink for different base if there is no phi for base? |
| define i32 @test1(i1 %cond, i64* %b1, i64* %b2) { |
| ; CHECK-LABEL: @test1 |
| entry: |
| %a1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %c1 = bitcast i64* %a1 to i32* |
| br i1 %cond, label %if.then, label %fallthrough |
| |
| if.then: |
| %a2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %c2 = bitcast i64* %a2 to i32* |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK-YES: sunk_phi |
| ; CHECK-NO-LABEL: fallthrough: |
| ; CHECK-NO: phi |
| ; CHECK-NO-NEXT: load |
| %c = phi i32* [%c1, %entry], [%c2, %if.then] |
| %v = load i32, i32* %c, align 4 |
| ret i32 %v |
| } |
| |
| ; Can we sink for different base if there is phi for base? |
| define i32 @test2(i1 %cond, i64* %b1, i64* %b2) { |
| ; CHECK-LABEL: @test2 |
| entry: |
| %a1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %c1 = bitcast i64* %a1 to i32* |
| br i1 %cond, label %if.then, label %fallthrough |
| |
| if.then: |
| %a2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %c2 = bitcast i64* %a2 to i32* |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK: getelementptr i8, {{.+}} 40 |
| %b = phi i64* [%b1, %entry], [%b2, %if.then] |
| %c = phi i32* [%c1, %entry], [%c2, %if.then] |
| %v = load i32, i32* %c, align 4 |
| ret i32 %v |
| } |
| |
| ; Can we sink for different base if there is phi for base but not valid one? |
| define i32 @test3(i1 %cond, i64* %b1, i64* %b2) { |
| ; CHECK-LABEL: @test3 |
| entry: |
| %a1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %c1 = bitcast i64* %a1 to i32* |
| br i1 %cond, label %if.then, label %fallthrough |
| |
| if.then: |
| %a2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %c2 = bitcast i64* %a2 to i32* |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK-YES: sunk_phi |
| ; CHECK-NO-LABEL: fallthrough: |
| ; CHECK-NO: phi |
| ; CHECK-NO: phi |
| ; CHECK-NO-NEXT: load |
| %b = phi i64* [%b2, %entry], [%b1, %if.then] |
| %c = phi i32* [%c1, %entry], [%c2, %if.then] |
| %v = load i32, i32* %c, align 4 |
| ret i32 %v |
| } |
| |
| ; Can we sink for different base if both addresses are in the same block? |
| define i32 @test4(i1 %cond, i64* %b1, i64* %b2) { |
| ; CHECK-LABEL: @test4 |
| entry: |
| %a1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %c1 = bitcast i64* %a1 to i32* |
| %a2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %c2 = bitcast i64* %a2 to i32* |
| br i1 %cond, label %if.then, label %fallthrough |
| |
| if.then: |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK-YES: sunk_phi |
| ; CHECK-NO-LABEL: fallthrough: |
| ; CHECK-NO: phi |
| ; CHECK-NO-NEXT: load |
| %c = phi i32* [%c1, %entry], [%c2, %if.then] |
| %v = load i32, i32* %c, align 4 |
| ret i32 %v |
| } |
| |
| ; Can we sink for different base if there is phi for base? |
| ; Both addresses are in the same block. |
| define i32 @test5(i1 %cond, i64* %b1, i64* %b2) { |
| ; CHECK-LABEL: @test5 |
| entry: |
| %a1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %c1 = bitcast i64* %a1 to i32* |
| %a2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %c2 = bitcast i64* %a2 to i32* |
| br i1 %cond, label %if.then, label %fallthrough |
| |
| if.then: |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK: getelementptr i8, {{.+}} 40 |
| %b = phi i64* [%b1, %entry], [%b2, %if.then] |
| %c = phi i32* [%c1, %entry], [%c2, %if.then] |
| %v = load i32, i32* %c, align 4 |
| ret i32 %v |
| } |
| |
| ; Can we sink for different base if there is phi for base but not valid one? |
| ; Both addresses are in the same block. |
| define i32 @test6(i1 %cond, i64* %b1, i64* %b2) { |
| ; CHECK-LABEL: @test6 |
| entry: |
| %a1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %c1 = bitcast i64* %a1 to i32* |
| %a2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %c2 = bitcast i64* %a2 to i32* |
| br i1 %cond, label %if.then, label %fallthrough |
| |
| if.then: |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK-YES: sunk_phi |
| ; CHECK-NO-LABEL: fallthrough: |
| ; CHECK-NO: phi |
| ; CHECK-NO-NEXT: phi |
| ; CHECK-NO-NEXT: load |
| %b = phi i64* [%b2, %entry], [%b1, %if.then] |
| %c = phi i32* [%c1, %entry], [%c2, %if.then] |
| %v = load i32, i32* %c, align 4 |
| ret i32 %v |
| } |
| |
| ; case with a loop. No phi node. |
| define i32 @test7(i32 %N, i1 %cond, i64* %b1, i64* %b2) { |
| ; CHECK-LABEL: @test7 |
| entry: |
| %a1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %c1 = bitcast i64* %a1 to i32* |
| br label %loop |
| |
| loop: |
| ; CHECK-LABEL: loop: |
| ; CHECK-YES: sunk_phi |
| %iv = phi i32 [0, %entry], [%iv.inc, %fallthrough] |
| %c3 = phi i32* [%c1, %entry], [%c, %fallthrough] |
| br i1 %cond, label %if.then, label %fallthrough |
| |
| if.then: |
| %a2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %c2 = bitcast i64* %a2 to i32* |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK-YES: sunk_phi |
| ; CHECK-NO-LABEL: fallthrough: |
| ; CHECK-NO: phi |
| ; CHECK-NO-NEXT: load |
| %c = phi i32* [%c3, %loop], [%c2, %if.then] |
| %v = load volatile i32, i32* %c, align 4 |
| %iv.inc = add i32 %iv, 1 |
| %cmp = icmp slt i32 %iv.inc, %N |
| br i1 %cmp, label %loop, label %exit |
| |
| exit: |
| ret i32 %v |
| } |
| |
| ; case with a loop. There is phi node. |
| define i32 @test8(i32 %N, i1 %cond, i64* %b1, i64* %b2) { |
| ; CHECK-LABEL: @test8 |
| entry: |
| %a1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %c1 = bitcast i64* %a1 to i32* |
| br label %loop |
| |
| loop: |
| %iv = phi i32 [0, %entry], [%iv.inc, %fallthrough] |
| %c3 = phi i32* [%c1, %entry], [%c, %fallthrough] |
| %b3 = phi i64* [%b1, %entry], [%b, %fallthrough] |
| br i1 %cond, label %if.then, label %fallthrough |
| |
| if.then: |
| %a2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %c2 = bitcast i64* %a2 to i32* |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK: getelementptr i8, {{.+}} 40 |
| %c = phi i32* [%c3, %loop], [%c2, %if.then] |
| %b = phi i64* [%b3, %loop], [%b2, %if.then] |
| %v = load volatile i32, i32* %c, align 4 |
| %iv.inc = add i32 %iv, 1 |
| %cmp = icmp slt i32 %iv.inc, %N |
| br i1 %cmp, label %loop, label %exit |
| |
| exit: |
| ret i32 %v |
| } |
| |
| ; case with a loop. There is phi node but it does not fit. |
| define i32 @test9(i32 %N, i1 %cond, i64* %b1, i64* %b2) { |
| ; CHECK-LABEL: @test9 |
| entry: |
| %a1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %c1 = bitcast i64* %a1 to i32* |
| br label %loop |
| |
| loop: |
| ; CHECK-LABEL: loop: |
| ; CHECK-YES: sunk_phi |
| %iv = phi i32 [0, %entry], [%iv.inc, %fallthrough] |
| %c3 = phi i32* [%c1, %entry], [%c, %fallthrough] |
| %b3 = phi i64* [%b1, %entry], [%b2, %fallthrough] |
| br i1 %cond, label %if.then, label %fallthrough |
| |
| if.then: |
| %a2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %c2 = bitcast i64* %a2 to i32* |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK-YES: sunk_phi |
| ; CHECK-NO-LABEL: fallthrough: |
| ; CHECK-NO: phi |
| ; CHECK-NO-NEXT: phi |
| ; CHECK-NO-NEXT: load |
| %c = phi i32* [%c3, %loop], [%c2, %if.then] |
| %b = phi i64* [%b3, %loop], [%b2, %if.then] |
| %v = load volatile i32, i32* %c, align 4 |
| %iv.inc = add i32 %iv, 1 |
| %cmp = icmp slt i32 %iv.inc, %N |
| br i1 %cmp, label %loop, label %exit |
| |
| exit: |
| ret i32 %v |
| } |
| |
| ; Case through a loop. No phi node. |
| define i32 @test10(i32 %N, i1 %cond, i64* %b1, i64* %b2) { |
| ; CHECK-LABEL: @test10 |
| entry: |
| %a1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %c1 = bitcast i64* %a1 to i32* |
| br i1 %cond, label %if.then, label %fallthrough |
| |
| if.then: |
| %a2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %c2 = bitcast i64* %a2 to i32* |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK-YES: sunk_phi |
| ; CHECK-NO-LABEL: fallthrough: |
| ; CHECK-NO-NEXT: phi |
| ; CHECK-NO-NEXT: br |
| %c = phi i32* [%c1, %entry], [%c2, %if.then] |
| br label %loop |
| |
| loop: |
| %iv = phi i32 [0, %fallthrough], [%iv.inc, %loop] |
| %iv.inc = add i32 %iv, 1 |
| %cmp = icmp slt i32 %iv.inc, %N |
| br i1 %cmp, label %loop, label %exit |
| |
| exit: |
| ; CHECK-YES: sunkaddr |
| %v = load volatile i32, i32* %c, align 4 |
| ret i32 %v |
| } |
| |
| ; Case through a loop. There is a phi. |
| define i32 @test11(i32 %N, i1 %cond, i64* %b1, i64* %b2) { |
| ; CHECK-LABEL: @test11 |
| entry: |
| %a1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %c1 = bitcast i64* %a1 to i32* |
| br i1 %cond, label %if.then, label %fallthrough |
| |
| if.then: |
| %a2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %c2 = bitcast i64* %a2 to i32* |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK: phi |
| ; CHECK: phi |
| ; CHECK: br |
| %c = phi i32* [%c1, %entry], [%c2, %if.then] |
| %b = phi i64* [%b1, %entry], [%b2, %if.then] |
| br label %loop |
| |
| loop: |
| %iv = phi i32 [0, %fallthrough], [%iv.inc, %loop] |
| %iv.inc = add i32 %iv, 1 |
| %cmp = icmp slt i32 %iv.inc, %N |
| br i1 %cmp, label %loop, label %exit |
| |
| exit: |
| ; CHECK: sunkaddr |
| %v = load volatile i32, i32* %c, align 4 |
| ret i32 %v |
| } |
| |
| ; Complex case with address value from previous iteration. |
| define i32 @test12(i32 %N, i1 %cond, i64* %b1, i64* %b2, i64* %b3) { |
| ; CHECK-LABEL: @test12 |
| entry: |
| %a1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %c1 = bitcast i64* %a1 to i32* |
| br label %loop |
| |
| loop: |
| ; CHECK-LABEL: loop: |
| ; CHECK-YES: sunk_phi |
| ; CHECK-NO: phi |
| ; CHECK-NO-NEXT: phi |
| ; CHECK-NO-NEXT: phi |
| ; CHECK-NO-NEXT: br |
| %iv = phi i32 [0, %entry], [%iv.inc, %backedge] |
| %c3 = phi i32* [%c1, %entry], [%c, %backedge] |
| %b4 = phi i64* [%b1, %entry], [%b5, %backedge] |
| br i1 %cond, label %if.then, label %fallthrough |
| |
| if.then: |
| %a2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %c2 = bitcast i64* %a2 to i32* |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK-LABEL: fallthrough: |
| ; CHECK-YES: sunk_phi |
| ; CHECK-NO: phi |
| ; CHECK-NO-NEXT: phi |
| ; CHECK-NO-NEXT: load |
| %c = phi i32* [%c3, %loop], [%c2, %if.then] |
| %b6 = phi i64* [%b4, %loop], [%b2, %if.then] |
| %v = load volatile i32, i32* %c, align 4 |
| %a4 = getelementptr inbounds i64, i64* %b4, i64 5 |
| %c4 = bitcast i64* %a4 to i32* |
| %cmp = icmp slt i32 %iv, 20 |
| br i1 %cmp, label %backedge, label %if.then.2 |
| |
| if.then.2: |
| br label %backedge |
| |
| backedge: |
| %b5 = phi i64* [%b4, %fallthrough], [%b6, %if.then.2] |
| %iv.inc = add i32 %iv, 1 |
| %cmp2 = icmp slt i32 %iv.inc, %N |
| br i1 %cmp2, label %loop, label %exit |
| |
| exit: |
| ret i32 %v |
| } |
| |
| %struct.S = type {i32, i32} |
| ; Case with index |
| define i32 @test13(i1 %cond, %struct.S* %b1, %struct.S* %b2, i64 %Index) { |
| ; CHECK-LABEL: @test13 |
| entry: |
| %a1 = getelementptr inbounds %struct.S, %struct.S* %b1, i64 %Index, i32 1 |
| br i1 %cond, label %if.then, label %fallthrough |
| |
| if.then: |
| %i2 = mul i64 %Index, 2 |
| %a2 = getelementptr inbounds %struct.S, %struct.S* %b2, i64 %Index, i32 1 |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK-YES: sunk_phi |
| ; CHECK-NO-LABEL: fallthrough: |
| ; CHECK-NO-NEXT: phi |
| ; CHECK-NO-NEXT: load |
| %a = phi i32* [%a1, %entry], [%a2, %if.then] |
| %v = load i32, i32* %a, align 4 |
| ret i32 %v |
| } |
| |
| ; Select of Select case. |
| define i64 @test14(i1 %c1, i1 %c2, i64* %b1, i64* %b2, i64* %b3) { |
| ; CHECK-LABEL: @test14 |
| entry: |
| ; CHECK-LABEL: entry: |
| %g1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %g2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %g3 = getelementptr inbounds i64, i64* %b3, i64 5 |
| %s1 = select i1 %c1, i64* %g1, i64* %g2 |
| %s2 = select i1 %c2, i64* %s1, i64* %g3 |
| ; CHECK: sunkaddr |
| %v = load i64 , i64* %s2, align 8 |
| ret i64 %v |
| } |
| |
| ; Select of Phi case. |
| define i64 @test15(i1 %c1, i1 %c2, i64* %b1, i64* %b2, i64* %b3) { |
| ; CHECK-LABEL: @test15 |
| entry: |
| %g1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %g2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %g3 = getelementptr inbounds i64, i64* %b3, i64 5 |
| br i1 %c1, label %if.then, label %fallthrough |
| |
| if.then: |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK-LABEL: fallthrough: |
| %p1 = phi i64* [%g1, %entry], [%g2, %if.then] |
| %s1 = select i1 %c2, i64* %p1, i64* %g3 |
| ; CHECK-YES: sunkaddr |
| ; CHECK-NO: phi |
| ; CHECK-NO-NEXT: select |
| ; CHECK-NO-NEXT: load |
| %v = load i64 , i64* %s1, align 8 |
| ret i64 %v |
| } |
| |
| ; Select of Phi case. Phi exists |
| define i64 @test16(i1 %c1, i1 %c2, i64* %b1, i64* %b2, i64* %b3) { |
| ; CHECK-LABEL: @test16 |
| entry: |
| %g1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %g2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %g3 = getelementptr inbounds i64, i64* %b3, i64 5 |
| br i1 %c1, label %if.then, label %fallthrough |
| |
| if.then: |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK-LABEL: fallthrough: |
| %p = phi i64* [%b1, %entry], [%b2, %if.then] |
| %p1 = phi i64* [%g1, %entry], [%g2, %if.then] |
| %s1 = select i1 %c2, i64* %p1, i64* %g3 |
| ; CHECK: sunkaddr |
| %v = load i64 , i64* %s1, align 8 |
| ret i64 %v |
| } |
| |
| ; Phi of Select case. |
| define i64 @test17(i1 %c1, i1 %c2, i64* %b1, i64* %b2, i64* %b3) { |
| ; CHECK-LABEL: @test17 |
| entry: |
| %g1 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %g2 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %g3 = getelementptr inbounds i64, i64* %b3, i64 5 |
| %s1 = select i1 %c2, i64* %g1, i64* %g2 |
| br i1 %c1, label %if.then, label %fallthrough |
| |
| if.then: |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK-LABEL: fallthrough: |
| %p1 = phi i64* [%s1, %entry], [%g3, %if.then] |
| ; CHECK-YES: sunkaddr |
| ; CHECK-NO: phi |
| ; CHECK-NO-NEXT: load |
| %v = load i64 , i64* %p1, align 8 |
| ret i64 %v |
| } |
| |
| ; The same two addr modes by different paths |
| define i32 @test18(i1 %cond1, i1 %cond2, i64* %b1, i64* %b2) { |
| ; CHECK-LABEL: @test18 |
| entry: |
| %g1 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %bc1 = bitcast i64* %g1 to i32* |
| br i1 %cond1, label %if.then1, label %if.then2 |
| |
| if.then1: |
| %g2 = getelementptr inbounds i64, i64* %b1, i64 5 |
| %bc2 = bitcast i64* %g2 to i32* |
| br label %fallthrough |
| |
| if.then2: |
| %bc1_1 = bitcast i64* %g1 to i32* |
| br i1 %cond2, label %fallthrough, label %if.then3 |
| |
| if.then3: |
| %bc1_2 = bitcast i64* %g1 to i32* |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK-YES: sunk_phi |
| ; CHECK-NO-LABEL: fallthrough: |
| ; CHECK-NO: phi |
| ; CHECK-NO-NEXT: load |
| %c = phi i32* [%bc2, %if.then1], [%bc1_1, %if.then2], [%bc1_2, %if.then3] |
| %v1 = load i32, i32* %c, align 4 |
| %g1_1 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %bc1_1_1 = bitcast i64* %g1_1 to i32* |
| %v2 = load i32, i32* %bc1_1_1, align 4 |
| %v = add i32 %v1, %v2 |
| ret i32 %v |
| } |
| |
| ; Different types but null is the first? |
| define i32 @test19(i1 %cond1, i1 %cond2, i64* %b2, i8* %b1) { |
| ; CHECK-LABEL: @test19 |
| entry: |
| %g1 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %bc1 = bitcast i64* %g1 to i32* |
| br i1 %cond1, label %if.then1, label %if.then2 |
| |
| if.then1: |
| %g2 = getelementptr inbounds i8, i8* %b1, i64 40 |
| %bc2 = bitcast i8* %g2 to i32* |
| br label %fallthrough |
| |
| if.then2: |
| %bc1_1 = bitcast i64* %g1 to i32* |
| br i1 %cond2, label %fallthrough, label %if.then3 |
| |
| if.then3: |
| %g3 = getelementptr inbounds i64, i64* null, i64 5 |
| %bc1_2 = bitcast i64* %g3 to i32* |
| br label %fallthrough |
| |
| fallthrough: |
| ; CHECK-NOT: sunk_phi |
| %c = phi i32* [%bc2, %if.then1], [%bc1_1, %if.then2], [%bc1_2, %if.then3] |
| %v1 = load i32, i32* %c, align 4 |
| %g1_1 = getelementptr inbounds i64, i64* %b2, i64 5 |
| %bc1_1_1 = bitcast i64* %g1_1 to i32* |
| %v2 = load i32, i32* %bc1_1_1, align 4 |
| %v = add i32 %v1, %v2 |
| ret i32 %v |
| } |