| ; RUN: opt -S -codegenprepare -mtriple=aarch64-linux %s | FileCheck -enable-var-scope %s |
| |
| ; Test for CodeGenPrepare::optimizeLoadExt(): simple case: two loads |
| ; feeding a phi that zext's each loaded value. |
| define i32 @test_free_zext(i32* %ptr, i32* %ptr2, i32 %c) { |
| ; CHECK-LABEL: @test_free_zext( |
| bb1: |
| ; CHECK: bb1: |
| ; CHECK: %[[T1:.*]] = load |
| ; CHECK: %[[A1:.*]] = and i32 %[[T1]], 65535 |
| %load1 = load i32, i32* %ptr, align 4 |
| %cmp = icmp ne i32 %c, 0 |
| br i1 %cmp, label %bb2, label %bb3 |
| bb2: |
| ; CHECK: bb2: |
| ; CHECK: %[[T2:.*]] = load |
| ; CHECK: %[[A2:.*]] = and i32 %[[T2]], 65535 |
| %load2 = load i32, i32* %ptr2, align 4 |
| br label %bb3 |
| bb3: |
| ; CHECK: bb3: |
| ; CHECK: phi i32 [ %[[A1]], %bb1 ], [ %[[A2]], %bb2 ] |
| %phi = phi i32 [ %load1, %bb1 ], [ %load2, %bb2 ] |
| %and = and i32 %phi, 65535 |
| ret i32 %and |
| } |
| |
| ; Test for CodeGenPrepare::optimizeLoadExt(): exercise all opcode |
| ; cases of active bit calculation. |
| define i32 @test_free_zext2(i32* %ptr, i16* %dst16, i32* %dst32, i32 %c) { |
| ; CHECK-LABEL: @test_free_zext2( |
| bb1: |
| ; CHECK: bb1: |
| ; CHECK: %[[T1:.*]] = load |
| ; CHECK: %[[A1:.*]] = and i32 %[[T1]], 65535 |
| %load1 = load i32, i32* %ptr, align 4 |
| %cmp = icmp ne i32 %c, 0 |
| br i1 %cmp, label %bb2, label %bb4 |
| bb2: |
| ; CHECK: bb2: |
| %trunc = trunc i32 %load1 to i16 |
| store i16 %trunc, i16* %dst16, align 2 |
| br i1 %cmp, label %bb3, label %bb4 |
| bb3: |
| ; CHECK: bb3: |
| %shl = shl i32 %load1, 16 |
| store i32 %shl, i32* %dst32, align 4 |
| br label %bb4 |
| bb4: |
| ; CHECK: bb4: |
| ; CHECK-NOT: and |
| ; CHECK: ret i32 %[[A1]] |
| %and = and i32 %load1, 65535 |
| ret i32 %and |
| } |
| |
| ; Test for CodeGenPrepare::optimizeLoadExt(): check case of zext-able |
| ; load feeding a phi in the same block. |
| define void @test_free_zext3(i32* %ptr, i32* %ptr2, i32* %dst, i64* %c) { |
| ; CHECK-LABEL: @test_free_zext3( |
| bb1: |
| ; CHECK: bb1: |
| ; CHECK: %[[T1:.*]] = load |
| ; CHECK: %[[A1:.*]] = and i32 %[[T1]], 65535 |
| %load1 = load i32, i32* %ptr, align 4 |
| br label %loop |
| loop: |
| ; CHECK: loop: |
| ; CHECK: phi i32 [ %[[A1]], %bb1 ], [ %[[A2:.*]], %loop ] |
| %phi = phi i32 [ %load1, %bb1 ], [ %load2, %loop ] |
| %and = and i32 %phi, 65535 |
| store i32 %and, i32* %dst, align 4 |
| %idx = load volatile i64, i64* %c, align 4 |
| %addr = getelementptr inbounds i32, i32* %ptr2, i64 %idx |
| ; CHECK: %[[T2:.*]] = load i32 |
| ; CHECK: %[[A2]] = and i32 %[[T2]], 65535 |
| %load2 = load i32, i32* %addr, align 4 |
| %cmp = icmp ne i64 %idx, 0 |
| br i1 %cmp, label %loop, label %end |
| end: |
| ret void |
| } |