blob: 53fe89730f3aa81969afeb824920455b3c4cc5b8 [file] [log] [blame]
; RUN: llc -march=r600 -mcpu=redwood -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
; RUN: FileCheck --check-prefix=BUG64 %s < %t
; RUN: llc -march=r600 -mcpu=sumo -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
; RUN: FileCheck --check-prefix=BUG64 %s < %t
; RUN: llc -march=r600 -mcpu=barts -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
; RUN: FileCheck --check-prefix=BUG64 %s < %t
; RUN: llc -march=r600 -mcpu=turks -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
; RUN: FileCheck --check-prefix=BUG64 %s < %t
; RUN: llc -march=r600 -mcpu=caicos -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
; RUN: FileCheck --check-prefix=BUG64 %s < %t
; RUN: llc -march=r600 -mcpu=cedar -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
; RUN: FileCheck --check-prefix=BUG32 %s < %t
; RUN: llc -march=r600 -mcpu=juniper -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
; RUN: FileCheck --check-prefix=NOBUG %s < %t
; RUN: llc -march=r600 -mcpu=cypress -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
; RUN: FileCheck --check-prefix=NOBUG %s < %t
; RUN: llc -march=r600 -mcpu=cayman -debug-only=r600cf %s -o - 2>%t | FileCheck %s --check-prefix=FUNC
; RUN: FileCheck --check-prefix=NOBUG %s < %t
; REQUIRES: asserts
; We are currently allocating 2 extra sub-entries on Evergreen / NI for
; non-WQM push instructions if we change this to 1, then we will need to
; add one level of depth to each of these tests.
; BUG64-NOT: Applying bug work-around
; BUG32-NOT: Applying bug work-around
; NOBUG-NOT: Applying bug work-around
; FUNC-LABEL: {{^}}nested3:
define amdgpu_kernel void @nested3(i32 addrspace(1)* %out, i32 %cond) {
entry:
%0 = icmp sgt i32 %cond, 0
br i1 %0, label %if.1, label %end
if.1:
%1 = icmp sgt i32 %cond, 10
br i1 %1, label %if.2, label %if.store.1
if.store.1:
store i32 1, i32 addrspace(1)* %out
br label %end
if.2:
%2 = icmp sgt i32 %cond, 20
br i1 %2, label %if.3, label %if.2.store
if.2.store:
store i32 2, i32 addrspace(1)* %out
br label %end
if.3:
store i32 3, i32 addrspace(1)* %out
br label %end
end:
ret void
}
; BUG64: Applying bug work-around
; BUG32-NOT: Applying bug work-around
; NOBUG-NOT: Applying bug work-around
; FUNC-LABEL: {{^}}nested4:
define amdgpu_kernel void @nested4(i32 addrspace(1)* %out, i32 %cond) {
entry:
%0 = icmp sgt i32 %cond, 0
br i1 %0, label %if.1, label %end
if.1:
%1 = icmp sgt i32 %cond, 10
br i1 %1, label %if.2, label %if.1.store
if.1.store:
store i32 1, i32 addrspace(1)* %out
br label %end
if.2:
%2 = icmp sgt i32 %cond, 20
br i1 %2, label %if.3, label %if.2.store
if.2.store:
store i32 2, i32 addrspace(1)* %out
br label %end
if.3:
%3 = icmp sgt i32 %cond, 30
br i1 %3, label %if.4, label %if.3.store
if.3.store:
store i32 3, i32 addrspace(1)* %out
br label %end
if.4:
store i32 4, i32 addrspace(1)* %out
br label %end
end:
ret void
}
; BUG64: Applying bug work-around
; BUG32-NOT: Applying bug work-around
; NOBUG-NOT: Applying bug work-around
; FUNC-LABEL: {{^}}nested7:
define amdgpu_kernel void @nested7(i32 addrspace(1)* %out, i32 %cond) {
entry:
%0 = icmp sgt i32 %cond, 0
br i1 %0, label %if.1, label %end
if.1:
%1 = icmp sgt i32 %cond, 10
br i1 %1, label %if.2, label %if.1.store
if.1.store:
store i32 1, i32 addrspace(1)* %out
br label %end
if.2:
%2 = icmp sgt i32 %cond, 20
br i1 %2, label %if.3, label %if.2.store
if.2.store:
store i32 2, i32 addrspace(1)* %out
br label %end
if.3:
%3 = icmp sgt i32 %cond, 30
br i1 %3, label %if.4, label %if.3.store
if.3.store:
store i32 3, i32 addrspace(1)* %out
br label %end
if.4:
%4 = icmp sgt i32 %cond, 40
br i1 %4, label %if.5, label %if.4.store
if.4.store:
store i32 4, i32 addrspace(1)* %out
br label %end
if.5:
%5 = icmp sgt i32 %cond, 50
br i1 %5, label %if.6, label %if.5.store
if.5.store:
store i32 5, i32 addrspace(1)* %out
br label %end
if.6:
%6 = icmp sgt i32 %cond, 60
br i1 %6, label %if.7, label %if.6.store
if.6.store:
store i32 6, i32 addrspace(1)* %out
br label %end
if.7:
store i32 7, i32 addrspace(1)* %out
br label %end
end:
ret void
}
; BUG64: Applying bug work-around
; BUG32: Applying bug work-around
; NOBUG-NOT: Applying bug work-around
; FUNC-LABEL: {{^}}nested8:
define amdgpu_kernel void @nested8(i32 addrspace(1)* %out, i32 %cond) {
entry:
%0 = icmp sgt i32 %cond, 0
br i1 %0, label %if.1, label %end
if.1:
%1 = icmp sgt i32 %cond, 10
br i1 %1, label %if.2, label %if.1.store
if.1.store:
store i32 1, i32 addrspace(1)* %out
br label %end
if.2:
%2 = icmp sgt i32 %cond, 20
br i1 %2, label %if.3, label %if.2.store
if.2.store:
store i32 2, i32 addrspace(1)* %out
br label %end
if.3:
%3 = icmp sgt i32 %cond, 30
br i1 %3, label %if.4, label %if.3.store
if.3.store:
store i32 3, i32 addrspace(1)* %out
br label %end
if.4:
%4 = icmp sgt i32 %cond, 40
br i1 %4, label %if.5, label %if.4.store
if.4.store:
store i32 4, i32 addrspace(1)* %out
br label %end
if.5:
%5 = icmp sgt i32 %cond, 50
br i1 %5, label %if.6, label %if.5.store
if.5.store:
store i32 5, i32 addrspace(1)* %out
br label %end
if.6:
%6 = icmp sgt i32 %cond, 60
br i1 %6, label %if.7, label %if.6.store
if.6.store:
store i32 6, i32 addrspace(1)* %out
br label %end
if.7:
%7 = icmp sgt i32 %cond, 70
br i1 %7, label %if.8, label %if.7.store
if.7.store:
store i32 7, i32 addrspace(1)* %out
br label %end
if.8:
store i32 8, i32 addrspace(1)* %out
br label %end
end:
ret void
}