; blob: 39f5a32fd372e74cf31923a58d22266e4cf67a96
; This tests Read-Modify-Write (RMW) detection and lowering at the O2
; optimization level.
; RUN: %if --need=target_X8632 --command %p2i --filetype=obj --disassemble \
; RUN: --target x8632 -i %s --args -O2 \
; RUN: | %if --need=target_X8632 --command FileCheck %s
; i32 read-modify-write with a variable operand: load from the address, add
; %var, and store the sum back to the same address. The sum has no other use.
define internal void @rmw_add_i32_var(i32 %addr_arg, i32 %var) {
entry:
  ; The address arrives as an i32 and is converted to a pointer here.
  %ptr = inttoptr i32 %addr_arg to i32*
  %old = load i32, i32* %ptr, align 1
  %sum = add i32 %old, %var
  store i32 %sum, i32* %ptr, align 1
  ret void
}
; Look for something like: add DWORD PTR [eax],ecx
; CHECK-LABEL: rmw_add_i32_var
; CHECK: add DWORD PTR [e{{ax|bx|cx|dx|bp|di|si}}],e{{ax|bx|cx|dx|bp|di|si}}
; i32 read-modify-write with a constant operand: load from the address, add
; the immediate 19 (0x13), and store the sum back to the same address.
define internal void @rmw_add_i32_imm(i32 %addr_arg) {
entry:
  %ptr = inttoptr i32 %addr_arg to i32*
  %old = load i32, i32* %ptr, align 1
  %sum = add i32 %old, 19
  store i32 %sum, i32* %ptr, align 1
  ret void
}
; Look for something like: add DWORD PTR [eax],0x13
; CHECK-LABEL: rmw_add_i32_imm
; CHECK: add DWORD PTR [e{{ax|bx|cx|dx|bp|di|si}}],0x13
; Same load/add/store shape as rmw_add_i32_var, but the sum is also returned.
; NOTE(review): the second use of the sum is presumably what prevents the
; memory-destination form; the expected output below is a register-destination
; add with a memory source operand.
define internal i32 @no_rmw_add_i32_var(i32 %addr_arg, i32 %var) {
entry:
  %ptr = inttoptr i32 %addr_arg to i32*
  %old = load i32, i32* %ptr, align 1
  %sum = add i32 %old, %var
  store i32 %sum, i32* %ptr, align 1
  ; The sum is used by the store above and by this return.
  ret i32 %sum
}
; CHECK-LABEL: no_rmw_add_i32_var
; CHECK: add e{{ax|bx|cx|dx|bp|di|si}},DWORD PTR [e{{ax|bx|cx|dx|bp|di|si}}]
; i16 read-modify-write with a variable operand. The operand is passed as an
; i32 and truncated to i16 before the add.
define internal void @rmw_add_i16_var(i32 %addr_arg, i32 %var32) {
entry:
  %narrow = trunc i32 %var32 to i16
  %ptr = inttoptr i32 %addr_arg to i16*
  %old = load i16, i16* %ptr, align 1
  %sum = add i16 %old, %narrow
  store i16 %sum, i16* %ptr, align 1
  ret void
}
; Look for something like: add WORD PTR [eax],cx
; CHECK-LABEL: rmw_add_i16_var
; CHECK: add WORD PTR [e{{ax|bx|cx|dx|bp|di|si}}],{{ax|bx|cx|dx|bp|di|si}}
; i16 read-modify-write with a constant operand: load from the address, add
; the immediate 19 (0x13), and store the sum back to the same address.
define internal void @rmw_add_i16_imm(i32 %addr_arg) {
entry:
  %ptr = inttoptr i32 %addr_arg to i16*
  %old = load i16, i16* %ptr, align 1
  %sum = add i16 %old, 19
  store i16 %sum, i16* %ptr, align 1
  ret void
}
; Look for something like: add WORD PTR [eax],0x13
; CHECK-LABEL: rmw_add_i16_imm
; CHECK: add WORD PTR [e{{ax|bx|cx|dx|bp|di|si}}],0x13
; i8 read-modify-write with a variable operand. The operand is passed as an
; i32 and truncated to i8 before the add.
define internal void @rmw_add_i8_var(i32 %addr_arg, i32 %var32) {
entry:
  %narrow = trunc i32 %var32 to i8
  %ptr = inttoptr i32 %addr_arg to i8*
  %old = load i8, i8* %ptr, align 1
  %sum = add i8 %old, %narrow
  store i8 %sum, i8* %ptr, align 1
  ret void
}
; Look for something like: add BYTE PTR [eax],cl
; CHECK-LABEL: rmw_add_i8_var
; CHECK: add BYTE PTR [e{{ax|bx|cx|dx|bp|di|si}}],{{al|bl|cl|dl}}
; i8 read-modify-write with a constant operand: load from the address, add
; the immediate 19 (0x13), and store the sum back to the same address.
define internal void @rmw_add_i8_imm(i32 %addr_arg) {
entry:
  %ptr = inttoptr i32 %addr_arg to i8*
  %old = load i8, i8* %ptr, align 1
  %sum = add i8 %old, 19
  store i8 %sum, i8* %ptr, align 1
  ret void
}
; Look for something like: add BYTE PTR [eax],0x13
; CHECK-LABEL: rmw_add_i8_imm
; CHECK: add BYTE PTR [e{{ax|bx|cx|dx|bp|di|si}}],0x13
; i32 read-modify-write where the address is computed as
; %addr_arg + 12 + %var * 4. The expected output below uses a single
; base+index*4+displacement memory operand for it.
define internal void @rmw_add_i32_var_addropt(i32 %addr_arg, i32 %var) {
entry:
  ; Address arithmetic: constant offset, scaled index, then their sum.
  %base_off = add i32 %addr_arg, 12
  %scaled_idx = mul i32 %var, 4
  %ea = add i32 %base_off, %scaled_idx
  %ptr = inttoptr i32 %ea to i32*
  ; %var is both the index in the address and the value being added.
  %old = load i32, i32* %ptr, align 1
  %sum = add i32 %old, %var
  store i32 %sum, i32* %ptr, align 1
  ret void
}
; Look for something like: add DWORD PTR [eax+ecx*4+0xc],ecx
; CHECK-LABEL: rmw_add_i32_var_addropt
; CHECK: add DWORD PTR [e{{..}}+e{{..}}*4+0xc],e{{ax|bx|cx|dx|bp|di|si}}
; Test for commutativity opportunities. This is the same as rmw_add_i32_var
; except with the "add" operands reversed.
define internal void @rmw_add_i32_var_comm(i32 %addr_arg, i32 %var) {
entry:
  %ptr = inttoptr i32 %addr_arg to i32*
  %old = load i32, i32* %ptr, align 1
  ; The loaded value is the SECOND operand of the add here.
  %sum = add i32 %var, %old
  store i32 %sum, i32* %ptr, align 1
  ret void
}
; Look for something like: add DWORD PTR [eax],ecx
; CHECK-LABEL: rmw_add_i32_var_comm
; CHECK: add DWORD PTR [e{{ax|bx|cx|dx|bp|di|si}}],e{{ax|bx|cx|dx|bp|di|si}}
; Test that commutativity isn't triggered for a non-commutative arithmetic
; operator (sub). This is the same as rmw_add_i32_var_comm except with a
; "sub" operation, and the result is also returned.
define internal i32 @no_rmw_sub_i32_var(i32 %addr_arg, i32 %var) {
entry:
  %ptr = inttoptr i32 %addr_arg to i32*
  %old = load i32, i32* %ptr, align 1
  ; Computes %var minus the loaded value, not the loaded value minus %var.
  %diff = sub i32 %var, %old
  store i32 %diff, i32* %ptr, align 1
  ; The difference is used by the store above and by this return.
  ret i32 %diff
}
; CHECK-LABEL: no_rmw_sub_i32_var
; CHECK: sub e{{ax|bx|cx|dx|bp|di|si}},DWORD PTR [e{{ax|bx|cx|dx|bp|di|si}}]
; i64 read-modify-write whose second add operand is undef. The expected
; output below is an add/adc pair on the two 32-bit halves (offsets 0 and
; 4), each with an immediate of 0x0.
define internal void @rmw_add_i64_undef(i32 %addr_arg) {
entry:
  %ptr = inttoptr i32 %addr_arg to i64*
  %old = load i64, i64* %ptr, align 1
  %sum = add i64 %old, undef
  store i64 %sum, i64* %ptr, align 1
  ret void
}
; CHECK-LABEL: rmw_add_i64_undef
; CHECK: add DWORD PTR [e{{ax|bx|cx|dx|bp|di|si}}],0x0
; CHECK: adc DWORD PTR [e{{ax|bx|cx|dx|bp|di|si}}+0x4],0x0