| ; This tests Read-Modify-Write (RMW) detection and lowering at the O2 |
| ; optimization level. |
| |
| ; RUN: %if --need=target_X8632 --command %p2i --filetype=obj --disassemble \ |
| ; RUN: --target x8632 -i %s --args -O2 \ |
| ; RUN: | %if --need=target_X8632 --command FileCheck %s |
| |
| define internal void @rmw_add_i32_var(i32 %addr_arg, i32 %var) { |
| entry: |
| %addr = inttoptr i32 %addr_arg to i32* |
| %val = load i32, i32* %addr, align 1 |
| %rmw = add i32 %val, %var |
| store i32 %rmw, i32* %addr, align 1 |
| ret void |
| } |
| ; Look for something like: add DWORD PTR [eax],ecx |
| ; CHECK-LABEL: rmw_add_i32_var |
| ; CHECK: add DWORD PTR [e{{ax|bx|cx|dx|bp|di|si}}],e{{ax|bx|cx|dx|bp|di|si}} |
| |
| define internal void @rmw_add_i32_imm(i32 %addr_arg) { |
| entry: |
| %addr = inttoptr i32 %addr_arg to i32* |
| %val = load i32, i32* %addr, align 1 |
| %rmw = add i32 %val, 19 |
| store i32 %rmw, i32* %addr, align 1 |
| ret void |
| } |
| ; Look for something like: add DWORD PTR [eax],0x13 |
| ; CHECK-LABEL: rmw_add_i32_imm |
| ; CHECK: add DWORD PTR [e{{ax|bx|cx|dx|bp|di|si}}],0x13 |
| |
| define internal i32 @no_rmw_add_i32_var(i32 %addr_arg, i32 %var) { |
| entry: |
| %addr = inttoptr i32 %addr_arg to i32* |
| %val = load i32, i32* %addr, align 1 |
| %rmw = add i32 %val, %var |
| store i32 %rmw, i32* %addr, align 1 |
| ret i32 %rmw |
| } |
| ; CHECK-LABEL: no_rmw_add_i32_var |
| ; CHECK: add e{{ax|bx|cx|dx|bp|di|si}},DWORD PTR [e{{ax|bx|cx|dx|bp|di|si}}] |
| |
| define internal void @rmw_add_i16_var(i32 %addr_arg, i32 %var32) { |
| entry: |
| %var = trunc i32 %var32 to i16 |
| %addr = inttoptr i32 %addr_arg to i16* |
| %val = load i16, i16* %addr, align 1 |
| %rmw = add i16 %val, %var |
| store i16 %rmw, i16* %addr, align 1 |
| ret void |
| } |
| ; Look for something like: add WORD PTR [eax],cx |
| ; CHECK-LABEL: rmw_add_i16_var |
| ; CHECK: add WORD PTR [e{{ax|bx|cx|dx|bp|di|si}}],{{ax|bx|cx|dx|bp|di|si}} |
| |
| define internal void @rmw_add_i16_imm(i32 %addr_arg) { |
| entry: |
| %addr = inttoptr i32 %addr_arg to i16* |
| %val = load i16, i16* %addr, align 1 |
| %rmw = add i16 %val, 19 |
| store i16 %rmw, i16* %addr, align 1 |
| ret void |
| } |
| ; Look for something like: add WORD PTR [eax],0x13 |
| ; CHECK-LABEL: rmw_add_i16_imm |
| ; CHECK: add WORD PTR [e{{ax|bx|cx|dx|bp|di|si}}],0x13 |
| |
| define internal void @rmw_add_i8_var(i32 %addr_arg, i32 %var32) { |
| entry: |
| %var = trunc i32 %var32 to i8 |
| %addr = inttoptr i32 %addr_arg to i8* |
| %val = load i8, i8* %addr, align 1 |
| %rmw = add i8 %val, %var |
| store i8 %rmw, i8* %addr, align 1 |
| ret void |
| } |
| ; Look for something like: add BYTE PTR [eax],cl |
| ; CHECK-LABEL: rmw_add_i8_var |
| ; CHECK: add BYTE PTR [e{{ax|bx|cx|dx|bp|di|si}}],{{al|bl|cl|dl}} |
| |
| define internal void @rmw_add_i8_imm(i32 %addr_arg) { |
| entry: |
| %addr = inttoptr i32 %addr_arg to i8* |
| %val = load i8, i8* %addr, align 1 |
| %rmw = add i8 %val, 19 |
| store i8 %rmw, i8* %addr, align 1 |
| ret void |
| } |
| ; Look for something like: add BYTE PTR [eax],0x13 |
| ; CHECK-LABEL: rmw_add_i8_imm |
| ; CHECK: add BYTE PTR [e{{ax|bx|cx|dx|bp|di|si}}],0x13 |
| |
| define internal void @rmw_add_i32_var_addropt(i32 %addr_arg, i32 %var) { |
| entry: |
| %addr_arg_plus_12 = add i32 %addr_arg, 12 |
| %var_times_4 = mul i32 %var, 4 |
| %addr_base = add i32 %addr_arg_plus_12 , %var_times_4 |
| %addr = inttoptr i32 %addr_base to i32* |
| %val = load i32, i32* %addr, align 1 |
| %rmw = add i32 %val, %var |
| store i32 %rmw, i32* %addr, align 1 |
| ret void |
| } |
| ; Look for something like: add DWORD PTR [eax+ecx*4+12],ecx |
| ; CHECK-LABEL: rmw_add_i32_var_addropt |
| ; CHECK: add DWORD PTR [e{{..}}+e{{..}}*4+0xc],e{{ax|bx|cx|dx|bp|di|si}} |
| |
| ; Test for commutativity opportunities. This is the same as rmw_add_i32_var |
| ; except with the "add" operands reversed. |
| define internal void @rmw_add_i32_var_comm(i32 %addr_arg, i32 %var) { |
| entry: |
| %addr = inttoptr i32 %addr_arg to i32* |
| %val = load i32, i32* %addr, align 1 |
| %rmw = add i32 %var, %val |
| store i32 %rmw, i32* %addr, align 1 |
| ret void |
| } |
| ; Look for something like: add DWORD PTR [eax],ecx |
| ; CHECK-LABEL: rmw_add_i32_var_comm |
| ; CHECK: add DWORD PTR [e{{ax|bx|cx|dx|bp|di|si}}],e{{ax|bx|cx|dx|bp|di|si}} |
| |
| ; Test that commutativity isn't triggered for a non-commutative arithmetic |
| ; operator (sub). This is the same as rmw_add_i32_var_comm except with a |
| ; "sub" operation. |
| define internal i32 @no_rmw_sub_i32_var(i32 %addr_arg, i32 %var) { |
| entry: |
| %addr = inttoptr i32 %addr_arg to i32* |
| %val = load i32, i32* %addr, align 1 |
| %rmw = sub i32 %var, %val |
| store i32 %rmw, i32* %addr, align 1 |
| ret i32 %rmw |
| } |
| ; CHECK-LABEL: no_rmw_sub_i32_var |
| ; CHECK: sub e{{ax|bx|cx|dx|bp|di|si}},DWORD PTR [e{{ax|bx|cx|dx|bp|di|si}}] |
| |
| define internal void @rmw_add_i64_undef(i32 %addr_arg) { |
| entry: |
| %addr = inttoptr i32 %addr_arg to i64* |
| %val = load i64, i64* %addr, align 1 |
| %rmw = add i64 %val, undef |
| store i64 %rmw, i64* %addr, align 1 |
| ret void |
| } |
| ; CHECK-LABEL: rmw_add_i64_undef |
| ; CHECK: add DWORD PTR [e{{ax|bx|cx|dx|bp|di|si}}],0x0 |
| ; CHECK: adc DWORD PTR [e{{ax|bx|cx|dx|bp|di|si}}+0x4],0x0 |