blob: 08e7d673a79c01c0b853e5373350089fb4faf578 [file] [log] [blame]
; Test the a=b*b lowering sequence which can use a single temporary register
; instead of two registers.
; RUN: %if --need=target_X8632 --command %p2i --filetype=obj --disassemble \
; RUN: --target x8632 -i %s --args -O2 -mattr=sse4.1 \
; RUN: | %if --need=target_X8632 --command FileCheck %s
; RUN: %if --need=target_X8632 --command %p2i --filetype=obj --disassemble \
; RUN: --target x8632 -i %s --args -Om1 -mattr=sse4.1 \
; RUN: | %if --need=target_X8632 --command FileCheck %s
; RUN: %if --need=target_MIPS32 --need=allow_dump \
; RUN: --command %p2i --filetype=asm --assemble --disassemble --target \
; RUN: mips32 -i %s --args -O2 -allow-externally-defined-symbols \
; RUN: | %if --need=target_MIPS32 --need=allow_dump \
; RUN: --command FileCheck --check-prefix MIPS32 %s
define internal float @Square_float(float %a) {
entry:
%result = fmul float %a, %a
ret float %result
}
; CHECK-LABEL: Square_float
; CHECK: mulss [[REG:xmm.]],[[REG]]
; MIPS32-LABEL: Square_float
; MIPS32: mov.s
; MIPS32: mul.s
define internal double @Square_double(double %a) {
entry:
%result = fmul double %a, %a
ret double %result
}
; CHECK-LABEL: Square_double
; CHECK: mulsd [[REG:xmm.]],[[REG]]
; MIPS32-LABEL: Square_double
; MIPS32: mov.d
; MIPS32: mul.d
define internal i32 @Square_i32(i32 %a) {
entry:
%result = mul i32 %a, %a
ret i32 %result
}
; CHECK-LABEL: Square_i32
; CHECK: imul [[REG:e..]],[[REG]]
; MIPS32-LABEL: Square_i32
; MIPS32: move
; MIPS32: mul
define internal i32 @Square_i16(i32 %a) {
entry:
%a.16 = trunc i32 %a to i16
%result = mul i16 %a.16, %a.16
%result.i32 = sext i16 %result to i32
ret i32 %result.i32
}
; CHECK-LABEL: Square_i16
; CHECK: imul [[REG:..]],[[REG]]
; MIPS32-LABEL: Square_i16
; MIPS32: move
; MIPS32: mul
; MIPS32: sll
; MIPS32: sra
define internal i32 @Square_i8(i32 %a) {
entry:
%a.8 = trunc i32 %a to i8
%result = mul i8 %a.8, %a.8
%result.i32 = sext i8 %result to i32
ret i32 %result.i32
}
; CHECK-LABEL: Square_i8
; CHECK: imul al
; MIPS32-LABEL: Square_i8
; MIPS32: move
; MIPS32: mul
; MIPS32: sll
; MIPS32: sra
define internal <4 x float> @Square_v4f32(<4 x float> %a) {
entry:
%result = fmul <4 x float> %a, %a
ret <4 x float> %result
}
; CHECK-LABEL: Square_v4f32
; CHECK: mulps [[REG:xmm.]],[[REG]]
define internal <4 x i32> @Square_v4i32(<4 x i32> %a) {
entry:
%result = mul <4 x i32> %a, %a
ret <4 x i32> %result
}
; CHECK-LABEL: Square_v4i32
; CHECK: pmulld [[REG:xmm.]],[[REG]]
define internal <8 x i16> @Square_v8i16(<8 x i16> %a) {
entry:
%result = mul <8 x i16> %a, %a
ret <8 x i16> %result
}
; CHECK-LABEL: Square_v8i16
; CHECK: pmullw [[REG:xmm.]],[[REG]]
define internal <16 x i8> @Square_v16i8(<16 x i8> %a) {
entry:
%result = mul <16 x i8> %a, %a
ret <16 x i8> %result
}
; CHECK-LABEL: Square_v16i8
; CHECK-NOT: pmul