; tests_lit/llvm2ice_tests/vector-fcmp.ll - SwiftShader - Git at Google

 ; This file checks support for comparing vector values with the fcmp
 ; instruction.

 ; RUN: %p2i -i %s -a -O2 --verbose none \
 ; RUN:   | llvm-mc -triple=i686-none-nacl -filetype=obj \
 ; RUN:   | llvm-objdump -d --symbolize -x86-asm-syntax=intel - | FileCheck %s
 ; RUN: %p2i -i %s -a -Om1 --verbose none \
 ; RUN:   | llvm-mc -triple=i686-none-nacl -filetype=obj \
 ; RUN:   | llvm-objdump -d --symbolize -x86-asm-syntax=intel - | FileCheck %s

 ; Check that sext elimination occurs when the result of the comparison
 ; instruction is already sign extended.  Sign extension to 4 x i32 uses
 ; the pslld instruction.
 define <4 x i32> @sextElimination(<4 x float> %a, <4 x float> %b) {
 entry:
   ; Lane-wise ordered-equal comparison yielding a <4 x i1> mask.
   %cmp = fcmp oeq <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane; the directives below
   ; require that no pslld shows up after the cmpeqps.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: sextElimination:
 ; CHECK: cmpeqps
 ; CHECK-NOT: pslld
 }

 ; fcmp false: the predicate that never holds.  The expected output
 ; contains pxor.
 define <4 x i32> @fcmpFalseVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp false <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpFalseVector:
 ; CHECK: pxor
 }

 ; fcmp oeq (ordered and equal).  The expected output contains cmpeqps.
 define <4 x i32> @fcmpOeqVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp oeq <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpOeqVector:
 ; CHECK: cmpeqps
 }

 ; fcmp oge (ordered and greater than or equal).  The expected output
 ; contains cmpleps.
 ; NOTE(review): this is the same mnemonic the ole test expects, so the
 ; lowering presumably swaps the operands -- confirm.
 define <4 x i32> @fcmpOgeVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp oge <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpOgeVector:
 ; CHECK: cmpleps
 }

 ; fcmp ogt (ordered and greater than).  The expected output contains
 ; cmpltps.
 ; NOTE(review): this is the same mnemonic the olt test expects, so the
 ; lowering presumably swaps the operands -- confirm.
 define <4 x i32> @fcmpOgtVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp ogt <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpOgtVector:
 ; CHECK: cmpltps
 }

 ; fcmp ole (ordered and less than or equal).  The expected output
 ; contains cmpleps.
 define <4 x i32> @fcmpOleVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp ole <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpOleVector:
 ; CHECK: cmpleps
 }

 ; fcmp olt (ordered and less than).  The expected output contains
 ; cmpltps.
 define <4 x i32> @fcmpOltVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp olt <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpOltVector:
 ; CHECK: cmpltps
 }

 ; fcmp one (ordered and not equal).  The expected output contains, in
 ; this order, cmpneqps, cmpordps and pand.
 define <4 x i32> @fcmpOneVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp one <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpOneVector:
 ; CHECK: cmpneqps
 ; CHECK: cmpordps
 ; CHECK: pand
 }

 ; fcmp ord (neither operand is a NaN).  The expected output contains
 ; cmpordps.
 define <4 x i32> @fcmpOrdVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp ord <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpOrdVector:
 ; CHECK: cmpordps
 }

 ; fcmp true: the predicate that always holds.  The expected output
 ; contains pcmpeqd.
 define <4 x i32> @fcmpTrueVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp true <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpTrueVector:
 ; CHECK: pcmpeqd
 }

 ; fcmp ueq (unordered or equal).  The expected output contains, in this
 ; order, cmpeqps, cmpunordps and por.
 define <4 x i32> @fcmpUeqVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp ueq <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpUeqVector:
 ; CHECK: cmpeqps
 ; CHECK: cmpunordps
 ; CHECK: por
 }

 ; fcmp uge (unordered or greater than or equal).  The expected output
 ; contains cmpnltps.
 define <4 x i32> @fcmpUgeVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp uge <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpUgeVector:
 ; CHECK: cmpnltps
 }

 ; fcmp ugt (unordered or greater than).  The expected output contains
 ; cmpnleps.
 define <4 x i32> @fcmpUgtVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp ugt <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpUgtVector:
 ; CHECK: cmpnleps
 }

 ; fcmp ule (unordered or less than or equal).  The expected output
 ; contains cmpnltps.
 ; NOTE(review): this is the same mnemonic the uge test expects, so the
 ; lowering presumably swaps the operands -- confirm.
 define <4 x i32> @fcmpUleVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp ule <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpUleVector:
 ; CHECK: cmpnltps
 }

 ; fcmp ult (unordered or less than).  The expected output contains
 ; cmpnleps.
 ; NOTE(review): this is the same mnemonic the ugt test expects, so the
 ; lowering presumably swaps the operands -- confirm.
 define <4 x i32> @fcmpUltVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp ult <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpUltVector:
 ; CHECK: cmpnleps
 }

 ; fcmp une (unordered or not equal).  The expected output contains
 ; cmpneqps.
 define <4 x i32> @fcmpUneVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp une <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpUneVector:
 ; CHECK: cmpneqps
 }

 ; fcmp uno (at least one operand is a NaN).  The expected output
 ; contains cmpunordps.
 define <4 x i32> @fcmpUnoVector(<4 x float> %a, <4 x float> %b) {
 entry:
   %cmp = fcmp uno <4 x float> %a, %b
   ; Sign-extend each i1 lane to a full i32 lane.
   %ext = sext <4 x i1> %cmp to <4 x i32>
   ret <4 x i32> %ext
 ; CHECK-LABEL: fcmpUnoVector:
 ; CHECK: cmpunordps
 }
	; This file checks support for comparing vector values with the fcmp
	; instruction.

	; RUN: %p2i -i %s -a -O2 --verbose none \
	; RUN:   | llvm-mc -triple=i686-none-nacl -filetype=obj \
	; RUN:   | llvm-objdump -d --symbolize -x86-asm-syntax=intel - | FileCheck %s
	; RUN: %p2i -i %s -a -Om1 --verbose none \
	; RUN:   | llvm-mc -triple=i686-none-nacl -filetype=obj \
	; RUN:   | llvm-objdump -d --symbolize -x86-asm-syntax=intel - | FileCheck %s

	; Check that sext elimination occurs when the result of the comparison
	; instruction is already sign extended. Sign extension to 4 x i32 uses
	; the pslld instruction.
	define <4 x i32> @sextElimination(<4 x float> %a, <4 x float> %b) {
	entry:
	  ; Lane-wise ordered-equal comparison yielding a <4 x i1> mask.
	  %cmp = fcmp oeq <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane; the directives below
	  ; require that no pslld shows up after the cmpeqps.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: sextElimination:
	; CHECK: cmpeqps
	; CHECK-NOT: pslld
	}

	; fcmp false: the predicate that never holds.  The expected output
	; contains pxor.
	define <4 x i32> @fcmpFalseVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp false <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpFalseVector:
	; CHECK: pxor
	}

	; fcmp oeq (ordered and equal).  The expected output contains cmpeqps.
	define <4 x i32> @fcmpOeqVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp oeq <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpOeqVector:
	; CHECK: cmpeqps
	}

	; fcmp oge (ordered and greater than or equal).  The expected output
	; contains cmpleps.
	; NOTE(review): this is the same mnemonic the ole test expects, so the
	; lowering presumably swaps the operands -- confirm.
	define <4 x i32> @fcmpOgeVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp oge <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpOgeVector:
	; CHECK: cmpleps
	}

	; fcmp ogt (ordered and greater than).  The expected output contains
	; cmpltps.
	; NOTE(review): this is the same mnemonic the olt test expects, so the
	; lowering presumably swaps the operands -- confirm.
	define <4 x i32> @fcmpOgtVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp ogt <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpOgtVector:
	; CHECK: cmpltps
	}

	; fcmp ole (ordered and less than or equal).  The expected output
	; contains cmpleps.
	define <4 x i32> @fcmpOleVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp ole <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpOleVector:
	; CHECK: cmpleps
	}

	; fcmp olt (ordered and less than).  The expected output contains
	; cmpltps.
	define <4 x i32> @fcmpOltVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp olt <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpOltVector:
	; CHECK: cmpltps
	}

	; fcmp one (ordered and not equal).  The expected output contains, in
	; this order, cmpneqps, cmpordps and pand.
	define <4 x i32> @fcmpOneVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp one <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpOneVector:
	; CHECK: cmpneqps
	; CHECK: cmpordps
	; CHECK: pand
	}

	; fcmp ord (neither operand is a NaN).  The expected output contains
	; cmpordps.
	define <4 x i32> @fcmpOrdVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp ord <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpOrdVector:
	; CHECK: cmpordps
	}

	; fcmp true: the predicate that always holds.  The expected output
	; contains pcmpeqd.
	define <4 x i32> @fcmpTrueVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp true <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpTrueVector:
	; CHECK: pcmpeqd
	}

	; fcmp ueq (unordered or equal).  The expected output contains, in this
	; order, cmpeqps, cmpunordps and por.
	define <4 x i32> @fcmpUeqVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp ueq <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpUeqVector:
	; CHECK: cmpeqps
	; CHECK: cmpunordps
	; CHECK: por
	}

	; fcmp uge (unordered or greater than or equal).  The expected output
	; contains cmpnltps.
	define <4 x i32> @fcmpUgeVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp uge <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpUgeVector:
	; CHECK: cmpnltps
	}

	; fcmp ugt (unordered or greater than).  The expected output contains
	; cmpnleps.
	define <4 x i32> @fcmpUgtVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp ugt <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpUgtVector:
	; CHECK: cmpnleps
	}

	; fcmp ule (unordered or less than or equal).  The expected output
	; contains cmpnltps.
	; NOTE(review): this is the same mnemonic the uge test expects, so the
	; lowering presumably swaps the operands -- confirm.
	define <4 x i32> @fcmpUleVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp ule <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpUleVector:
	; CHECK: cmpnltps
	}

	; fcmp ult (unordered or less than).  The expected output contains
	; cmpnleps.
	; NOTE(review): this is the same mnemonic the ugt test expects, so the
	; lowering presumably swaps the operands -- confirm.
	define <4 x i32> @fcmpUltVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp ult <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpUltVector:
	; CHECK: cmpnleps
	}

	; fcmp une (unordered or not equal).  The expected output contains
	; cmpneqps.
	define <4 x i32> @fcmpUneVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp une <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpUneVector:
	; CHECK: cmpneqps
	}

	; fcmp uno (at least one operand is a NaN).  The expected output
	; contains cmpunordps.
	define <4 x i32> @fcmpUnoVector(<4 x float> %a, <4 x float> %b) {
	entry:
	  %cmp = fcmp uno <4 x float> %a, %b
	  ; Sign-extend each i1 lane to a full i32 lane.
	  %ext = sext <4 x i1> %cmp to <4 x i32>
	  ret <4 x i32> %ext
	; CHECK-LABEL: fcmpUnoVector:
	; CHECK: cmpunordps
	}