; third_party/llvm-7.0/llvm/test/CodeGen/X86/combine-64bit-vec-binop.ll - SwiftShader - Git at Google

 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=sse4.1 | FileCheck %s --check-prefix=SSE41

 ; 64-bit integer add: both doubles are reinterpreted as <2 x i32>, added
 ; lane-wise, and the sum is reinterpreted as double. Expected lowering is a
 ; single paddd.
 define double @test1_add(double %A, double %B) {
 ; SSE41-LABEL: test1_add:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    paddd %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <2 x i32>
   %rhs = bitcast double %B to <2 x i32>
   %sum = add <2 x i32> %lhs, %rhs
   %res = bitcast <2 x i32> %sum to double
   ret double %res
 }

 ; 64-bit integer add: both doubles are reinterpreted as <4 x i16>, added
 ; lane-wise, and the sum is reinterpreted as double. Expected lowering is a
 ; single paddw.
 define double @test2_add(double %A, double %B) {
 ; SSE41-LABEL: test2_add:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    paddw %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <4 x i16>
   %rhs = bitcast double %B to <4 x i16>
   %sum = add <4 x i16> %lhs, %rhs
   %res = bitcast <4 x i16> %sum to double
   ret double %res
 }

 ; 64-bit integer add: both doubles are reinterpreted as <8 x i8>, added
 ; lane-wise, and the sum is reinterpreted as double. Expected lowering is a
 ; single paddb.
 define double @test3_add(double %A, double %B) {
 ; SSE41-LABEL: test3_add:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    paddb %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <8 x i8>
   %rhs = bitcast double %B to <8 x i8>
   %sum = add <8 x i8> %lhs, %rhs
   %res = bitcast <8 x i8> %sum to double
   ret double %res
 }

 ; 64-bit integer subtract: both doubles are reinterpreted as <2 x i32>, %B's
 ; lanes are subtracted from %A's, and the difference is reinterpreted as
 ; double. Expected lowering is a single psubd.
 define double @test1_sub(double %A, double %B) {
 ; SSE41-LABEL: test1_sub:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    psubd %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <2 x i32>
   %rhs = bitcast double %B to <2 x i32>
   %diff = sub <2 x i32> %lhs, %rhs
   %res = bitcast <2 x i32> %diff to double
   ret double %res
 }

 ; 64-bit integer subtract: both doubles are reinterpreted as <4 x i16>, %B's
 ; lanes are subtracted from %A's, and the difference is reinterpreted as
 ; double. Expected lowering is a single psubw.
 define double @test2_sub(double %A, double %B) {
 ; SSE41-LABEL: test2_sub:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    psubw %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <4 x i16>
   %rhs = bitcast double %B to <4 x i16>
   %diff = sub <4 x i16> %lhs, %rhs
   %res = bitcast <4 x i16> %diff to double
   ret double %res
 }

 ; 64-bit integer subtract: both doubles are reinterpreted as <8 x i8>, %B's
 ; lanes are subtracted from %A's, and the difference is reinterpreted as
 ; double. Expected lowering is a single psubb.
 define double @test3_sub(double %A, double %B) {
 ; SSE41-LABEL: test3_sub:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    psubb %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <8 x i8>
   %rhs = bitcast double %B to <8 x i8>
   %diff = sub <8 x i8> %lhs, %rhs
   %res = bitcast <8 x i8> %diff to double
   ret double %res
 }

 ; 64-bit integer multiply: both doubles are reinterpreted as <2 x i32>,
 ; multiplied lane-wise, and the product is reinterpreted as double. Expected
 ; lowering is a single pmulld.
 define double @test1_mul(double %A, double %B) {
 ; SSE41-LABEL: test1_mul:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    pmulld %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <2 x i32>
   %rhs = bitcast double %B to <2 x i32>
   %prod = mul <2 x i32> %lhs, %rhs
   %res = bitcast <2 x i32> %prod to double
   ret double %res
 }

 ; 64-bit integer multiply: both doubles are reinterpreted as <4 x i16>,
 ; multiplied lane-wise, and the product is reinterpreted as double. Expected
 ; lowering is a single pmullw.
 define double @test2_mul(double %A, double %B) {
 ; SSE41-LABEL: test2_mul:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    pmullw %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <4 x i16>
   %rhs = bitcast double %B to <4 x i16>
   %prod = mul <4 x i16> %lhs, %rhs
   %res = bitcast <4 x i16> %prod to double
   ret double %res
 }

 ; There is no legal ISD::MUL with type MVT::v8i16.
 ; 64-bit integer multiply on <8 x i8>. Unlike the other cases this is not
 ; expected to become one instruction: the assertions below zero-extend the
 ; bytes of each operand into 16-bit lanes (pmovzxbw), multiply with pmullw,
 ; and then pick the even-numbered bytes of the product with pshufb.
 define double @test3_mul(double %A, double %B) {
 ; SSE41-LABEL: test3_mul:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    pmovzxbw {{.*#+}} xmm2 = xmm0[0],zero,xmm0[1],zero,xmm0[2],zero,xmm0[3],zero,xmm0[4],zero,xmm0[5],zero,xmm0[6],zero,xmm0[7],zero
 ; SSE41-NEXT:    pmovzxbw {{.*#+}} xmm0 = xmm1[0],zero,xmm1[1],zero,xmm1[2],zero,xmm1[3],zero,xmm1[4],zero,xmm1[5],zero,xmm1[6],zero,xmm1[7],zero
 ; SSE41-NEXT:    pmullw %xmm2, %xmm0
 ; SSE41-NEXT:    pshufb {{.*#+}} xmm0 = xmm0[0,2,4,6,8,10,12,14,u,u,u,u,u,u,u,u]
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <8 x i8>
   %rhs = bitcast double %B to <8 x i8>
   %prod = mul <8 x i8> %lhs, %rhs
   %res = bitcast <8 x i8> %prod to double
   ret double %res
 }

 ; 64-bit bitwise AND: both doubles are reinterpreted as <2 x i32>, ANDed,
 ; and the result is reinterpreted as double. Expected lowering is a single
 ; andps.
 define double @test1_and(double %A, double %B) {
 ; SSE41-LABEL: test1_and:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    andps %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <2 x i32>
   %rhs = bitcast double %B to <2 x i32>
   %both = and <2 x i32> %lhs, %rhs
   %res = bitcast <2 x i32> %both to double
   ret double %res
 }

 ; 64-bit bitwise AND: both doubles are reinterpreted as <4 x i16>, ANDed,
 ; and the result is reinterpreted as double. Expected lowering is a single
 ; andps.
 define double @test2_and(double %A, double %B) {
 ; SSE41-LABEL: test2_and:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    andps %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <4 x i16>
   %rhs = bitcast double %B to <4 x i16>
   %both = and <4 x i16> %lhs, %rhs
   %res = bitcast <4 x i16> %both to double
   ret double %res
 }

 ; 64-bit bitwise AND: both doubles are reinterpreted as <8 x i8>, ANDed,
 ; and the result is reinterpreted as double. Expected lowering is a single
 ; andps.
 define double @test3_and(double %A, double %B) {
 ; SSE41-LABEL: test3_and:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    andps %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <8 x i8>
   %rhs = bitcast double %B to <8 x i8>
   %both = and <8 x i8> %lhs, %rhs
   %res = bitcast <8 x i8> %both to double
   ret double %res
 }

 ; 64-bit bitwise OR: both doubles are reinterpreted as <2 x i32>, ORed, and
 ; the result is reinterpreted as double. Expected lowering is a single orps.
 define double @test1_or(double %A, double %B) {
 ; SSE41-LABEL: test1_or:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    orps %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <2 x i32>
   %rhs = bitcast double %B to <2 x i32>
   %either = or <2 x i32> %lhs, %rhs
   %res = bitcast <2 x i32> %either to double
   ret double %res
 }

 ; 64-bit bitwise OR: both doubles are reinterpreted as <4 x i16>, ORed, and
 ; the result is reinterpreted as double. Expected lowering is a single orps.
 define double @test2_or(double %A, double %B) {
 ; SSE41-LABEL: test2_or:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    orps %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <4 x i16>
   %rhs = bitcast double %B to <4 x i16>
   %either = or <4 x i16> %lhs, %rhs
   %res = bitcast <4 x i16> %either to double
   ret double %res
 }

 ; 64-bit bitwise OR: both doubles are reinterpreted as <8 x i8>, ORed, and
 ; the result is reinterpreted as double. Expected lowering is a single orps.
 define double @test3_or(double %A, double %B) {
 ; SSE41-LABEL: test3_or:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    orps %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <8 x i8>
   %rhs = bitcast double %B to <8 x i8>
   %either = or <8 x i8> %lhs, %rhs
   %res = bitcast <8 x i8> %either to double
   ret double %res
 }

 ; 64-bit bitwise XOR: both doubles are reinterpreted as <2 x i32>, XORed,
 ; and the result is reinterpreted as double. Expected lowering is a single
 ; xorps.
 define double @test1_xor(double %A, double %B) {
 ; SSE41-LABEL: test1_xor:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    xorps %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <2 x i32>
   %rhs = bitcast double %B to <2 x i32>
   %flip = xor <2 x i32> %lhs, %rhs
   %res = bitcast <2 x i32> %flip to double
   ret double %res
 }

 ; 64-bit bitwise XOR: both doubles are reinterpreted as <4 x i16>, XORed,
 ; and the result is reinterpreted as double. Expected lowering is a single
 ; xorps.
 define double @test2_xor(double %A, double %B) {
 ; SSE41-LABEL: test2_xor:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    xorps %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <4 x i16>
   %rhs = bitcast double %B to <4 x i16>
   %flip = xor <4 x i16> %lhs, %rhs
   %res = bitcast <4 x i16> %flip to double
   ret double %res
 }

 ; 64-bit bitwise XOR: both doubles are reinterpreted as <8 x i8>, XORed,
 ; and the result is reinterpreted as double. Expected lowering is a single
 ; xorps.
 define double @test3_xor(double %A, double %B) {
 ; SSE41-LABEL: test3_xor:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    xorps %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <8 x i8>
   %rhs = bitcast double %B to <8 x i8>
   %flip = xor <8 x i8> %lhs, %rhs
   %res = bitcast <8 x i8> %flip to double
   ret double %res
 }

 ; 64-bit floating-point add: both doubles are reinterpreted as <2 x float>,
 ; added lane-wise, and the sum is reinterpreted as double. Expected lowering
 ; is a single addps.
 define double @test_fadd(double %A, double %B) {
 ; SSE41-LABEL: test_fadd:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    addps %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <2 x float>
   %rhs = bitcast double %B to <2 x float>
   %fsum = fadd <2 x float> %lhs, %rhs
   %res = bitcast <2 x float> %fsum to double
   ret double %res
 }

 ; 64-bit floating-point subtract: both doubles are reinterpreted as
 ; <2 x float>, %B's lanes are subtracted from %A's, and the difference is
 ; reinterpreted as double. Expected lowering is a single subps.
 define double @test_fsub(double %A, double %B) {
 ; SSE41-LABEL: test_fsub:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    subps %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <2 x float>
   %rhs = bitcast double %B to <2 x float>
   %fdiff = fsub <2 x float> %lhs, %rhs
   %res = bitcast <2 x float> %fdiff to double
   ret double %res
 }

 ; 64-bit floating-point multiply: both doubles are reinterpreted as
 ; <2 x float>, multiplied lane-wise, and the product is reinterpreted as
 ; double. Expected lowering is a single mulps.
 define double @test_fmul(double %A, double %B) {
 ; SSE41-LABEL: test_fmul:
 ; SSE41:       # %bb.0:
 ; SSE41-NEXT:    mulps %xmm1, %xmm0
 ; SSE41-NEXT:    retq
   %lhs = bitcast double %A to <2 x float>
   %rhs = bitcast double %B to <2 x float>
   %fprod = fmul <2 x float> %lhs, %rhs
   %res = bitcast <2 x float> %fprod to double
   ret double %res
 }
	; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
	; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=sse4.1 | FileCheck %s --check-prefix=SSE41

	; Adds the two arguments as <2 x i32> vectors (via bitcast in and out of
	; double); the assertions expect one paddd.
	define double @test1_add(double %A, double %B) {
	; SSE41-LABEL: test1_add:
	; SSE41: # %bb.0:
	; SSE41-NEXT: paddd %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <2 x i32>
	  %vb = bitcast double %B to <2 x i32>
	  %vsum = add <2 x i32> %va, %vb
	  %out = bitcast <2 x i32> %vsum to double
	  ret double %out
	}

	; Adds the two arguments as <4 x i16> vectors (via bitcast in and out of
	; double); the assertions expect one paddw.
	define double @test2_add(double %A, double %B) {
	; SSE41-LABEL: test2_add:
	; SSE41: # %bb.0:
	; SSE41-NEXT: paddw %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <4 x i16>
	  %vb = bitcast double %B to <4 x i16>
	  %vsum = add <4 x i16> %va, %vb
	  %out = bitcast <4 x i16> %vsum to double
	  ret double %out
	}

	; Adds the two arguments as <8 x i8> vectors (via bitcast in and out of
	; double); the assertions expect one paddb.
	define double @test3_add(double %A, double %B) {
	; SSE41-LABEL: test3_add:
	; SSE41: # %bb.0:
	; SSE41-NEXT: paddb %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <8 x i8>
	  %vb = bitcast double %B to <8 x i8>
	  %vsum = add <8 x i8> %va, %vb
	  %out = bitcast <8 x i8> %vsum to double
	  ret double %out
	}

	; Subtracts %B from %A as <2 x i32> vectors (via bitcast in and out of
	; double); the assertions expect one psubd.
	define double @test1_sub(double %A, double %B) {
	; SSE41-LABEL: test1_sub:
	; SSE41: # %bb.0:
	; SSE41-NEXT: psubd %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <2 x i32>
	  %vb = bitcast double %B to <2 x i32>
	  %vdiff = sub <2 x i32> %va, %vb
	  %out = bitcast <2 x i32> %vdiff to double
	  ret double %out
	}

	; Subtracts %B from %A as <4 x i16> vectors (via bitcast in and out of
	; double); the assertions expect one psubw.
	define double @test2_sub(double %A, double %B) {
	; SSE41-LABEL: test2_sub:
	; SSE41: # %bb.0:
	; SSE41-NEXT: psubw %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <4 x i16>
	  %vb = bitcast double %B to <4 x i16>
	  %vdiff = sub <4 x i16> %va, %vb
	  %out = bitcast <4 x i16> %vdiff to double
	  ret double %out
	}

	; Subtracts %B from %A as <8 x i8> vectors (via bitcast in and out of
	; double); the assertions expect one psubb.
	define double @test3_sub(double %A, double %B) {
	; SSE41-LABEL: test3_sub:
	; SSE41: # %bb.0:
	; SSE41-NEXT: psubb %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <8 x i8>
	  %vb = bitcast double %B to <8 x i8>
	  %vdiff = sub <8 x i8> %va, %vb
	  %out = bitcast <8 x i8> %vdiff to double
	  ret double %out
	}

	; Multiplies the two arguments as <2 x i32> vectors (via bitcast in and out
	; of double); the assertions expect one pmulld.
	define double @test1_mul(double %A, double %B) {
	; SSE41-LABEL: test1_mul:
	; SSE41: # %bb.0:
	; SSE41-NEXT: pmulld %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <2 x i32>
	  %vb = bitcast double %B to <2 x i32>
	  %vprod = mul <2 x i32> %va, %vb
	  %out = bitcast <2 x i32> %vprod to double
	  ret double %out
	}

	; Multiplies the two arguments as <4 x i16> vectors (via bitcast in and out
	; of double); the assertions expect one pmullw.
	define double @test2_mul(double %A, double %B) {
	; SSE41-LABEL: test2_mul:
	; SSE41: # %bb.0:
	; SSE41-NEXT: pmullw %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <4 x i16>
	  %vb = bitcast double %B to <4 x i16>
	  %vprod = mul <4 x i16> %va, %vb
	  %out = bitcast <4 x i16> %vprod to double
	  ret double %out
	}

	; There is no legal ISD::MUL with type MVT::v8i16.
	; Multiplies the two arguments as <8 x i8> vectors (via bitcast in and out
	; of double). The assertions expect a multi-instruction sequence: pmovzxbw
	; on each operand to widen bytes into 16-bit lanes, pmullw, then pshufb to
	; select the even-numbered bytes of the product.
	define double @test3_mul(double %A, double %B) {
	; SSE41-LABEL: test3_mul:
	; SSE41: # %bb.0:
	; SSE41-NEXT: pmovzxbw {{.*#+}} xmm2 = xmm0[0],zero,xmm0[1],zero,xmm0[2],zero,xmm0[3],zero,xmm0[4],zero,xmm0[5],zero,xmm0[6],zero,xmm0[7],zero
	; SSE41-NEXT: pmovzxbw {{.*#+}} xmm0 = xmm1[0],zero,xmm1[1],zero,xmm1[2],zero,xmm1[3],zero,xmm1[4],zero,xmm1[5],zero,xmm1[6],zero,xmm1[7],zero
	; SSE41-NEXT: pmullw %xmm2, %xmm0
	; SSE41-NEXT: pshufb {{.*#+}} xmm0 = xmm0[0,2,4,6,8,10,12,14,u,u,u,u,u,u,u,u]
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <8 x i8>
	  %vb = bitcast double %B to <8 x i8>
	  %vprod = mul <8 x i8> %va, %vb
	  %out = bitcast <8 x i8> %vprod to double
	  ret double %out
	}

	; ANDs the two arguments as <2 x i32> vectors (via bitcast in and out of
	; double); the assertions expect one andps.
	define double @test1_and(double %A, double %B) {
	; SSE41-LABEL: test1_and:
	; SSE41: # %bb.0:
	; SSE41-NEXT: andps %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <2 x i32>
	  %vb = bitcast double %B to <2 x i32>
	  %vand = and <2 x i32> %va, %vb
	  %out = bitcast <2 x i32> %vand to double
	  ret double %out
	}

	; ANDs the two arguments as <4 x i16> vectors (via bitcast in and out of
	; double); the assertions expect one andps.
	define double @test2_and(double %A, double %B) {
	; SSE41-LABEL: test2_and:
	; SSE41: # %bb.0:
	; SSE41-NEXT: andps %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <4 x i16>
	  %vb = bitcast double %B to <4 x i16>
	  %vand = and <4 x i16> %va, %vb
	  %out = bitcast <4 x i16> %vand to double
	  ret double %out
	}

	; ANDs the two arguments as <8 x i8> vectors (via bitcast in and out of
	; double); the assertions expect one andps.
	define double @test3_and(double %A, double %B) {
	; SSE41-LABEL: test3_and:
	; SSE41: # %bb.0:
	; SSE41-NEXT: andps %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <8 x i8>
	  %vb = bitcast double %B to <8 x i8>
	  %vand = and <8 x i8> %va, %vb
	  %out = bitcast <8 x i8> %vand to double
	  ret double %out
	}

	; ORs the two arguments as <2 x i32> vectors (via bitcast in and out of
	; double); the assertions expect one orps.
	define double @test1_or(double %A, double %B) {
	; SSE41-LABEL: test1_or:
	; SSE41: # %bb.0:
	; SSE41-NEXT: orps %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <2 x i32>
	  %vb = bitcast double %B to <2 x i32>
	  %vor = or <2 x i32> %va, %vb
	  %out = bitcast <2 x i32> %vor to double
	  ret double %out
	}

	; ORs the two arguments as <4 x i16> vectors (via bitcast in and out of
	; double); the assertions expect one orps.
	define double @test2_or(double %A, double %B) {
	; SSE41-LABEL: test2_or:
	; SSE41: # %bb.0:
	; SSE41-NEXT: orps %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <4 x i16>
	  %vb = bitcast double %B to <4 x i16>
	  %vor = or <4 x i16> %va, %vb
	  %out = bitcast <4 x i16> %vor to double
	  ret double %out
	}

	; ORs the two arguments as <8 x i8> vectors (via bitcast in and out of
	; double); the assertions expect one orps.
	define double @test3_or(double %A, double %B) {
	; SSE41-LABEL: test3_or:
	; SSE41: # %bb.0:
	; SSE41-NEXT: orps %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <8 x i8>
	  %vb = bitcast double %B to <8 x i8>
	  %vor = or <8 x i8> %va, %vb
	  %out = bitcast <8 x i8> %vor to double
	  ret double %out
	}

	; XORs the two arguments as <2 x i32> vectors (via bitcast in and out of
	; double); the assertions expect one xorps.
	define double @test1_xor(double %A, double %B) {
	; SSE41-LABEL: test1_xor:
	; SSE41: # %bb.0:
	; SSE41-NEXT: xorps %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <2 x i32>
	  %vb = bitcast double %B to <2 x i32>
	  %vxor = xor <2 x i32> %va, %vb
	  %out = bitcast <2 x i32> %vxor to double
	  ret double %out
	}

	; XORs the two arguments as <4 x i16> vectors (via bitcast in and out of
	; double); the assertions expect one xorps.
	define double @test2_xor(double %A, double %B) {
	; SSE41-LABEL: test2_xor:
	; SSE41: # %bb.0:
	; SSE41-NEXT: xorps %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <4 x i16>
	  %vb = bitcast double %B to <4 x i16>
	  %vxor = xor <4 x i16> %va, %vb
	  %out = bitcast <4 x i16> %vxor to double
	  ret double %out
	}

	; XORs the two arguments as <8 x i8> vectors (via bitcast in and out of
	; double); the assertions expect one xorps.
	define double @test3_xor(double %A, double %B) {
	; SSE41-LABEL: test3_xor:
	; SSE41: # %bb.0:
	; SSE41-NEXT: xorps %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <8 x i8>
	  %vb = bitcast double %B to <8 x i8>
	  %vxor = xor <8 x i8> %va, %vb
	  %out = bitcast <8 x i8> %vxor to double
	  ret double %out
	}

	; Floating-point add of the two arguments as <2 x float> vectors (via
	; bitcast in and out of double); the assertions expect one addps.
	define double @test_fadd(double %A, double %B) {
	; SSE41-LABEL: test_fadd:
	; SSE41: # %bb.0:
	; SSE41-NEXT: addps %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <2 x float>
	  %vb = bitcast double %B to <2 x float>
	  %vsum = fadd <2 x float> %va, %vb
	  %out = bitcast <2 x float> %vsum to double
	  ret double %out
	}

	; Floating-point subtract of %B from %A as <2 x float> vectors (via bitcast
	; in and out of double); the assertions expect one subps.
	define double @test_fsub(double %A, double %B) {
	; SSE41-LABEL: test_fsub:
	; SSE41: # %bb.0:
	; SSE41-NEXT: subps %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <2 x float>
	  %vb = bitcast double %B to <2 x float>
	  %vdiff = fsub <2 x float> %va, %vb
	  %out = bitcast <2 x float> %vdiff to double
	  ret double %out
	}

	; Floating-point multiply of the two arguments as <2 x float> vectors (via
	; bitcast in and out of double); the assertions expect one mulps.
	define double @test_fmul(double %A, double %B) {
	; SSE41-LABEL: test_fmul:
	; SSE41: # %bb.0:
	; SSE41-NEXT: mulps %xmm1, %xmm0
	; SSE41-NEXT: retq
	  %va = bitcast double %A to <2 x float>
	  %vb = bitcast double %B to <2 x float>
	  %vprod = fmul <2 x float> %va, %vb
	  %out = bitcast <2 x float> %vprod to double
	  ret double %out
	}