| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py |
| ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mcpu=skx | FileCheck %s --check-prefix=CHECK --check-prefix=VLX |
| ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mcpu=knl | FileCheck %s --check-prefix=CHECK --check-prefix=NoVLX |
| |
| define <4 x i64> @test256_1(<4 x i64> %x, <4 x i64> %y) nounwind { |
| ; VLX-LABEL: test256_1: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpeqq %ymm1, %ymm0, %k1 |
| ; VLX-NEXT: vpblendmq %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_1: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpeqq %zmm1, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmq %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask = icmp eq <4 x i64> %x, %y |
| %max = select <4 x i1> %mask, <4 x i64> %x, <4 x i64> %y |
| ret <4 x i64> %max |
| } |
| |
| define <4 x i64> @test256_2(<4 x i64> %x, <4 x i64> %y, <4 x i64> %x1) nounwind { |
| ; VLX-LABEL: test256_2: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpgtq %ymm1, %ymm0, %k1 |
| ; VLX-NEXT: vpblendmq %ymm2, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_2: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm2 killed $ymm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpgtq %zmm1, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmq %zmm2, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask = icmp sgt <4 x i64> %x, %y |
| %max = select <4 x i1> %mask, <4 x i64> %x1, <4 x i64> %y |
| ret <4 x i64> %max |
| } |
| |
| define <8 x i32> @test256_3(<8 x i32> %x, <8 x i32> %y, <8 x i32> %x1) nounwind { |
| ; VLX-LABEL: test256_3: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpnltd %ymm1, %ymm0, %k1 |
| ; VLX-NEXT: vpblendmd %ymm2, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_3: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm2 killed $ymm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpnltd %zmm1, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm2, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask = icmp sge <8 x i32> %x, %y |
| %max = select <8 x i1> %mask, <8 x i32> %x1, <8 x i32> %y |
| ret <8 x i32> %max |
| } |
| |
| define <4 x i64> @test256_4(<4 x i64> %x, <4 x i64> %y, <4 x i64> %x1) nounwind { |
| ; VLX-LABEL: test256_4: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpnleuq %ymm1, %ymm0, %k1 |
| ; VLX-NEXT: vpblendmq %ymm2, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_4: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm2 killed $ymm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpnleuq %zmm1, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmq %zmm2, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask = icmp ugt <4 x i64> %x, %y |
| %max = select <4 x i1> %mask, <4 x i64> %x1, <4 x i64> %y |
| ret <4 x i64> %max |
| } |
| |
| define <8 x i32> @test256_5(<8 x i32> %x, <8 x i32> %x1, <8 x i32>* %yp) nounwind { |
| ; VLX-LABEL: test256_5: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpeqd (%rdi), %ymm0, %k1 |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_5: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpeqd %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <8 x i32>, <8 x i32>* %yp, align 4 |
| %mask = icmp eq <8 x i32> %x, %y |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %x1 |
| ret <8 x i32> %max |
| } |
| |
| define <8 x i32> @test256_5b(<8 x i32> %x, <8 x i32> %x1, <8 x i32>* %yp) nounwind { |
| ; VLX-LABEL: test256_5b: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpeqd (%rdi), %ymm0, %k1 |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_5b: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpeqd %zmm0, %zmm2, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <8 x i32>, <8 x i32>* %yp, align 4 |
| %mask = icmp eq <8 x i32> %y, %x |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %x1 |
| ret <8 x i32> %max |
| } |
| |
| define <8 x i32> @test256_6(<8 x i32> %x, <8 x i32> %x1, <8 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test256_6: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpgtd (%rdi), %ymm0, %k1 |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_6: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpgtd %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <8 x i32>, <8 x i32>* %y.ptr, align 4 |
| %mask = icmp sgt <8 x i32> %x, %y |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %x1 |
| ret <8 x i32> %max |
| } |
| |
| define <8 x i32> @test256_6b(<8 x i32> %x, <8 x i32> %x1, <8 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test256_6b: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpgtd (%rdi), %ymm0, %k1 |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_6b: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpgtd %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <8 x i32>, <8 x i32>* %y.ptr, align 4 |
| %mask = icmp slt <8 x i32> %y, %x |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %x1 |
| ret <8 x i32> %max |
| } |
| |
| define <8 x i32> @test256_7(<8 x i32> %x, <8 x i32> %x1, <8 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test256_7: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpled (%rdi), %ymm0, %k1 |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_7: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpled %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <8 x i32>, <8 x i32>* %y.ptr, align 4 |
| %mask = icmp sle <8 x i32> %x, %y |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %x1 |
| ret <8 x i32> %max |
| } |
| |
| define <8 x i32> @test256_7b(<8 x i32> %x, <8 x i32> %x1, <8 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test256_7b: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpled (%rdi), %ymm0, %k1 |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_7b: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpnltd %zmm0, %zmm2, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <8 x i32>, <8 x i32>* %y.ptr, align 4 |
| %mask = icmp sge <8 x i32> %y, %x |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %x1 |
| ret <8 x i32> %max |
| } |
| |
| define <8 x i32> @test256_8(<8 x i32> %x, <8 x i32> %x1, <8 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test256_8: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpleud (%rdi), %ymm0, %k1 |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_8: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpleud %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <8 x i32>, <8 x i32>* %y.ptr, align 4 |
| %mask = icmp ule <8 x i32> %x, %y |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %x1 |
| ret <8 x i32> %max |
| } |
| |
| define <8 x i32> @test256_8b(<8 x i32> %x, <8 x i32> %x1, <8 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test256_8b: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpleud (%rdi), %ymm0, %k1 |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_8b: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpnltud %zmm0, %zmm2, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <8 x i32>, <8 x i32>* %y.ptr, align 4 |
| %mask = icmp uge <8 x i32> %y, %x |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %x1 |
| ret <8 x i32> %max |
| } |
| |
| define <8 x i32> @test256_9(<8 x i32> %x, <8 x i32> %y, <8 x i32> %x1, <8 x i32> %y1) nounwind { |
| ; VLX-LABEL: test256_9: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpeqd %ymm1, %ymm0, %k1 |
| ; VLX-NEXT: vpcmpeqd %ymm3, %ymm2, %k1 {%k1} |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_9: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm3 killed $ymm3 def $zmm3 |
| ; NoVLX-NEXT: # kill: def $ymm2 killed $ymm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpeqd %zmm1, %zmm0, %k1 |
| ; NoVLX-NEXT: vpcmpeqd %zmm3, %zmm2, %k1 {%k1} |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask1 = icmp eq <8 x i32> %x1, %y1 |
| %mask0 = icmp eq <8 x i32> %x, %y |
| %mask = select <8 x i1> %mask0, <8 x i1> %mask1, <8 x i1> zeroinitializer |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %y |
| ret <8 x i32> %max |
| } |
| |
| define <4 x i64> @test256_10(<4 x i64> %x, <4 x i64> %y, <4 x i64> %x1, <4 x i64> %y1) nounwind { |
| ; VLX-LABEL: test256_10: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpleq %ymm1, %ymm0, %k1 |
| ; VLX-NEXT: vpcmpnltq %ymm3, %ymm2, %k1 {%k1} |
| ; VLX-NEXT: vpblendmq %ymm0, %ymm2, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_10: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm3 killed $ymm3 def $zmm3 |
| ; NoVLX-NEXT: # kill: def $ymm2 killed $ymm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpleq %zmm1, %zmm0, %k1 |
| ; NoVLX-NEXT: vpcmpnltq %zmm3, %zmm2, %k1 {%k1} |
| ; NoVLX-NEXT: vpblendmq %zmm0, %zmm2, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask1 = icmp sge <4 x i64> %x1, %y1 |
| %mask0 = icmp sle <4 x i64> %x, %y |
| %mask = select <4 x i1> %mask0, <4 x i1> %mask1, <4 x i1> zeroinitializer |
| %max = select <4 x i1> %mask, <4 x i64> %x, <4 x i64> %x1 |
| ret <4 x i64> %max |
| } |
| |
| define <4 x i64> @test256_11(<4 x i64> %x, <4 x i64>* %y.ptr, <4 x i64> %x1, <4 x i64> %y1) nounwind { |
| ; VLX-LABEL: test256_11: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpgtq %ymm2, %ymm1, %k1 |
| ; VLX-NEXT: vpcmpgtq (%rdi), %ymm0, %k1 {%k1} |
| ; VLX-NEXT: vpblendmq %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_11: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm2 killed $ymm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %ymm3 |
| ; NoVLX-NEXT: vpcmpgtq %zmm3, %zmm0, %k1 |
| ; NoVLX-NEXT: vpcmpgtq %zmm2, %zmm1, %k1 {%k1} |
| ; NoVLX-NEXT: vpblendmq %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask1 = icmp sgt <4 x i64> %x1, %y1 |
| %y = load <4 x i64>, <4 x i64>* %y.ptr, align 4 |
| %mask0 = icmp sgt <4 x i64> %x, %y |
| %mask = select <4 x i1> %mask0, <4 x i1> %mask1, <4 x i1> zeroinitializer |
| %max = select <4 x i1> %mask, <4 x i64> %x, <4 x i64> %x1 |
| ret <4 x i64> %max |
| } |
| |
| define <8 x i32> @test256_12(<8 x i32> %x, <8 x i32>* %y.ptr, <8 x i32> %x1, <8 x i32> %y1) nounwind { |
| ; VLX-LABEL: test256_12: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpnltd %ymm2, %ymm1, %k1 |
| ; VLX-NEXT: vpcmpleud (%rdi), %ymm0, %k1 {%k1} |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_12: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm2 killed $ymm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %ymm3 |
| ; NoVLX-NEXT: vpcmpleud %zmm3, %zmm0, %k1 |
| ; NoVLX-NEXT: vpcmpnltd %zmm2, %zmm1, %k1 {%k1} |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask1 = icmp sge <8 x i32> %x1, %y1 |
| %y = load <8 x i32>, <8 x i32>* %y.ptr, align 4 |
| %mask0 = icmp ule <8 x i32> %x, %y |
| %mask = select <8 x i1> %mask0, <8 x i1> %mask1, <8 x i1> zeroinitializer |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %x1 |
| ret <8 x i32> %max |
| } |
| |
| define <4 x i64> @test256_13(<4 x i64> %x, <4 x i64> %x1, i64* %yb.ptr) nounwind { |
| ; VLX-LABEL: test256_13: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpeqq (%rdi){1to4}, %ymm0, %k1 |
| ; VLX-NEXT: vpblendmq %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_13: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vpbroadcastq (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpeqq %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmq %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %yb = load i64, i64* %yb.ptr, align 4 |
| %y.0 = insertelement <4 x i64> undef, i64 %yb, i32 0 |
| %y = shufflevector <4 x i64> %y.0, <4 x i64> undef, <4 x i32> zeroinitializer |
| %mask = icmp eq <4 x i64> %x, %y |
| %max = select <4 x i1> %mask, <4 x i64> %x, <4 x i64> %x1 |
| ret <4 x i64> %max |
| } |
| |
| define <8 x i32> @test256_14(<8 x i32> %x, i32* %yb.ptr, <8 x i32> %x1) nounwind { |
| ; VLX-LABEL: test256_14: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpled (%rdi){1to8}, %ymm0, %k1 |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_14: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vpbroadcastd (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpled %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %yb = load i32, i32* %yb.ptr, align 4 |
| %y.0 = insertelement <8 x i32> undef, i32 %yb, i32 0 |
| %y = shufflevector <8 x i32> %y.0, <8 x i32> undef, <8 x i32> zeroinitializer |
| %mask = icmp sle <8 x i32> %x, %y |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %x1 |
| ret <8 x i32> %max |
| } |
| |
| define <8 x i32> @test256_15(<8 x i32> %x, i32* %yb.ptr, <8 x i32> %x1, <8 x i32> %y1) nounwind { |
| ; VLX-LABEL: test256_15: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpnltd %ymm2, %ymm1, %k1 |
| ; VLX-NEXT: vpcmpgtd (%rdi){1to8}, %ymm0, %k1 {%k1} |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_15: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm2 killed $ymm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpnltd %zmm2, %zmm1, %k1 |
| ; NoVLX-NEXT: vpbroadcastd (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpgtd %zmm2, %zmm0, %k1 {%k1} |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask1 = icmp sge <8 x i32> %x1, %y1 |
| %yb = load i32, i32* %yb.ptr, align 4 |
| %y.0 = insertelement <8 x i32> undef, i32 %yb, i32 0 |
| %y = shufflevector <8 x i32> %y.0, <8 x i32> undef, <8 x i32> zeroinitializer |
| %mask0 = icmp sgt <8 x i32> %x, %y |
| %mask = select <8 x i1> %mask0, <8 x i1> %mask1, <8 x i1> zeroinitializer |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %x1 |
| ret <8 x i32> %max |
| } |
| |
| define <4 x i64> @test256_16(<4 x i64> %x, i64* %yb.ptr, <4 x i64> %x1, <4 x i64> %y1) nounwind { |
| ; VLX-LABEL: test256_16: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpnltq %ymm2, %ymm1, %k1 |
| ; VLX-NEXT: vpcmpgtq (%rdi){1to4}, %ymm0, %k1 {%k1} |
| ; VLX-NEXT: vpblendmq %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_16: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm2 killed $ymm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpnltq %zmm2, %zmm1, %k1 |
| ; NoVLX-NEXT: vpbroadcastq (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpgtq %zmm2, %zmm0, %k1 {%k1} |
| ; NoVLX-NEXT: vpblendmq %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask1 = icmp sge <4 x i64> %x1, %y1 |
| %yb = load i64, i64* %yb.ptr, align 4 |
| %y.0 = insertelement <4 x i64> undef, i64 %yb, i32 0 |
| %y = shufflevector <4 x i64> %y.0, <4 x i64> undef, <4 x i32> zeroinitializer |
| %mask0 = icmp sgt <4 x i64> %x, %y |
| %mask = select <4 x i1> %mask0, <4 x i1> %mask1, <4 x i1> zeroinitializer |
| %max = select <4 x i1> %mask, <4 x i64> %x, <4 x i64> %x1 |
| ret <4 x i64> %max |
| } |
| |
| define <8 x i32> @test256_17(<8 x i32> %x, <8 x i32> %x1, <8 x i32>* %yp) nounwind { |
| ; VLX-LABEL: test256_17: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpneqd (%rdi), %ymm0, %k1 |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_17: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpneqd %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <8 x i32>, <8 x i32>* %yp, align 4 |
| %mask = icmp ne <8 x i32> %x, %y |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %x1 |
| ret <8 x i32> %max |
| } |
| |
| define <8 x i32> @test256_18(<8 x i32> %x, <8 x i32> %x1, <8 x i32>* %yp) nounwind { |
| ; VLX-LABEL: test256_18: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpneqd (%rdi), %ymm0, %k1 |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_18: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpneqd %zmm0, %zmm2, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <8 x i32>, <8 x i32>* %yp, align 4 |
| %mask = icmp ne <8 x i32> %y, %x |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %x1 |
| ret <8 x i32> %max |
| } |
| |
| define <8 x i32> @test256_19(<8 x i32> %x, <8 x i32> %x1, <8 x i32>* %yp) nounwind { |
| ; VLX-LABEL: test256_19: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpnltud (%rdi), %ymm0, %k1 |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_19: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpnltud %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <8 x i32>, <8 x i32>* %yp, align 4 |
| %mask = icmp uge <8 x i32> %x, %y |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %x1 |
| ret <8 x i32> %max |
| } |
| |
| define <8 x i32> @test256_20(<8 x i32> %x, <8 x i32> %x1, <8 x i32>* %yp) nounwind { |
| ; VLX-LABEL: test256_20: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpleud (%rdi), %ymm0, %k1 |
| ; VLX-NEXT: vpblendmd %ymm0, %ymm1, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test256_20: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm1 killed $ymm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %ymm2 |
| ; NoVLX-NEXT: vpcmpnltud %zmm0, %zmm2, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <8 x i32>, <8 x i32>* %yp, align 4 |
| %mask = icmp uge <8 x i32> %y, %x |
| %max = select <8 x i1> %mask, <8 x i32> %x, <8 x i32> %x1 |
| ret <8 x i32> %max |
| } |
| |
| define <2 x i64> @test128_1(<2 x i64> %x, <2 x i64> %y) nounwind { |
| ; VLX-LABEL: test128_1: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpeqq %xmm1, %xmm0, %k1 |
| ; VLX-NEXT: vpblendmq %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_1: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpeqq %zmm1, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmq %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask = icmp eq <2 x i64> %x, %y |
| %max = select <2 x i1> %mask, <2 x i64> %x, <2 x i64> %y |
| ret <2 x i64> %max |
| } |
| |
| define <2 x i64> @test128_2(<2 x i64> %x, <2 x i64> %y, <2 x i64> %x1) nounwind { |
| ; VLX-LABEL: test128_2: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpgtq %xmm1, %xmm0, %k1 |
| ; VLX-NEXT: vpblendmq %xmm2, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_2: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm2 killed $xmm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpgtq %zmm1, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmq %zmm2, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask = icmp sgt <2 x i64> %x, %y |
| %max = select <2 x i1> %mask, <2 x i64> %x1, <2 x i64> %y |
| ret <2 x i64> %max |
| } |
| |
| define <4 x i32> @test128_3(<4 x i32> %x, <4 x i32> %y, <4 x i32> %x1) nounwind { |
| ; VLX-LABEL: test128_3: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpnltd %xmm1, %xmm0, %k1 |
| ; VLX-NEXT: vpblendmd %xmm2, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_3: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm2 killed $xmm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpnltd %zmm1, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm2, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask = icmp sge <4 x i32> %x, %y |
| %max = select <4 x i1> %mask, <4 x i32> %x1, <4 x i32> %y |
| ret <4 x i32> %max |
| } |
| |
| define <2 x i64> @test128_4(<2 x i64> %x, <2 x i64> %y, <2 x i64> %x1) nounwind { |
| ; VLX-LABEL: test128_4: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpnleuq %xmm1, %xmm0, %k1 |
| ; VLX-NEXT: vpblendmq %xmm2, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_4: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm2 killed $xmm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpnleuq %zmm1, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmq %zmm2, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask = icmp ugt <2 x i64> %x, %y |
| %max = select <2 x i1> %mask, <2 x i64> %x1, <2 x i64> %y |
| ret <2 x i64> %max |
| } |
| |
| define <4 x i32> @test128_5(<4 x i32> %x, <4 x i32> %x1, <4 x i32>* %yp) nounwind { |
| ; VLX-LABEL: test128_5: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpeqd (%rdi), %xmm0, %k1 |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_5: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpeqd %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <4 x i32>, <4 x i32>* %yp, align 4 |
| %mask = icmp eq <4 x i32> %x, %y |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %x1 |
| ret <4 x i32> %max |
| } |
| |
| define <4 x i32> @test128_5b(<4 x i32> %x, <4 x i32> %x1, <4 x i32>* %yp) nounwind { |
| ; VLX-LABEL: test128_5b: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpeqd (%rdi), %xmm0, %k1 |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_5b: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpeqd %zmm0, %zmm2, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <4 x i32>, <4 x i32>* %yp, align 4 |
| %mask = icmp eq <4 x i32> %y, %x |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %x1 |
| ret <4 x i32> %max |
| } |
| |
| define <4 x i32> @test128_6(<4 x i32> %x, <4 x i32> %x1, <4 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test128_6: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpgtd (%rdi), %xmm0, %k1 |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_6: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpgtd %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <4 x i32>, <4 x i32>* %y.ptr, align 4 |
| %mask = icmp sgt <4 x i32> %x, %y |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %x1 |
| ret <4 x i32> %max |
| } |
| |
| define <4 x i32> @test128_6b(<4 x i32> %x, <4 x i32> %x1, <4 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test128_6b: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpgtd (%rdi), %xmm0, %k1 |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_6b: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpgtd %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <4 x i32>, <4 x i32>* %y.ptr, align 4 |
| %mask = icmp slt <4 x i32> %y, %x |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %x1 |
| ret <4 x i32> %max |
| } |
| |
| define <4 x i32> @test128_7(<4 x i32> %x, <4 x i32> %x1, <4 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test128_7: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpled (%rdi), %xmm0, %k1 |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_7: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpled %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <4 x i32>, <4 x i32>* %y.ptr, align 4 |
| %mask = icmp sle <4 x i32> %x, %y |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %x1 |
| ret <4 x i32> %max |
| } |
| |
| define <4 x i32> @test128_7b(<4 x i32> %x, <4 x i32> %x1, <4 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test128_7b: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpled (%rdi), %xmm0, %k1 |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_7b: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpnltd %zmm0, %zmm2, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <4 x i32>, <4 x i32>* %y.ptr, align 4 |
| %mask = icmp sge <4 x i32> %y, %x |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %x1 |
| ret <4 x i32> %max |
| } |
| |
| define <4 x i32> @test128_8(<4 x i32> %x, <4 x i32> %x1, <4 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test128_8: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpleud (%rdi), %xmm0, %k1 |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_8: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpleud %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <4 x i32>, <4 x i32>* %y.ptr, align 4 |
| %mask = icmp ule <4 x i32> %x, %y |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %x1 |
| ret <4 x i32> %max |
| } |
| |
| define <4 x i32> @test128_8b(<4 x i32> %x, <4 x i32> %x1, <4 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test128_8b: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpleud (%rdi), %xmm0, %k1 |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_8b: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpnltud %zmm0, %zmm2, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <4 x i32>, <4 x i32>* %y.ptr, align 4 |
| %mask = icmp uge <4 x i32> %y, %x |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %x1 |
| ret <4 x i32> %max |
| } |
| |
| define <4 x i32> @test128_9(<4 x i32> %x, <4 x i32> %y, <4 x i32> %x1, <4 x i32> %y1) nounwind { |
| ; VLX-LABEL: test128_9: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpeqd %xmm1, %xmm0, %k1 |
| ; VLX-NEXT: vpcmpeqd %xmm3, %xmm2, %k1 {%k1} |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_9: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm3 killed $xmm3 def $zmm3 |
| ; NoVLX-NEXT: # kill: def $xmm2 killed $xmm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpeqd %zmm1, %zmm0, %k1 |
| ; NoVLX-NEXT: vpcmpeqd %zmm3, %zmm2, %k1 {%k1} |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask1 = icmp eq <4 x i32> %x1, %y1 |
| %mask0 = icmp eq <4 x i32> %x, %y |
| %mask = select <4 x i1> %mask0, <4 x i1> %mask1, <4 x i1> zeroinitializer |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %y |
| ret <4 x i32> %max |
| } |
| |
| define <2 x i64> @test128_10(<2 x i64> %x, <2 x i64> %y, <2 x i64> %x1, <2 x i64> %y1) nounwind { |
| ; VLX-LABEL: test128_10: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpleq %xmm1, %xmm0, %k1 |
| ; VLX-NEXT: vpcmpnltq %xmm3, %xmm2, %k1 {%k1} |
| ; VLX-NEXT: vpblendmq %xmm0, %xmm2, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_10: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm3 killed $xmm3 def $zmm3 |
| ; NoVLX-NEXT: # kill: def $xmm2 killed $xmm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpleq %zmm1, %zmm0, %k1 |
| ; NoVLX-NEXT: vpcmpnltq %zmm3, %zmm2, %k1 {%k1} |
| ; NoVLX-NEXT: vpblendmq %zmm0, %zmm2, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask1 = icmp sge <2 x i64> %x1, %y1 |
| %mask0 = icmp sle <2 x i64> %x, %y |
| %mask = select <2 x i1> %mask0, <2 x i1> %mask1, <2 x i1> zeroinitializer |
| %max = select <2 x i1> %mask, <2 x i64> %x, <2 x i64> %x1 |
| ret <2 x i64> %max |
| } |
| |
| define <2 x i64> @test128_11(<2 x i64> %x, <2 x i64>* %y.ptr, <2 x i64> %x1, <2 x i64> %y1) nounwind { |
| ; VLX-LABEL: test128_11: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpgtq %xmm2, %xmm1, %k1 |
| ; VLX-NEXT: vpcmpgtq (%rdi), %xmm0, %k1 {%k1} |
| ; VLX-NEXT: vpblendmq %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_11: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm2 killed $xmm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %xmm3 |
| ; NoVLX-NEXT: vpcmpgtq %zmm3, %zmm0, %k1 |
| ; NoVLX-NEXT: vpcmpgtq %zmm2, %zmm1, %k1 {%k1} |
| ; NoVLX-NEXT: vpblendmq %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask1 = icmp sgt <2 x i64> %x1, %y1 |
| %y = load <2 x i64>, <2 x i64>* %y.ptr, align 4 |
| %mask0 = icmp sgt <2 x i64> %x, %y |
| %mask = select <2 x i1> %mask0, <2 x i1> %mask1, <2 x i1> zeroinitializer |
| %max = select <2 x i1> %mask, <2 x i64> %x, <2 x i64> %x1 |
| ret <2 x i64> %max |
| } |
| |
| define <4 x i32> @test128_12(<4 x i32> %x, <4 x i32>* %y.ptr, <4 x i32> %x1, <4 x i32> %y1) nounwind { |
| ; VLX-LABEL: test128_12: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpnltd %xmm2, %xmm1, %k1 |
| ; VLX-NEXT: vpcmpleud (%rdi), %xmm0, %k1 {%k1} |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_12: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm2 killed $xmm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %xmm3 |
| ; NoVLX-NEXT: vpcmpleud %zmm3, %zmm0, %k1 |
| ; NoVLX-NEXT: vpcmpnltd %zmm2, %zmm1, %k1 {%k1} |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask1 = icmp sge <4 x i32> %x1, %y1 |
| %y = load <4 x i32>, <4 x i32>* %y.ptr, align 4 |
| %mask0 = icmp ule <4 x i32> %x, %y |
| %mask = select <4 x i1> %mask0, <4 x i1> %mask1, <4 x i1> zeroinitializer |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %x1 |
| ret <4 x i32> %max |
| } |
| |
| define <2 x i64> @test128_13(<2 x i64> %x, <2 x i64> %x1, i64* %yb.ptr) nounwind { |
| ; VLX-LABEL: test128_13: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpeqq (%rdi){1to2}, %xmm0, %k1 |
| ; VLX-NEXT: vpblendmq %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_13: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vpbroadcastq (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpeqq %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmq %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %yb = load i64, i64* %yb.ptr, align 4 |
| %y.0 = insertelement <2 x i64> undef, i64 %yb, i32 0 |
| %y = insertelement <2 x i64> %y.0, i64 %yb, i32 1 |
| %mask = icmp eq <2 x i64> %x, %y |
| %max = select <2 x i1> %mask, <2 x i64> %x, <2 x i64> %x1 |
| ret <2 x i64> %max |
| } |
| |
| define <4 x i32> @test128_14(<4 x i32> %x, i32* %yb.ptr, <4 x i32> %x1) nounwind { |
| ; VLX-LABEL: test128_14: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpled (%rdi){1to4}, %xmm0, %k1 |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_14: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vpbroadcastd (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpled %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %yb = load i32, i32* %yb.ptr, align 4 |
| %y.0 = insertelement <4 x i32> undef, i32 %yb, i32 0 |
| %y = shufflevector <4 x i32> %y.0, <4 x i32> undef, <4 x i32> zeroinitializer |
| %mask = icmp sle <4 x i32> %x, %y |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %x1 |
| ret <4 x i32> %max |
| } |
| |
| define <4 x i32> @test128_15(<4 x i32> %x, i32* %yb.ptr, <4 x i32> %x1, <4 x i32> %y1) nounwind { |
| ; VLX-LABEL: test128_15: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpnltd %xmm2, %xmm1, %k1 |
| ; VLX-NEXT: vpcmpgtd (%rdi){1to4}, %xmm0, %k1 {%k1} |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_15: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm2 killed $xmm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpnltd %zmm2, %zmm1, %k1 |
| ; NoVLX-NEXT: vpbroadcastd (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpgtd %zmm2, %zmm0, %k1 {%k1} |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask1 = icmp sge <4 x i32> %x1, %y1 |
| %yb = load i32, i32* %yb.ptr, align 4 |
| %y.0 = insertelement <4 x i32> undef, i32 %yb, i32 0 |
| %y = shufflevector <4 x i32> %y.0, <4 x i32> undef, <4 x i32> zeroinitializer |
| %mask0 = icmp sgt <4 x i32> %x, %y |
| %mask = select <4 x i1> %mask0, <4 x i1> %mask1, <4 x i1> zeroinitializer |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %x1 |
| ret <4 x i32> %max |
| } |
| |
| define <2 x i64> @test128_16(<2 x i64> %x, i64* %yb.ptr, <2 x i64> %x1, <2 x i64> %y1) nounwind { |
| ; VLX-LABEL: test128_16: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpnltq %xmm2, %xmm1, %k1 |
| ; VLX-NEXT: vpcmpgtq (%rdi){1to2}, %xmm0, %k1 {%k1} |
| ; VLX-NEXT: vpblendmq %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_16: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm2 killed $xmm2 def $zmm2 |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vpcmpnltq %zmm2, %zmm1, %k1 |
| ; NoVLX-NEXT: vpbroadcastq (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpgtq %zmm2, %zmm0, %k1 {%k1} |
| ; NoVLX-NEXT: vpblendmq %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %mask1 = icmp sge <2 x i64> %x1, %y1 |
| %yb = load i64, i64* %yb.ptr, align 4 |
| %y.0 = insertelement <2 x i64> undef, i64 %yb, i32 0 |
| %y = insertelement <2 x i64> %y.0, i64 %yb, i32 1 |
| %mask0 = icmp sgt <2 x i64> %x, %y |
| %mask = select <2 x i1> %mask0, <2 x i1> %mask1, <2 x i1> zeroinitializer |
| %max = select <2 x i1> %mask, <2 x i64> %x, <2 x i64> %x1 |
| ret <2 x i64> %max |
| } |
| |
| define <4 x i32> @test128_17(<4 x i32> %x, <4 x i32> %x1, <4 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test128_17: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpneqd (%rdi), %xmm0, %k1 |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_17: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpneqd %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <4 x i32>, <4 x i32>* %y.ptr, align 4 |
| %mask = icmp ne <4 x i32> %x, %y |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %x1 |
| ret <4 x i32> %max |
| } |
| |
| define <4 x i32> @test128_18(<4 x i32> %x, <4 x i32> %x1, <4 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test128_18: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpneqd (%rdi), %xmm0, %k1 |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_18: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpneqd %zmm0, %zmm2, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <4 x i32>, <4 x i32>* %y.ptr, align 4 |
| %mask = icmp ne <4 x i32> %y, %x |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %x1 |
| ret <4 x i32> %max |
| } |
| |
| define <4 x i32> @test128_19(<4 x i32> %x, <4 x i32> %x1, <4 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test128_19: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpnltud (%rdi), %xmm0, %k1 |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_19: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpnltud %zmm2, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <4 x i32>, <4 x i32>* %y.ptr, align 4 |
| %mask = icmp uge <4 x i32> %x, %y |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %x1 |
| ret <4 x i32> %max |
| } |
| |
| define <4 x i32> @test128_20(<4 x i32> %x, <4 x i32> %x1, <4 x i32>* %y.ptr) nounwind { |
| ; VLX-LABEL: test128_20: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpcmpleud (%rdi), %xmm0, %k1 |
| ; VLX-NEXT: vpblendmd %xmm0, %xmm1, %xmm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: test128_20: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $xmm1 killed $xmm1 def $zmm1 |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 def $zmm0 |
| ; NoVLX-NEXT: vmovdqu (%rdi), %xmm2 |
| ; NoVLX-NEXT: vpcmpnltud %zmm0, %zmm2, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm0, %zmm1, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $xmm0 killed $xmm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %y = load <4 x i32>, <4 x i32>* %y.ptr, align 4 |
| %mask = icmp uge <4 x i32> %y, %x |
| %max = select <4 x i1> %mask, <4 x i32> %x, <4 x i32> %x1 |
| ret <4 x i32> %max |
| } |
| |
| define <8 x i32> @testnm_and(<8 x i32> %a, <8 x i32> %b, <8 x i32> %x, <8 x i32> %y) { |
| ; VLX-LABEL: testnm_and: |
| ; VLX: # %bb.0: |
| ; VLX-NEXT: vpor %ymm1, %ymm0, %ymm0 |
| ; VLX-NEXT: vptestnmd %ymm0, %ymm0, %k1 |
| ; VLX-NEXT: vpblendmd %ymm2, %ymm3, %ymm0 {%k1} |
| ; VLX-NEXT: retq |
| ; |
| ; NoVLX-LABEL: testnm_and: |
| ; NoVLX: # %bb.0: |
| ; NoVLX-NEXT: # kill: def $ymm3 killed $ymm3 def $zmm3 |
| ; NoVLX-NEXT: # kill: def $ymm2 killed $ymm2 def $zmm2 |
| ; NoVLX-NEXT: vpor %ymm1, %ymm0, %ymm0 |
| ; NoVLX-NEXT: vptestnmd %zmm0, %zmm0, %k1 |
| ; NoVLX-NEXT: vpblendmd %zmm2, %zmm3, %zmm0 {%k1} |
| ; NoVLX-NEXT: # kill: def $ymm0 killed $ymm0 killed $zmm0 |
| ; NoVLX-NEXT: retq |
| %c = icmp eq <8 x i32> %a, zeroinitializer |
| %d = icmp eq <8 x i32> %b, zeroinitializer |
| %e = and <8 x i1> %c, %d |
| %z = select <8 x i1> %e, <8 x i32> %x, <8 x i32> %y |
| ret <8 x i32> %z |
| } |