| ; RUN: llc < %s -mtriple=i686-- -mattr=+mmx,+ssse3,-avx | FileCheck %s --check-prefix=ALL --check-prefix=X86 |
| ; RUN: llc < %s -mtriple=i686-- -mattr=+mmx,+avx | FileCheck %s --check-prefix=ALL --check-prefix=X86 |
| ; RUN: llc < %s -mtriple=x86_64-- -mattr=+mmx,+ssse3,-avx | FileCheck %s --check-prefix=ALL --check-prefix=X64 |
| ; RUN: llc < %s -mtriple=x86_64-- -mattr=+mmx,+avx | FileCheck %s --check-prefix=ALL --check-prefix=X64 |
| |
| declare x86_mmx @llvm.x86.ssse3.phadd.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test1(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test1 |
| ; ALL: phaddw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %2 = bitcast <4 x i16> %1 to x86_mmx |
| %3 = bitcast <4 x i16> %0 to x86_mmx |
| %4 = tail call x86_mmx @llvm.x86.ssse3.phadd.w(x86_mmx %2, x86_mmx %3) nounwind readnone |
| %5 = bitcast x86_mmx %4 to <4 x i16> |
| %6 = bitcast <4 x i16> %5 to <1 x i64> |
| %7 = extractelement <1 x i64> %6, i32 0 |
| ret i64 %7 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pcmpgt.d(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test88(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test88 |
| ; ALL: pcmpgtd |
| entry: |
| %0 = bitcast <1 x i64> %b to <2 x i32> |
| %1 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %1 to x86_mmx |
| %mmx_var1.i = bitcast <2 x i32> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pcmpgt.d(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <2 x i32> |
| %4 = bitcast <2 x i32> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pcmpgt.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test87(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test87 |
| ; ALL: pcmpgtw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pcmpgt.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pcmpgt.b(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test86(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test86 |
| ; ALL: pcmpgtb |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %1 to x86_mmx |
| %mmx_var1.i = bitcast <8 x i8> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pcmpgt.b(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pcmpeq.d(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test85(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test85 |
| ; ALL: pcmpeqd |
| entry: |
| %0 = bitcast <1 x i64> %b to <2 x i32> |
| %1 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %1 to x86_mmx |
| %mmx_var1.i = bitcast <2 x i32> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pcmpeq.d(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <2 x i32> |
| %4 = bitcast <2 x i32> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pcmpeq.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test84(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test84 |
| ; ALL: pcmpeqw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pcmpeq.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pcmpeq.b(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test83(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test83 |
| ; ALL: pcmpeqb |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %1 to x86_mmx |
| %mmx_var1.i = bitcast <8 x i8> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pcmpeq.b(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.punpckldq(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test82(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test82 |
| ; X86: punpckldq {{.*#+}} mm0 = mm0[0],mem[0] |
| ; X64: punpckldq {{.*#+}} mm0 = mm0[0],mm1[0] |
| entry: |
| %0 = bitcast <1 x i64> %b to <2 x i32> |
| %1 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %1 to x86_mmx |
| %mmx_var1.i = bitcast <2 x i32> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.punpckldq(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <2 x i32> |
| %4 = bitcast <2 x i32> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.punpcklwd(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test81(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test81 |
| ; X86: punpcklwd {{.*#+}} mm0 = mm0[0],mem[0],mm0[1],mem[1] |
| ; X64: punpcklwd {{.*#+}} mm0 = mm0[0],mm1[0],mm0[1],mm1[1] |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.punpcklwd(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.punpcklbw(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test80(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test80 |
| ; X86: punpcklbw {{.*#+}} mm0 = mm0[0],mem[0],mm0[1],mem[1],mm0[2],mem[2],mm0[3],mem[3] |
| ; X64: punpcklbw {{.*#+}} mm0 = mm0[0],mm1[0],mm0[1],mm1[1],mm0[2],mm1[2],mm0[3],mm1[3] |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %1 to x86_mmx |
| %mmx_var1.i = bitcast <8 x i8> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.punpcklbw(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.punpckhdq(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test79(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test79 |
| ; X86: punpckhdq {{.*#+}} mm0 = mm0[1],mem[1] |
| ; X64: punpckhdq {{.*#+}} mm0 = mm0[1],mm1[1] |
| entry: |
| %0 = bitcast <1 x i64> %b to <2 x i32> |
| %1 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %1 to x86_mmx |
| %mmx_var1.i = bitcast <2 x i32> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.punpckhdq(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <2 x i32> |
| %4 = bitcast <2 x i32> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.punpckhwd(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test78(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test78 |
| ; X86: punpckhwd {{.*#+}} mm0 = mm0[2],mem[2],mm0[3],mem[3] |
| ; X64: punpckhwd {{.*#+}} mm0 = mm0[2],mm1[2],mm0[3],mm1[3] |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.punpckhwd(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.punpckhbw(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test77(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test77 |
| ; X86: punpckhbw {{.*#+}} mm0 = mm0[4],mem[4],mm0[5],mem[5],mm0[6],mem[6],mm0[7],mem[7] |
| ; X64: punpckhbw {{.*#+}} mm0 = mm0[4],mm1[4],mm0[5],mm1[5],mm0[6],mm1[6],mm0[7],mm1[7] |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %1 to x86_mmx |
| %mmx_var1.i = bitcast <8 x i8> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.punpckhbw(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.packuswb(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test76(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test76 |
| ; ALL: packuswb |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.packuswb(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.packssdw(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test75(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test75 |
| ; ALL: packssdw |
| entry: |
| %0 = bitcast <1 x i64> %b to <2 x i32> |
| %1 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %1 to x86_mmx |
| %mmx_var1.i = bitcast <2 x i32> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.packssdw(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.packsswb(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test74(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test74 |
| ; ALL: packsswb |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.packsswb(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psrai.d(x86_mmx, i32) nounwind readnone |
| |
| define i64 @test73(<1 x i64> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test73 |
| ; ALL: psrad |
| entry: |
| %0 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %0 to x86_mmx |
| %1 = tail call x86_mmx @llvm.x86.mmx.psrai.d(x86_mmx %mmx_var.i, i32 3) nounwind |
| %2 = bitcast x86_mmx %1 to <2 x i32> |
| %3 = bitcast <2 x i32> %2 to <1 x i64> |
| %4 = extractelement <1 x i64> %3, i32 0 |
| ret i64 %4 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psrai.w(x86_mmx, i32) nounwind readnone |
| |
| define i64 @test72(<1 x i64> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test72 |
| ; ALL: psraw |
| entry: |
| %0 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %0 to x86_mmx |
| %1 = tail call x86_mmx @llvm.x86.mmx.psrai.w(x86_mmx %mmx_var.i, i32 3) nounwind |
| %2 = bitcast x86_mmx %1 to <4 x i16> |
| %3 = bitcast <4 x i16> %2 to <1 x i64> |
| %4 = extractelement <1 x i64> %3, i32 0 |
| ret i64 %4 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psrli.q(x86_mmx, i32) nounwind readnone |
| |
| define i64 @test71(<1 x i64> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test71 |
| ; ALL: psrlq |
| entry: |
| %0 = extractelement <1 x i64> %a, i32 0 |
| %mmx_var.i = bitcast i64 %0 to x86_mmx |
| %1 = tail call x86_mmx @llvm.x86.mmx.psrli.q(x86_mmx %mmx_var.i, i32 3) nounwind |
| %2 = bitcast x86_mmx %1 to i64 |
| ret i64 %2 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psrli.d(x86_mmx, i32) nounwind readnone |
| |
| define i64 @test70(<1 x i64> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test70 |
| ; ALL: psrld |
| entry: |
| %0 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %0 to x86_mmx |
| %1 = tail call x86_mmx @llvm.x86.mmx.psrli.d(x86_mmx %mmx_var.i, i32 3) nounwind |
| %2 = bitcast x86_mmx %1 to <2 x i32> |
| %3 = bitcast <2 x i32> %2 to <1 x i64> |
| %4 = extractelement <1 x i64> %3, i32 0 |
| ret i64 %4 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psrli.w(x86_mmx, i32) nounwind readnone |
| |
| define i64 @test69(<1 x i64> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test69 |
| ; ALL: psrlw |
| entry: |
| %0 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %0 to x86_mmx |
| %1 = tail call x86_mmx @llvm.x86.mmx.psrli.w(x86_mmx %mmx_var.i, i32 3) nounwind |
| %2 = bitcast x86_mmx %1 to <4 x i16> |
| %3 = bitcast <4 x i16> %2 to <1 x i64> |
| %4 = extractelement <1 x i64> %3, i32 0 |
| ret i64 %4 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pslli.q(x86_mmx, i32) nounwind readnone |
| |
| define i64 @test68(<1 x i64> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test68 |
| ; ALL: psllq |
| entry: |
| %0 = extractelement <1 x i64> %a, i32 0 |
| %mmx_var.i = bitcast i64 %0 to x86_mmx |
| %1 = tail call x86_mmx @llvm.x86.mmx.pslli.q(x86_mmx %mmx_var.i, i32 3) nounwind |
| %2 = bitcast x86_mmx %1 to i64 |
| ret i64 %2 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pslli.d(x86_mmx, i32) nounwind readnone |
| |
| define i64 @test67(<1 x i64> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test67 |
| ; ALL: pslld |
| entry: |
| %0 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %0 to x86_mmx |
| %1 = tail call x86_mmx @llvm.x86.mmx.pslli.d(x86_mmx %mmx_var.i, i32 3) nounwind |
| %2 = bitcast x86_mmx %1 to <2 x i32> |
| %3 = bitcast <2 x i32> %2 to <1 x i64> |
| %4 = extractelement <1 x i64> %3, i32 0 |
| ret i64 %4 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pslli.w(x86_mmx, i32) nounwind readnone |
| |
| define i64 @test66(<1 x i64> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test66 |
| ; ALL: psllw |
| entry: |
| %0 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %0 to x86_mmx |
| %1 = tail call x86_mmx @llvm.x86.mmx.pslli.w(x86_mmx %mmx_var.i, i32 3) nounwind |
| %2 = bitcast x86_mmx %1 to <4 x i16> |
| %3 = bitcast <4 x i16> %2 to <1 x i64> |
| %4 = extractelement <1 x i64> %3, i32 0 |
| ret i64 %4 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psra.d(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test65(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test65 |
| ; ALL: psrad |
| entry: |
| %0 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %0 to x86_mmx |
| %1 = extractelement <1 x i64> %b, i32 0 |
| %mmx_var1.i = bitcast i64 %1 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psra.d(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <2 x i32> |
| %4 = bitcast <2 x i32> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psra.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test64(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test64 |
| ; ALL: psraw |
| entry: |
| %0 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %0 to x86_mmx |
| %1 = extractelement <1 x i64> %b, i32 0 |
| %mmx_var1.i = bitcast i64 %1 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psra.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psrl.q(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test63(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test63 |
| ; ALL: psrlq |
| entry: |
| %0 = extractelement <1 x i64> %a, i32 0 |
| %mmx_var.i = bitcast i64 %0 to x86_mmx |
| %1 = extractelement <1 x i64> %b, i32 0 |
| %mmx_var1.i = bitcast i64 %1 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psrl.q(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to i64 |
| ret i64 %3 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psrl.d(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test62(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test62 |
| ; ALL: psrld |
| entry: |
| %0 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %0 to x86_mmx |
| %1 = extractelement <1 x i64> %b, i32 0 |
| %mmx_var1.i = bitcast i64 %1 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psrl.d(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <2 x i32> |
| %4 = bitcast <2 x i32> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psrl.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test61(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test61 |
| ; ALL: psrlw |
| entry: |
| %0 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %0 to x86_mmx |
| %1 = extractelement <1 x i64> %b, i32 0 |
| %mmx_var1.i = bitcast i64 %1 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psrl.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psll.q(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test60(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test60 |
| ; ALL: psllq |
| entry: |
| %0 = extractelement <1 x i64> %a, i32 0 |
| %mmx_var.i = bitcast i64 %0 to x86_mmx |
| %1 = extractelement <1 x i64> %b, i32 0 |
| %mmx_var1.i = bitcast i64 %1 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psll.q(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to i64 |
| ret i64 %3 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psll.d(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test59(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test59 |
| ; ALL: pslld |
| entry: |
| %0 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %0 to x86_mmx |
| %1 = extractelement <1 x i64> %b, i32 0 |
| %mmx_var1.i = bitcast i64 %1 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psll.d(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <2 x i32> |
| %4 = bitcast <2 x i32> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psll.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test58(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test58 |
| ; ALL: psllw |
| entry: |
| %0 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %0 to x86_mmx |
| %1 = extractelement <1 x i64> %b, i32 0 |
| %mmx_var1.i = bitcast i64 %1 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psll.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pxor(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test56(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test56 |
| ; ALL: pxor |
| entry: |
| %0 = bitcast <1 x i64> %b to <2 x i32> |
| %1 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %1 to x86_mmx |
| %mmx_var1.i = bitcast <2 x i32> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pxor(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <2 x i32> |
| %4 = bitcast <2 x i32> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.por(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test55(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test55 |
| ; ALL: por |
| entry: |
| %0 = bitcast <1 x i64> %b to <2 x i32> |
| %1 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %1 to x86_mmx |
| %mmx_var1.i = bitcast <2 x i32> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.por(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <2 x i32> |
| %4 = bitcast <2 x i32> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pandn(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test54(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test54 |
| ; ALL: pandn |
| entry: |
| %0 = bitcast <1 x i64> %b to <2 x i32> |
| %1 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %1 to x86_mmx |
| %mmx_var1.i = bitcast <2 x i32> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pandn(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <2 x i32> |
| %4 = bitcast <2 x i32> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pand(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test53(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test53 |
| ; ALL: pand |
| entry: |
| %0 = bitcast <1 x i64> %b to <2 x i32> |
| %1 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %1 to x86_mmx |
| %mmx_var1.i = bitcast <2 x i32> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pand(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <2 x i32> |
| %4 = bitcast <2 x i32> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pmull.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test52(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test52 |
| ; ALL: pmullw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pmull.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| define i64 @test51(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test51 |
| ; ALL: pmullw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pmull.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pmulh.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test50(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test50 |
| ; ALL: pmulhw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pmulh.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pmadd.wd(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test49(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test49 |
| ; ALL: pmaddwd |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pmadd.wd(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <2 x i32> |
| %4 = bitcast <2 x i32> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psubus.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test48(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test48 |
| ; ALL: psubusw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psubus.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psubus.b(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test47(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test47 |
| ; ALL: psubusb |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %1 to x86_mmx |
| %mmx_var1.i = bitcast <8 x i8> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psubus.b(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psubs.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test46(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test46 |
| ; ALL: psubsw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psubs.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psubs.b(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test45(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test45 |
| ; ALL: psubsb |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %1 to x86_mmx |
| %mmx_var1.i = bitcast <8 x i8> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psubs.b(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| define i64 @test44(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test44 |
| ; ALL: psubq |
| entry: |
| %0 = extractelement <1 x i64> %a, i32 0 |
| %mmx_var = bitcast i64 %0 to x86_mmx |
| %1 = extractelement <1 x i64> %b, i32 0 |
| %mmx_var1 = bitcast i64 %1 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psub.q(x86_mmx %mmx_var, x86_mmx %mmx_var1) |
| %3 = bitcast x86_mmx %2 to i64 |
| ret i64 %3 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psub.q(x86_mmx, x86_mmx) nounwind readnone |
| |
| declare x86_mmx @llvm.x86.mmx.psub.d(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test43(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test43 |
| ; ALL: psubd |
| entry: |
| %0 = bitcast <1 x i64> %b to <2 x i32> |
| %1 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %1 to x86_mmx |
| %mmx_var1.i = bitcast <2 x i32> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psub.d(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <2 x i32> |
| %4 = bitcast <2 x i32> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psub.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test42(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test42 |
| ; ALL: psubw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psub.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psub.b(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test41(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test41 |
| ; ALL: psubb |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %1 to x86_mmx |
| %mmx_var1.i = bitcast <8 x i8> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psub.b(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.paddus.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test40(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test40 |
| ; ALL: paddusw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.paddus.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.paddus.b(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test39(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test39 |
| ; ALL: paddusb |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %1 to x86_mmx |
| %mmx_var1.i = bitcast <8 x i8> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.paddus.b(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.padds.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test38(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test38 |
| ; ALL: paddsw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.padds.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.padds.b(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test37(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test37 |
| ; ALL: paddsb |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %1 to x86_mmx |
| %mmx_var1.i = bitcast <8 x i8> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.padds.b(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.padd.q(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test36(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test36 |
| ; ALL: paddq |
| entry: |
| %0 = extractelement <1 x i64> %a, i32 0 |
| %mmx_var = bitcast i64 %0 to x86_mmx |
| %1 = extractelement <1 x i64> %b, i32 0 |
| %mmx_var1 = bitcast i64 %1 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.padd.q(x86_mmx %mmx_var, x86_mmx %mmx_var1) |
| %3 = bitcast x86_mmx %2 to i64 |
| ret i64 %3 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.padd.d(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test35(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test35 |
| ; ALL: paddd |
| entry: |
| %0 = bitcast <1 x i64> %b to <2 x i32> |
| %1 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %1 to x86_mmx |
| %mmx_var1.i = bitcast <2 x i32> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.padd.d(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <2 x i32> |
| %4 = bitcast <2 x i32> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.padd.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test34(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test34 |
| ; ALL: paddw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.padd.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.padd.b(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test33(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test33 |
| ; ALL: paddb |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %1 to x86_mmx |
| %mmx_var1.i = bitcast <8 x i8> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.padd.b(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.psad.bw(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test32(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test32 |
| ; ALL: psadbw |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %1 to x86_mmx |
| %mmx_var1.i = bitcast <8 x i8> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.psad.bw(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to i64 |
| ret i64 %3 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pmins.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test31(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test31 |
| ; ALL: pminsw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pmins.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pminu.b(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test30(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test30 |
| ; ALL: pminub |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %1 to x86_mmx |
| %mmx_var1.i = bitcast <8 x i8> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pminu.b(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pmaxs.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test29(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test29 |
| ; ALL: pmaxsw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pmaxs.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pmaxu.b(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test28(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test28 |
| ; ALL: pmaxub |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %1 to x86_mmx |
| %mmx_var1.i = bitcast <8 x i8> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pmaxu.b(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pavg.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test27(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test27 |
| ; ALL: pavgw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pavg.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pavg.b(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test26(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test26 |
| ; ALL: pavgb |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %1 to x86_mmx |
| %mmx_var1.i = bitcast <8 x i8> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pavg.b(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare void @llvm.x86.mmx.movnt.dq(x86_mmx*, x86_mmx) nounwind |
| |
| define void @test25(<1 x i64>* %p, <1 x i64> %a) nounwind optsize ssp { |
| ; ALL-LABEL: @test25 |
| ; ALL: movntq |
| entry: |
| %mmx_ptr_var.i = bitcast <1 x i64>* %p to x86_mmx* |
| %0 = extractelement <1 x i64> %a, i32 0 |
| %mmx_var.i = bitcast i64 %0 to x86_mmx |
| tail call void @llvm.x86.mmx.movnt.dq(x86_mmx* %mmx_ptr_var.i, x86_mmx %mmx_var.i) nounwind |
| ret void |
| } |
| |
| declare i32 @llvm.x86.mmx.pmovmskb(x86_mmx) nounwind readnone |
| |
| define i32 @test24(<1 x i64> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test24 |
| ; ALL: pmovmskb |
| entry: |
| %0 = bitcast <1 x i64> %a to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %0 to x86_mmx |
| %1 = tail call i32 @llvm.x86.mmx.pmovmskb(x86_mmx %mmx_var.i) nounwind |
| ret i32 %1 |
| } |
| |
| declare void @llvm.x86.mmx.maskmovq(x86_mmx, x86_mmx, i8*) nounwind |
| |
| define void @test23(<1 x i64> %d, <1 x i64> %n, i8* %p) nounwind optsize ssp { |
| ; ALL-LABEL: @test23 |
| ; ALL: maskmovq |
| entry: |
| %0 = bitcast <1 x i64> %n to <8 x i8> |
| %1 = bitcast <1 x i64> %d to <8 x i8> |
| %mmx_var.i = bitcast <8 x i8> %1 to x86_mmx |
| %mmx_var1.i = bitcast <8 x i8> %0 to x86_mmx |
| tail call void @llvm.x86.mmx.maskmovq(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i, i8* %p) nounwind |
| ret void |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pmulhu.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test22(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test22 |
| ; ALL: pmulhuw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %mmx_var.i = bitcast <4 x i16> %1 to x86_mmx |
| %mmx_var1.i = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pmulhu.w(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.sse.pshuf.w(x86_mmx, i8) nounwind readnone |
| |
| define i64 @test21(<1 x i64> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test21 |
| ; X86: pshufw {{.*#+}} mm0 = mem[3,0,0,0] |
| ; X64: pshufw {{.*#+}} mm0 = mm0[3,0,0,0] |
| entry: |
| %0 = bitcast <1 x i64> %a to <4 x i16> |
| %1 = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.sse.pshuf.w(x86_mmx %1, i8 3) nounwind readnone |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| define i32 @test21_2(<1 x i64> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test21_2 |
| ; X86: pshufw {{.*#+}} mm0 = mem[3,0,0,0] |
| ; X64: pshufw {{.*#+}} mm0 = mm0[3,0,0,0] |
| ; ALL: movd |
| entry: |
| %0 = bitcast <1 x i64> %a to <4 x i16> |
| %1 = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.sse.pshuf.w(x86_mmx %1, i8 3) nounwind readnone |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <2 x i32> |
| %5 = extractelement <2 x i32> %4, i32 0 |
| ret i32 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.pmulu.dq(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test20(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test20 |
| ; ALL: pmuludq |
| entry: |
| %0 = bitcast <1 x i64> %b to <2 x i32> |
| %1 = bitcast <1 x i64> %a to <2 x i32> |
| %mmx_var.i = bitcast <2 x i32> %1 to x86_mmx |
| %mmx_var1.i = bitcast <2 x i32> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.pmulu.dq(x86_mmx %mmx_var.i, x86_mmx %mmx_var1.i) nounwind |
| %3 = bitcast x86_mmx %2 to i64 |
| ret i64 %3 |
| } |
| |
| declare <2 x double> @llvm.x86.sse.cvtpi2pd(x86_mmx) nounwind readnone |
| |
| define <2 x double> @test19(<1 x i64> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test19 |
| ; ALL: cvtpi2pd |
| entry: |
| %0 = bitcast <1 x i64> %a to <2 x i32> |
| %1 = bitcast <2 x i32> %0 to x86_mmx |
| %2 = tail call <2 x double> @llvm.x86.sse.cvtpi2pd(x86_mmx %1) nounwind readnone |
| ret <2 x double> %2 |
| } |
| |
| declare x86_mmx @llvm.x86.sse.cvttpd2pi(<2 x double>) nounwind readnone |
| |
| define i64 @test18(<2 x double> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test18 |
| ; ALL: cvttpd2pi |
| entry: |
| %0 = tail call x86_mmx @llvm.x86.sse.cvttpd2pi(<2 x double> %a) nounwind readnone |
| %1 = bitcast x86_mmx %0 to <2 x i32> |
| %2 = bitcast <2 x i32> %1 to <1 x i64> |
| %3 = extractelement <1 x i64> %2, i32 0 |
| ret i64 %3 |
| } |
| |
| declare x86_mmx @llvm.x86.sse.cvtpd2pi(<2 x double>) nounwind readnone |
| |
| define i64 @test17(<2 x double> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test17 |
| ; ALL: cvtpd2pi |
| entry: |
| %0 = tail call x86_mmx @llvm.x86.sse.cvtpd2pi(<2 x double> %a) nounwind readnone |
| %1 = bitcast x86_mmx %0 to <2 x i32> |
| %2 = bitcast <2 x i32> %1 to <1 x i64> |
| %3 = extractelement <1 x i64> %2, i32 0 |
| ret i64 %3 |
| } |
| |
| declare x86_mmx @llvm.x86.mmx.palignr.b(x86_mmx, x86_mmx, i8) nounwind readnone |
| |
| define i64 @test16(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test16 |
| ; ALL: palignr |
| entry: |
| %0 = extractelement <1 x i64> %a, i32 0 |
| %mmx_var = bitcast i64 %0 to x86_mmx |
| %1 = extractelement <1 x i64> %b, i32 0 |
| %mmx_var1 = bitcast i64 %1 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.mmx.palignr.b(x86_mmx %mmx_var, x86_mmx %mmx_var1, i8 16) |
| %3 = bitcast x86_mmx %2 to i64 |
| ret i64 %3 |
| } |
| |
| declare x86_mmx @llvm.x86.ssse3.pabs.d(x86_mmx) nounwind readnone |
| |
| define i64 @test15(<1 x i64> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test15 |
| ; ALL: pabsd |
| entry: |
| %0 = bitcast <1 x i64> %a to <2 x i32> |
| %1 = bitcast <2 x i32> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.ssse3.pabs.d(x86_mmx %1) nounwind readnone |
| %3 = bitcast x86_mmx %2 to <2 x i32> |
| %4 = bitcast <2 x i32> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.ssse3.pabs.w(x86_mmx) nounwind readnone |
| |
| define i64 @test14(<1 x i64> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test14 |
| ; ALL: pabsw |
| entry: |
| %0 = bitcast <1 x i64> %a to <4 x i16> |
| %1 = bitcast <4 x i16> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.ssse3.pabs.w(x86_mmx %1) nounwind readnone |
| %3 = bitcast x86_mmx %2 to <4 x i16> |
| %4 = bitcast <4 x i16> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.ssse3.pabs.b(x86_mmx) nounwind readnone |
| |
| define i64 @test13(<1 x i64> %a) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test13 |
| ; ALL: pabsb |
| entry: |
| %0 = bitcast <1 x i64> %a to <8 x i8> |
| %1 = bitcast <8 x i8> %0 to x86_mmx |
| %2 = tail call x86_mmx @llvm.x86.ssse3.pabs.b(x86_mmx %1) nounwind readnone |
| %3 = bitcast x86_mmx %2 to <8 x i8> |
| %4 = bitcast <8 x i8> %3 to <1 x i64> |
| %5 = extractelement <1 x i64> %4, i32 0 |
| ret i64 %5 |
| } |
| |
| declare x86_mmx @llvm.x86.ssse3.psign.d(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test12(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test12 |
| ; ALL: psignd |
| entry: |
| %0 = bitcast <1 x i64> %b to <2 x i32> |
| %1 = bitcast <1 x i64> %a to <2 x i32> |
| %2 = bitcast <2 x i32> %1 to x86_mmx |
| %3 = bitcast <2 x i32> %0 to x86_mmx |
| %4 = tail call x86_mmx @llvm.x86.ssse3.psign.d(x86_mmx %2, x86_mmx %3) nounwind readnone |
| %5 = bitcast x86_mmx %4 to <2 x i32> |
| %6 = bitcast <2 x i32> %5 to <1 x i64> |
| %7 = extractelement <1 x i64> %6, i32 0 |
| ret i64 %7 |
| } |
| |
| declare x86_mmx @llvm.x86.ssse3.psign.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test11(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test11 |
| ; ALL: psignw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %2 = bitcast <4 x i16> %1 to x86_mmx |
| %3 = bitcast <4 x i16> %0 to x86_mmx |
| %4 = tail call x86_mmx @llvm.x86.ssse3.psign.w(x86_mmx %2, x86_mmx %3) nounwind readnone |
| %5 = bitcast x86_mmx %4 to <4 x i16> |
| %6 = bitcast <4 x i16> %5 to <1 x i64> |
| %7 = extractelement <1 x i64> %6, i32 0 |
| ret i64 %7 |
| } |
| |
| declare x86_mmx @llvm.x86.ssse3.psign.b(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test10(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test10 |
| ; ALL: psignb |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %2 = bitcast <8 x i8> %1 to x86_mmx |
| %3 = bitcast <8 x i8> %0 to x86_mmx |
| %4 = tail call x86_mmx @llvm.x86.ssse3.psign.b(x86_mmx %2, x86_mmx %3) nounwind readnone |
| %5 = bitcast x86_mmx %4 to <8 x i8> |
| %6 = bitcast <8 x i8> %5 to <1 x i64> |
| %7 = extractelement <1 x i64> %6, i32 0 |
| ret i64 %7 |
| } |
| |
| declare x86_mmx @llvm.x86.ssse3.pshuf.b(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test9(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test9 |
| ; ALL: pshufb |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %2 = bitcast <8 x i8> %1 to x86_mmx |
| %3 = bitcast <8 x i8> %0 to x86_mmx |
| %4 = tail call x86_mmx @llvm.x86.ssse3.pshuf.b(x86_mmx %2, x86_mmx %3) nounwind readnone |
| %5 = bitcast x86_mmx %4 to <8 x i8> |
| %6 = bitcast <8 x i8> %5 to <1 x i64> |
| %7 = extractelement <1 x i64> %6, i32 0 |
| ret i64 %7 |
| } |
| |
| declare x86_mmx @llvm.x86.ssse3.pmul.hr.sw(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test8(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test8 |
| ; ALL: pmulhrsw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %2 = bitcast <4 x i16> %1 to x86_mmx |
| %3 = bitcast <4 x i16> %0 to x86_mmx |
| %4 = tail call x86_mmx @llvm.x86.ssse3.pmul.hr.sw(x86_mmx %2, x86_mmx %3) nounwind readnone |
| %5 = bitcast x86_mmx %4 to <4 x i16> |
| %6 = bitcast <4 x i16> %5 to <1 x i64> |
| %7 = extractelement <1 x i64> %6, i32 0 |
| ret i64 %7 |
| } |
| |
| declare x86_mmx @llvm.x86.ssse3.pmadd.ub.sw(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test7(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test7 |
| ; ALL: pmaddubsw |
| entry: |
| %0 = bitcast <1 x i64> %b to <8 x i8> |
| %1 = bitcast <1 x i64> %a to <8 x i8> |
| %2 = bitcast <8 x i8> %1 to x86_mmx |
| %3 = bitcast <8 x i8> %0 to x86_mmx |
| %4 = tail call x86_mmx @llvm.x86.ssse3.pmadd.ub.sw(x86_mmx %2, x86_mmx %3) nounwind readnone |
| %5 = bitcast x86_mmx %4 to <8 x i8> |
| %6 = bitcast <8 x i8> %5 to <1 x i64> |
| %7 = extractelement <1 x i64> %6, i32 0 |
| ret i64 %7 |
| } |
| |
| declare x86_mmx @llvm.x86.ssse3.phsub.sw(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test6(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test6 |
| ; ALL: phsubsw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %2 = bitcast <4 x i16> %1 to x86_mmx |
| %3 = bitcast <4 x i16> %0 to x86_mmx |
| %4 = tail call x86_mmx @llvm.x86.ssse3.phsub.sw(x86_mmx %2, x86_mmx %3) nounwind readnone |
| %5 = bitcast x86_mmx %4 to <4 x i16> |
| %6 = bitcast <4 x i16> %5 to <1 x i64> |
| %7 = extractelement <1 x i64> %6, i32 0 |
| ret i64 %7 |
| } |
| |
| declare x86_mmx @llvm.x86.ssse3.phsub.d(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test5(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test5 |
| ; ALL: phsubd |
| entry: |
| %0 = bitcast <1 x i64> %b to <2 x i32> |
| %1 = bitcast <1 x i64> %a to <2 x i32> |
| %2 = bitcast <2 x i32> %1 to x86_mmx |
| %3 = bitcast <2 x i32> %0 to x86_mmx |
| %4 = tail call x86_mmx @llvm.x86.ssse3.phsub.d(x86_mmx %2, x86_mmx %3) nounwind readnone |
| %5 = bitcast x86_mmx %4 to <2 x i32> |
| %6 = bitcast <2 x i32> %5 to <1 x i64> |
| %7 = extractelement <1 x i64> %6, i32 0 |
| ret i64 %7 |
| } |
| |
| declare x86_mmx @llvm.x86.ssse3.phsub.w(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test4(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test4 |
| ; ALL: phsubw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %2 = bitcast <4 x i16> %1 to x86_mmx |
| %3 = bitcast <4 x i16> %0 to x86_mmx |
| %4 = tail call x86_mmx @llvm.x86.ssse3.phsub.w(x86_mmx %2, x86_mmx %3) nounwind readnone |
| %5 = bitcast x86_mmx %4 to <4 x i16> |
| %6 = bitcast <4 x i16> %5 to <1 x i64> |
| %7 = extractelement <1 x i64> %6, i32 0 |
| ret i64 %7 |
| } |
| |
| declare x86_mmx @llvm.x86.ssse3.phadd.sw(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test3(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test3 |
| ; ALL: phaddsw |
| entry: |
| %0 = bitcast <1 x i64> %b to <4 x i16> |
| %1 = bitcast <1 x i64> %a to <4 x i16> |
| %2 = bitcast <4 x i16> %1 to x86_mmx |
| %3 = bitcast <4 x i16> %0 to x86_mmx |
| %4 = tail call x86_mmx @llvm.x86.ssse3.phadd.sw(x86_mmx %2, x86_mmx %3) nounwind readnone |
| %5 = bitcast x86_mmx %4 to <4 x i16> |
| %6 = bitcast <4 x i16> %5 to <1 x i64> |
| %7 = extractelement <1 x i64> %6, i32 0 |
| ret i64 %7 |
| } |
| |
| declare x86_mmx @llvm.x86.ssse3.phadd.d(x86_mmx, x86_mmx) nounwind readnone |
| |
| define i64 @test2(<1 x i64> %a, <1 x i64> %b) nounwind readnone optsize ssp { |
| ; ALL-LABEL: @test2 |
| ; ALL: phaddd |
| entry: |
| %0 = bitcast <1 x i64> %b to <2 x i32> |
| %1 = bitcast <1 x i64> %a to <2 x i32> |
| %2 = bitcast <2 x i32> %1 to x86_mmx |
| %3 = bitcast <2 x i32> %0 to x86_mmx |
| %4 = tail call x86_mmx @llvm.x86.ssse3.phadd.d(x86_mmx %2, x86_mmx %3) nounwind readnone |
| %5 = bitcast x86_mmx %4 to <2 x i32> |
| %6 = bitcast <2 x i32> %5 to <1 x i64> |
| %7 = extractelement <1 x i64> %6, i32 0 |
| ret i64 %7 |
| } |
| |
| define <4 x float> @test89(<4 x float> %a, x86_mmx %b) nounwind { |
| ; ALL-LABEL: @test89 |
| ; ALL: cvtpi2ps |
| %c = tail call <4 x float> @llvm.x86.sse.cvtpi2ps(<4 x float> %a, x86_mmx %b) |
| ret <4 x float> %c |
| } |
| |
| declare <4 x float> @llvm.x86.sse.cvtpi2ps(<4 x float>, x86_mmx) nounwind readnone |
| |
| ; ALL-LABEL: test90 |
| define void @test90() { |
| ; ALL-LABEL: @test90 |
| ; ALL: emms |
| call void @llvm.x86.mmx.emms() |
| ret void |
| } |
| |
| declare void @llvm.x86.mmx.emms() |