| ; RUN: llc < %s -march=sparcv9 -mattr=+popc -disable-sparc-delay-filler -disable-sparc-leaf-proc | FileCheck %s |
| ; RUN: llc < %s -march=sparcv9 -mattr=+popc | FileCheck %s -check-prefix=OPT |
| |
| ; CHECK-LABEL: ret2: |
| ; CHECK: mov %i1, %i0 |
| |
| ; OPT-LABEL: ret2: |
| ; OPT: retl |
| ; OPT: mov %o1, %o0 |
| define i64 @ret2(i64 %a, i64 %b) { |
| ret i64 %b |
| } |
| |
| ; CHECK: shl_imm |
| ; CHECK: sllx %i0, 7, %i0 |
| |
| ; OPT-LABEL: shl_imm: |
| ; OPT: retl |
| ; OPT: sllx %o0, 7, %o0 |
| define i64 @shl_imm(i64 %a) { |
| %x = shl i64 %a, 7 |
| ret i64 %x |
| } |
| |
| ; CHECK: sra_reg |
| ; CHECK: srax %i0, %i1, %i0 |
| |
| ; OPT-LABEL: sra_reg: |
| ; OPT: retl |
| ; OPT: srax %o0, %o1, %o0 |
| define i64 @sra_reg(i64 %a, i64 %b) { |
| %x = ashr i64 %a, %b |
| ret i64 %x |
| } |
| |
| ; Immediate materialization. Many of these patterns could actually be merged |
| ; into the restore instruction: |
| ; |
| ; restore %g0, %g0, %o0 |
| ; |
| ; CHECK: ret_imm0 |
| ; CHECK: mov 0, %i0 |
| |
| ; OPT: ret_imm0 |
| ; OPT: retl |
| ; OPT: mov 0, %o0 |
| define i64 @ret_imm0() { |
| ret i64 0 |
| } |
| |
| ; CHECK: ret_simm13 |
| ; CHECK: mov -4096, %i0 |
| |
| ; OPT: ret_simm13 |
| ; OPT: retl |
| ; OPT: mov -4096, %o0 |
| define i64 @ret_simm13() { |
| ret i64 -4096 |
| } |
| |
| ; CHECK: ret_sethi |
| ; CHECK: sethi 4, %i0 |
| ; CHECK-NOT: or |
| ; CHECK: restore |
| |
| ; OPT: ret_sethi |
| ; OPT: retl |
| ; OPT: sethi 4, %o0 |
| define i64 @ret_sethi() { |
| ret i64 4096 |
| } |
| |
| ; CHECK: ret_sethi_or |
| ; CHECK: sethi 4, [[R:%[goli][0-7]]] |
| ; CHECK: or [[R]], 1, %i0 |
| |
| ; OPT: ret_sethi_or |
| ; OPT: sethi 4, [[R:%[go][0-7]]] |
| ; OPT: retl |
| ; OPT: or [[R]], 1, %o0 |
| |
| define i64 @ret_sethi_or() { |
| ret i64 4097 |
| } |
| |
| ; CHECK: ret_nimm33 |
| ; CHECK: sethi 4, [[R:%[goli][0-7]]] |
| ; CHECK: xor [[R]], -4, %i0 |
| |
| ; OPT: ret_nimm33 |
| ; OPT: sethi 4, [[R:%[go][0-7]]] |
| ; OPT: retl |
| ; OPT: xor [[R]], -4, %o0 |
| |
| define i64 @ret_nimm33() { |
| ret i64 -4100 |
| } |
| |
| ; CHECK: ret_bigimm |
| ; CHECK: sethi |
| ; CHECK: sethi |
| define i64 @ret_bigimm() { |
| ret i64 6800754272627607872 |
| } |
| |
| ; CHECK: ret_bigimm2 |
| ; CHECK: sethi 1048576 |
| define i64 @ret_bigimm2() { |
| ret i64 4611686018427387904 ; 0x4000000000000000 |
| } |
| |
| ; CHECK: reg_reg_alu |
| ; CHECK: add %i0, %i1, [[R0:%[goli][0-7]]] |
| ; CHECK: sub [[R0]], %i2, [[R1:%[goli][0-7]]] |
| ; CHECK: andn [[R1]], %i0, %i0 |
| define i64 @reg_reg_alu(i64 %x, i64 %y, i64 %z) { |
| %a = add i64 %x, %y |
| %b = sub i64 %a, %z |
| %c = xor i64 %x, -1 |
| %d = and i64 %b, %c |
| ret i64 %d |
| } |
| |
| ; CHECK: reg_imm_alu |
| ; CHECK: add %i0, -5, [[R0:%[goli][0-7]]] |
| ; CHECK: xor [[R0]], 2, %i0 |
| define i64 @reg_imm_alu(i64 %x, i64 %y, i64 %z) { |
| %a = add i64 %x, -5 |
| %b = xor i64 %a, 2 |
| ret i64 %b |
| } |
| |
| ; CHECK: loads |
| ; CHECK: ldx [%i0] |
| ; CHECK: stx % |
| ; CHECK: ld [%i1] |
| ; CHECK: st % |
| ; CHECK: ldsw [%i2] |
| ; CHECK: stx % |
| ; CHECK: ldsh [%i3] |
| ; CHECK: sth % |
| define i64 @loads(i64* %p, i32* %q, i32* %r, i16* %s) { |
| %a = load i64, i64* %p |
| %ai = add i64 1, %a |
| store i64 %ai, i64* %p |
| %b = load i32, i32* %q |
| %b2 = zext i32 %b to i64 |
| %bi = trunc i64 %ai to i32 |
| store i32 %bi, i32* %q |
| %c = load i32, i32* %r |
| %c2 = sext i32 %c to i64 |
| store i64 %ai, i64* %p |
| %d = load i16, i16* %s |
| %d2 = sext i16 %d to i64 |
| %di = trunc i64 %ai to i16 |
| store i16 %di, i16* %s |
| |
| %x1 = add i64 %a, %b2 |
| %x2 = add i64 %c2, %d2 |
| %x3 = add i64 %x1, %x2 |
| ret i64 %x3 |
| } |
| |
| ; CHECK: load_bool |
| ; CHECK: ldub [%i0], %i0 |
| define i64 @load_bool(i1* %p) { |
| %a = load i1, i1* %p |
| %b = zext i1 %a to i64 |
| ret i64 %b |
| } |
| |
| ; CHECK: stores |
| ; CHECK: ldx [%i0+8], [[R:%[goli][0-7]]] |
| ; CHECK: stx [[R]], [%i0+16] |
| ; CHECK: st [[R]], [%i1+-8] |
| ; CHECK: sth [[R]], [%i2+40] |
| ; CHECK: stb [[R]], [%i3+-20] |
| define void @stores(i64* %p, i32* %q, i16* %r, i8* %s) { |
| %p1 = getelementptr i64, i64* %p, i64 1 |
| %p2 = getelementptr i64, i64* %p, i64 2 |
| %pv = load i64, i64* %p1 |
| store i64 %pv, i64* %p2 |
| |
| %q2 = getelementptr i32, i32* %q, i32 -2 |
| %qv = trunc i64 %pv to i32 |
| store i32 %qv, i32* %q2 |
| |
| %r2 = getelementptr i16, i16* %r, i16 20 |
| %rv = trunc i64 %pv to i16 |
| store i16 %rv, i16* %r2 |
| |
| %s2 = getelementptr i8, i8* %s, i8 -20 |
| %sv = trunc i64 %pv to i8 |
| store i8 %sv, i8* %s2 |
| |
| ret void |
| } |
| |
| ; CHECK: promote_shifts |
| ; CHECK: ldub [%i0], [[R:%[goli][0-7]]] |
| ; CHECK: sll [[R]], [[R]], %i0 |
| define i8 @promote_shifts(i8* %p) { |
| %L24 = load i8, i8* %p |
| %L32 = load i8, i8* %p |
| %B36 = shl i8 %L24, %L32 |
| ret i8 %B36 |
| } |
| |
| ; CHECK: multiply |
| ; CHECK: mulx %i0, %i1, %i0 |
| define i64 @multiply(i64 %a, i64 %b) { |
| %r = mul i64 %a, %b |
| ret i64 %r |
| } |
| |
| ; CHECK: signed_divide |
| ; CHECK: sdivx %i0, %i1, %i0 |
| define i64 @signed_divide(i64 %a, i64 %b) { |
| %r = sdiv i64 %a, %b |
| ret i64 %r |
| } |
| |
| ; CHECK: unsigned_divide |
| ; CHECK: udivx %i0, %i1, %i0 |
| define i64 @unsigned_divide(i64 %a, i64 %b) { |
| %r = udiv i64 %a, %b |
| ret i64 %r |
| } |
| |
| define void @access_fi() { |
| entry: |
| %b = alloca [32 x i8], align 1 |
| %arraydecay = getelementptr inbounds [32 x i8], [32 x i8]* %b, i64 0, i64 0 |
| call void @g(i8* %arraydecay) #2 |
| ret void |
| } |
| |
| declare void @g(i8*) |
| |
| ; CHECK: expand_setcc |
| ; CHECK: cmp %i0, 1 |
| ; CHECK: movl %xcc, 1, |
| define i32 @expand_setcc(i64 %a) { |
| %cond = icmp sle i64 %a, 0 |
| %cast2 = zext i1 %cond to i32 |
| %RV = sub i32 1, %cast2 |
| ret i32 %RV |
| } |
| |
| ; CHECK: spill_i64 |
| ; CHECK: stx |
| ; CHECK: ldx |
| define i64 @spill_i64(i64 %x) { |
| call void asm sideeffect "", "~{i0},~{i1},~{i2},~{i3},~{i4},~{i5},~{o0},~{o1},~{o2},~{o3},~{o4},~{o5},~{o7},~{l0},~{l1},~{l2},~{l3},~{l4},~{l5},~{l6},~{l7},~{g1},~{g2},~{g3},~{g4},~{g5},~{g6},~{g7}"() |
| ret i64 %x |
| } |
| |
| ; CHECK: bitcast_i64_f64 |
| ; CHECK: std |
| ; CHECK: ldx |
| define i64 @bitcast_i64_f64(double %x) { |
| %y = bitcast double %x to i64 |
| ret i64 %y |
| } |
| |
| ; CHECK: bitcast_f64_i64 |
| ; CHECK: stx |
| ; CHECK: ldd |
| define double @bitcast_f64_i64(i64 %x) { |
| %y = bitcast i64 %x to double |
| ret double %y |
| } |
| |
| ; CHECK-LABEL: store_zero: |
| ; CHECK: stx %g0, [%i0] |
| ; CHECK: stx %g0, [%i1+8] |
| |
| ; OPT-LABEL: store_zero: |
| ; OPT: stx %g0, [%o0] |
| ; OPT: stx %g0, [%o1+8] |
| define i64 @store_zero(i64* nocapture %a, i64* nocapture %b) { |
| entry: |
| store i64 0, i64* %a, align 8 |
| %0 = getelementptr inbounds i64, i64* %b, i32 1 |
| store i64 0, i64* %0, align 8 |
| ret i64 0 |
| } |
| |
| ; CHECK-LABEL: bit_ops |
| ; CHECK: popc |
| |
| ; OPT-LABEL: bit_ops |
| ; OPT: popc |
| |
| define i64 @bit_ops(i64 %arg) { |
| entry: |
| %0 = tail call i64 @llvm.ctpop.i64(i64 %arg) |
| %1 = tail call i64 @llvm.ctlz.i64(i64 %arg, i1 true) |
| %2 = tail call i64 @llvm.cttz.i64(i64 %arg, i1 true) |
| %3 = tail call i64 @llvm.bswap.i64(i64 %arg) |
| %4 = add i64 %0, %1 |
| %5 = add i64 %2, %3 |
| %6 = add i64 %4, %5 |
| ret i64 %6 |
| } |
| |
| declare i64 @llvm.ctpop.i64(i64) nounwind readnone |
| declare i64 @llvm.ctlz.i64(i64, i1) nounwind readnone |
| declare i64 @llvm.cttz.i64(i64, i1) nounwind readnone |
| declare i64 @llvm.bswap.i64(i64) nounwind readnone |