blob: 832f7118eabc347ac2451c72aab68f98134748c1 [file] [log] [blame]
//===- subzero/src/IceTargetLoweringMIPS32.h - MIPS32 lowering ---*- C++-*-===//
//
// The Subzero Code Generator
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
///
/// \file
/// \brief Declares the TargetLoweringMIPS32 class, which implements the
/// TargetLowering interface for the MIPS 32-bit architecture.
///
//===----------------------------------------------------------------------===//
#ifndef SUBZERO_SRC_ICETARGETLOWERINGMIPS32_H
#define SUBZERO_SRC_ICETARGETLOWERINGMIPS32_H
#include "IceAssemblerMIPS32.h"
#include "IceDefs.h"
#include "IceInstMIPS32.h"
#include "IceRegistersMIPS32.h"
#include "IceTargetLowering.h"
namespace Ice {
namespace MIPS32 {
class TargetMIPS32 : public TargetLowering {
TargetMIPS32() = delete;
TargetMIPS32(const TargetMIPS32 &) = delete;
TargetMIPS32 &operator=(const TargetMIPS32 &) = delete;
public:
~TargetMIPS32() override = default;
static void staticInit(GlobalContext *Ctx);
static bool shouldBePooled(const Constant *C) {
if (auto *ConstDouble = llvm::dyn_cast<ConstantDouble>(C)) {
return !Utils::isPositiveZero(ConstDouble->getValue());
}
if (auto *ConstFloat = llvm::dyn_cast<ConstantFloat>(C)) {
return !Utils::isPositiveZero(ConstFloat->getValue());
}
return false;
}
static ::Ice::Type getPointerType() { return ::Ice::IceType_i32; }
static std::unique_ptr<::Ice::TargetLowering> create(Cfg *Func) {
return makeUnique<TargetMIPS32>(Func);
}
std::unique_ptr<::Ice::Assembler> createAssembler() const override {
return makeUnique<MIPS32::AssemblerMIPS32>();
}
void initNodeForLowering(CfgNode *Node) override {
Computations.forgetProducers();
Computations.recordProducers(Node);
Computations.dump(Func);
}
void translateOm1() override;
void translateO2() override;
bool doBranchOpt(Inst *Instr, const CfgNode *NextNode) override;
void setImplicitRet(Variable *Ret) { ImplicitRet = Ret; }
Variable *getImplicitRet() const { return ImplicitRet; }
SizeT getNumRegisters() const override { return RegMIPS32::Reg_NUM; }
Variable *getPhysicalRegister(RegNumT RegNum,
Type Ty = IceType_void) override;
const char *getRegName(RegNumT RegNum, Type Ty) const override;
SmallBitVector getRegisterSet(RegSetMask Include,
RegSetMask Exclude) const override;
const SmallBitVector &
getRegistersForVariable(const Variable *Var) const override {
RegClass RC = Var->getRegClass();
assert(RC < RC_Target);
return TypeToRegisterSet[RC];
}
const SmallBitVector &
getAllRegistersForVariable(const Variable *Var) const override {
RegClass RC = Var->getRegClass();
assert(RC < RC_Target);
return TypeToRegisterSetUnfiltered[RC];
}
const SmallBitVector &getAliasesForRegister(RegNumT Reg) const override {
return RegisterAliases[Reg];
}
bool hasFramePointer() const override { return UsesFramePointer; }
void setHasFramePointer() override { UsesFramePointer = true; }
RegNumT getStackReg() const override { return RegMIPS32::Reg_SP; }
RegNumT getFrameReg() const override { return RegMIPS32::Reg_FP; }
RegNumT getFrameOrStackReg() const override {
return UsesFramePointer ? getFrameReg() : getStackReg();
}
RegNumT getReservedTmpReg() const { return RegMIPS32::Reg_AT; }
size_t typeWidthInBytesOnStack(Type Ty) const override {
// Round up to the next multiple of 4 bytes. In particular, i1, i8, and i16
// are rounded up to 4 bytes.
return (typeWidthInBytes(Ty) + 3) & ~3;
}
uint32_t getStackAlignment() const override;
void reserveFixedAllocaArea(size_t Size, size_t Align) override {
FixedAllocaSizeBytes = Size;
assert(llvm::isPowerOf2_32(Align));
FixedAllocaAlignBytes = Align;
PrologEmitsFixedAllocas = true;
}
int32_t getFrameFixedAllocaOffset() const override {
int32_t FixedAllocaOffset =
Utils::applyAlignment(CurrentAllocaOffset, FixedAllocaAlignBytes);
return FixedAllocaOffset - MaxOutArgsSizeBytes;
}
uint32_t maxOutArgsSizeBytes() const override { return MaxOutArgsSizeBytes; }
uint32_t getFramePointerOffset(uint32_t CurrentOffset,
uint32_t Size) const override {
(void)Size;
return CurrentOffset + MaxOutArgsSizeBytes;
}
bool shouldSplitToVariable64On32(Type Ty) const override {
return Ty == IceType_i64;
}
bool shouldSplitToVariableVecOn32(Type Ty) const override {
return isVectorType(Ty);
}
// TODO(ascull): what is the best size of MIPS?
SizeT getMinJumpTableSize() const override { return 3; }
void emitJumpTable(const Cfg *Func,
const InstJumpTable *JumpTable) const override;
void emitVariable(const Variable *Var) const override;
void emit(const ConstantInteger32 *C) const final {
if (!BuildDefs::dump())
return;
Ostream &Str = Ctx->getStrEmit();
Str << C->getValue();
}
void emit(const ConstantInteger64 *C) const final {
(void)C;
llvm::report_fatal_error("Not yet implemented");
}
void emit(const ConstantFloat *C) const final {
(void)C;
llvm::report_fatal_error("Not yet implemented");
}
void emit(const ConstantDouble *C) const final {
(void)C;
llvm::report_fatal_error("Not yet implemented");
}
void emit(const ConstantUndef *C) const final {
(void)C;
llvm::report_fatal_error("Not yet implemented");
}
void emit(const ConstantRelocatable *C) const final {
(void)C;
llvm::report_fatal_error("Not yet implemented");
}
// The following are helpers that insert lowered MIPS32 instructions with
// minimal syntactic overhead, so that the lowering code can look as close to
// assembly as practical.
void _add(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Add>(Dest, Src0, Src1);
}
void _addu(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Addu>(Dest, Src0, Src1);
}
void _and(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32And>(Dest, Src0, Src1);
}
void _andi(Variable *Dest, Variable *Src, uint32_t Imm) {
Context.insert<InstMIPS32Andi>(Dest, Src, Imm);
}
void _br(CfgNode *Target) { Context.insert<InstMIPS32Br>(Target); }
void _br(CfgNode *Target, const InstMIPS32Label *Label) {
Context.insert<InstMIPS32Br>(Target, Label);
}
void _br(CfgNode *TargetTrue, CfgNode *TargetFalse, Operand *Src0,
Operand *Src1, CondMIPS32::Cond Condition) {
Context.insert<InstMIPS32Br>(TargetTrue, TargetFalse, Src0, Src1,
Condition);
}
void _br(CfgNode *TargetTrue, CfgNode *TargetFalse, Operand *Src0,
CondMIPS32::Cond Condition) {
Context.insert<InstMIPS32Br>(TargetTrue, TargetFalse, Src0, Condition);
}
void _br(CfgNode *TargetTrue, CfgNode *TargetFalse, Operand *Src0,
Operand *Src1, const InstMIPS32Label *Label,
CondMIPS32::Cond Condition) {
Context.insert<InstMIPS32Br>(TargetTrue, TargetFalse, Src0, Src1, Label,
Condition);
}
void _ret(Variable *RA, Variable *Src0 = nullptr) {
Context.insert<InstMIPS32Ret>(RA, Src0);
}
void _abs_d(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Abs_d>(Dest, Src);
}
void _abs_s(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Abs_s>(Dest, Src);
}
void _addi(Variable *Dest, Variable *Src, uint32_t Imm) {
Context.insert<InstMIPS32Addi>(Dest, Src, Imm);
}
void _add_d(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Add_d>(Dest, Src0, Src1);
}
void _add_s(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Add_s>(Dest, Src0, Src1);
}
void _addiu(Variable *Dest, Variable *Src, uint32_t Imm) {
Context.insert<InstMIPS32Addiu>(Dest, Src, Imm);
}
void _addiu(Variable *Dest, Variable *Src0, Operand *Src1, RelocOp Reloc) {
Context.insert<InstMIPS32Addiu>(Dest, Src0, Src1, Reloc);
}
void _c_eq_d(Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32C_eq_d>(Src0, Src1);
}
void _c_eq_s(Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32C_eq_s>(Src0, Src1);
}
void _c_ole_d(Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32C_ole_d>(Src0, Src1);
}
void _c_ole_s(Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32C_ole_s>(Src0, Src1);
}
void _c_olt_d(Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32C_olt_d>(Src0, Src1);
}
void _c_olt_s(Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32C_olt_s>(Src0, Src1);
}
void _c_ueq_d(Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32C_ueq_d>(Src0, Src1);
}
void _c_ueq_s(Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32C_ueq_s>(Src0, Src1);
}
void _c_ule_d(Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32C_ule_d>(Src0, Src1);
}
void _c_ule_s(Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32C_ule_s>(Src0, Src1);
}
void _c_ult_d(Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32C_ult_d>(Src0, Src1);
}
void _c_ult_s(Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32C_ult_s>(Src0, Src1);
}
void _c_un_d(Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32C_un_d>(Src0, Src1);
}
void _c_un_s(Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32C_un_s>(Src0, Src1);
}
void _clz(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Clz>(Dest, Src);
}
void _cvt_d_l(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Cvt_d_l>(Dest, Src);
}
void _cvt_d_s(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Cvt_d_s>(Dest, Src);
}
void _cvt_d_w(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Cvt_d_w>(Dest, Src);
}
void _cvt_s_d(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Cvt_s_d>(Dest, Src);
}
void _cvt_s_l(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Cvt_s_l>(Dest, Src);
}
void _cvt_s_w(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Cvt_s_w>(Dest, Src);
}
void _div(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Div>(Dest, Src0, Src1);
}
void _div_d(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Div_d>(Dest, Src0, Src1);
}
void _div_s(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Div_s>(Dest, Src0, Src1);
}
void _divu(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Divu>(Dest, Src0, Src1);
}
void _ldc1(Variable *Value, OperandMIPS32Mem *Mem, RelocOp Reloc = RO_No) {
Context.insert<InstMIPS32Ldc1>(Value, Mem, Reloc);
}
void _ll(Variable *Value, OperandMIPS32Mem *Mem) {
Context.insert<InstMIPS32Ll>(Value, Mem);
}
void _lw(Variable *Value, OperandMIPS32Mem *Mem) {
Context.insert<InstMIPS32Lw>(Value, Mem);
}
void _lwc1(Variable *Value, OperandMIPS32Mem *Mem, RelocOp Reloc = RO_No) {
Context.insert<InstMIPS32Lwc1>(Value, Mem, Reloc);
}
void _lui(Variable *Dest, Operand *Src, RelocOp Reloc = RO_No) {
Context.insert<InstMIPS32Lui>(Dest, Src, Reloc);
}
void _mfc1(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Mfc1>(Dest, Src);
}
void _mfhi(Variable *Dest, Operand *Src) {
Context.insert<InstMIPS32Mfhi>(Dest, Src);
}
void _mflo(Variable *Dest, Operand *Src) {
Context.insert<InstMIPS32Mflo>(Dest, Src);
}
void _mov(Variable *Dest, Operand *Src0, Operand *Src1 = nullptr) {
assert(Dest != nullptr);
// Variable* Src0_ = llvm::dyn_cast<Variable>(Src0);
if (llvm::isa<ConstantRelocatable>(Src0)) {
Context.insert<InstMIPS32La>(Dest, Src0);
} else {
auto *Instr = Context.insert<InstMIPS32Mov>(Dest, Src0, Src1);
if (Instr->getDestHi() != nullptr) {
// If DestHi is available, then Dest must be a Variable64On32. We add a
// fake-def for Instr.DestHi here.
assert(llvm::isa<Variable64On32>(Dest));
Context.insert<InstFakeDef>(Instr->getDestHi());
}
}
}
void _mov_redefined(Variable *Dest, Operand *Src0, Operand *Src1 = nullptr) {
if (llvm::isa<ConstantRelocatable>(Src0)) {
Context.insert<InstMIPS32La>(Dest, Src0);
} else {
auto *Instr = Context.insert<InstMIPS32Mov>(Dest, Src0, Src1);
Instr->setDestRedefined();
if (Instr->getDestHi() != nullptr) {
// If Instr is multi-dest, then Dest must be a Variable64On32. We add a
// fake-def for Instr.DestHi here.
assert(llvm::isa<Variable64On32>(Dest));
Context.insert<InstFakeDef>(Instr->getDestHi());
}
}
}
void _mov_fp64_to_i64(Variable *Dest, Operand *Src, Int64Part Int64HiLo) {
assert(Dest != nullptr);
Context.insert<InstMIPS32MovFP64ToI64>(Dest, Src, Int64HiLo);
}
void _mov_d(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Mov_d>(Dest, Src);
}
void _mov_s(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Mov_s>(Dest, Src);
}
void _movf(Variable *Dest, Variable *Src0, Operand *FCC) {
Context.insert<InstMIPS32Movf>(Dest, Src0, FCC)->setDestRedefined();
}
void _movn(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Movn>(Dest, Src0, Src1)->setDestRedefined();
}
void _movn_d(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Movn_d>(Dest, Src0, Src1)->setDestRedefined();
}
void _movn_s(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Movn_s>(Dest, Src0, Src1)->setDestRedefined();
}
void _movt(Variable *Dest, Variable *Src0, Operand *FCC) {
Context.insert<InstMIPS32Movt>(Dest, Src0, FCC)->setDestRedefined();
}
void _movz(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Movz>(Dest, Src0, Src1)->setDestRedefined();
}
void _movz_d(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Movz_d>(Dest, Src0, Src1)->setDestRedefined();
}
void _movz_s(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Movz_s>(Dest, Src0, Src1)->setDestRedefined();
}
void _mtc1(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Mtc1>(Dest, Src);
}
void _mthi(Variable *Dest, Operand *Src) {
Context.insert<InstMIPS32Mthi>(Dest, Src);
}
void _mtlo(Variable *Dest, Operand *Src) {
Context.insert<InstMIPS32Mtlo>(Dest, Src);
}
void _mul(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Mul>(Dest, Src0, Src1);
}
void _mul_d(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Mul_d>(Dest, Src0, Src1);
}
void _mul_s(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Mul_s>(Dest, Src0, Src1);
}
void _mult(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Mult>(Dest, Src0, Src1);
}
void _multu(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Multu>(Dest, Src0, Src1);
}
void _nop() { Context.insert<InstMIPS32Sll>(getZero(), getZero(), 0); }
void _nor(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Nor>(Dest, Src0, Src1);
}
void _not(Variable *Dest, Variable *Src0) {
Context.insert<InstMIPS32Nor>(Dest, Src0, getZero());
}
void _or(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Or>(Dest, Src0, Src1);
}
void _ori(Variable *Dest, Variable *Src, uint32_t Imm) {
Context.insert<InstMIPS32Ori>(Dest, Src, Imm);
}
InstMIPS32Sc *_sc(Variable *Value, OperandMIPS32Mem *Mem) {
return Context.insert<InstMIPS32Sc>(Value, Mem);
}
void _sdc1(Variable *Value, OperandMIPS32Mem *Mem) {
Context.insert<InstMIPS32Sdc1>(Value, Mem);
}
void _sll(Variable *Dest, Variable *Src, uint32_t Imm) {
Context.insert<InstMIPS32Sll>(Dest, Src, Imm);
}
void _sllv(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Sllv>(Dest, Src0, Src1);
}
void _slt(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Slt>(Dest, Src0, Src1);
}
void _slti(Variable *Dest, Variable *Src, uint32_t Imm) {
Context.insert<InstMIPS32Slti>(Dest, Src, Imm);
}
void _sltiu(Variable *Dest, Variable *Src, uint32_t Imm) {
Context.insert<InstMIPS32Sltiu>(Dest, Src, Imm);
}
void _sltu(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Sltu>(Dest, Src0, Src1);
}
void _sqrt_d(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Sqrt_d>(Dest, Src);
}
void _sqrt_s(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Sqrt_s>(Dest, Src);
}
void _sra(Variable *Dest, Variable *Src, uint32_t Imm) {
Context.insert<InstMIPS32Sra>(Dest, Src, Imm);
}
void _srav(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Srav>(Dest, Src0, Src1);
}
void _srl(Variable *Dest, Variable *Src, uint32_t Imm) {
Context.insert<InstMIPS32Srl>(Dest, Src, Imm);
}
void _srlv(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Srlv>(Dest, Src0, Src1);
}
void _sub(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Sub>(Dest, Src0, Src1);
}
void _sub_d(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Sub_d>(Dest, Src0, Src1);
}
void _sub_s(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Sub_s>(Dest, Src0, Src1);
}
void _subu(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Subu>(Dest, Src0, Src1);
}
void _sw(Variable *Value, OperandMIPS32Mem *Mem) {
Context.insert<InstMIPS32Sw>(Value, Mem);
}
void _swc1(Variable *Value, OperandMIPS32Mem *Mem) {
Context.insert<InstMIPS32Swc1>(Value, Mem);
}
void _sync() { Context.insert<InstMIPS32Sync>(); }
void _teq(Variable *Src0, Variable *Src1, uint32_t TrapCode) {
Context.insert<InstMIPS32Teq>(Src0, Src1, TrapCode);
}
void _trunc_l_d(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Trunc_l_d>(Dest, Src);
}
void _trunc_l_s(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Trunc_l_s>(Dest, Src);
}
void _trunc_w_d(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Trunc_w_d>(Dest, Src);
}
void _trunc_w_s(Variable *Dest, Variable *Src) {
Context.insert<InstMIPS32Trunc_w_s>(Dest, Src);
}
void _xor(Variable *Dest, Variable *Src0, Variable *Src1) {
Context.insert<InstMIPS32Xor>(Dest, Src0, Src1);
}
void _xori(Variable *Dest, Variable *Src, uint32_t Imm) {
Context.insert<InstMIPS32Xori>(Dest, Src, Imm);
}
void lowerArguments() override;
/// Make a pass through the SortedSpilledVariables and actually assign stack
/// slots. SpillAreaPaddingBytes takes into account stack alignment padding.
/// The SpillArea starts after that amount of padding. This matches the scheme
/// in getVarStackSlotParams, where there may be a separate multi-block global
/// var spill area and a local var spill area.
void assignVarStackSlots(VarList &SortedSpilledVariables,
size_t SpillAreaPaddingBytes,
size_t SpillAreaSizeBytes,
size_t GlobalsAndSubsequentPaddingSize);
/// Operand legalization helpers. To deal with address mode constraints,
/// the helpers will create a new Operand and emit instructions that
/// guarantee that the Operand kind is one of those indicated by the
/// LegalMask (a bitmask of allowed kinds). If the input Operand is known
/// to already meet the constraints, it may be simply returned as the result,
/// without creating any new instructions or operands.
enum OperandLegalization {
Legal_None = 0,
Legal_Reg = 1 << 0, // physical register, not stack location
Legal_Imm = 1 << 1,
Legal_Mem = 1 << 2,
Legal_Rematerializable = 1 << 3,
Legal_Default = ~Legal_None
};
typedef uint32_t LegalMask;
Operand *legalize(Operand *From, LegalMask Allowed = Legal_Default,
RegNumT RegNum = RegNumT());
Variable *legalizeToVar(Operand *From, RegNumT RegNum = RegNumT());
Variable *legalizeToReg(Operand *From, RegNumT RegNum = RegNumT());
Variable *makeReg(Type Ty, RegNumT RegNum = RegNumT());
Variable *getZero() {
auto *Zero = makeReg(IceType_i32, RegMIPS32::Reg_ZERO);
Context.insert<InstFakeDef>(Zero);
return Zero;
}
Variable *I32Reg(RegNumT RegNum = RegNumT()) {
return makeReg(IceType_i32, RegNum);
}
Variable *F32Reg(RegNumT RegNum = RegNumT()) {
return makeReg(IceType_f32, RegNum);
}
Variable *F64Reg(RegNumT RegNum = RegNumT()) {
return makeReg(IceType_f64, RegNum);
}
static Type stackSlotType();
Variable *copyToReg(Operand *Src, RegNumT RegNum = RegNumT());
void unsetIfNonLeafFunc();
// Iterates over the CFG and determines the maximum outgoing stack arguments
// bytes. This information is later used during addProlog() to pre-allocate
// the outargs area
void findMaxStackOutArgsSize();
void postLowerLegalization();
void addProlog(CfgNode *Node) override;
void addEpilog(CfgNode *Node) override;
// Ensure that a 64-bit Variable has been split into 2 32-bit
// Variables, creating them if necessary. This is needed for all
// I64 operations.
void split64(Variable *Var);
Operand *loOperand(Operand *Operand);
Operand *hiOperand(Operand *Operand);
Operand *getOperandAtIndex(Operand *Operand, Type BaseType, uint32_t Index);
void finishArgumentLowering(Variable *Arg, bool PartialOnStack,
Variable *FramePtr, size_t BasicFrameOffset,
size_t *InArgsSizeBytes);
Operand *legalizeUndef(Operand *From, RegNumT RegNum = RegNumT());
/// Helper class that understands the Calling Convention and register
/// assignments as per MIPS O32 abi.
class CallingConv {
CallingConv(const CallingConv &) = delete;
CallingConv &operator=(const CallingConv &) = delete;
public:
CallingConv();
~CallingConv() = default;
/// argInReg returns true if there is a Register available for the requested
/// type, and false otherwise. If it returns true, Reg is set to the
/// appropriate register number. Note that, when Ty == IceType_i64, Reg will
/// be an I64 register pair.
bool argInReg(Type Ty, uint32_t ArgNo, RegNumT *Reg);
void discardReg(RegNumT Reg) { GPRegsUsed |= RegisterAliases[Reg]; }
private:
// argInGPR is used to find if any GPR register is available for argument of
// type Ty
bool argInGPR(Type Ty, RegNumT *Reg);
/// argInVFP is to floating-point/vector types what argInGPR is for integer
/// types.
bool argInVFP(Type Ty, RegNumT *Reg);
inline void discardNextGPRAndItsAliases(CfgVector<RegNumT> *Regs);
inline void alignGPR(CfgVector<RegNumT> *Regs);
void discardUnavailableGPRsAndTheirAliases(CfgVector<RegNumT> *Regs);
SmallBitVector GPRegsUsed;
CfgVector<RegNumT> GPRArgs;
CfgVector<RegNumT> I64Args;
void discardUnavailableVFPRegsAndTheirAliases(CfgVector<RegNumT> *Regs);
SmallBitVector VFPRegsUsed;
CfgVector<RegNumT> FP32Args;
CfgVector<RegNumT> FP64Args;
// UseFPRegs is a flag indicating if FP registers can be used
bool UseFPRegs = false;
};
protected:
explicit TargetMIPS32(Cfg *Func);
void postLower() override;
void lowerAlloca(const InstAlloca *Instr) override;
void lowerArithmetic(const InstArithmetic *Instr) override;
void lowerInt64Arithmetic(const InstArithmetic *Instr, Variable *Dest,
Operand *Src0, Operand *Src1);
void lowerAssign(const InstAssign *Instr) override;
void lowerBr(const InstBr *Instr) override;
void lowerBreakpoint(const InstBreakpoint *Instr) override;
void lowerCall(const InstCall *Instr) override;
void lowerCast(const InstCast *Instr) override;
void lowerExtractElement(const InstExtractElement *Instr) override;
void lowerFcmp(const InstFcmp *Instr) override;
void lowerIcmp(const InstIcmp *Instr) override;
void lower64Icmp(const InstIcmp *Instr);
void createArithInst(Intrinsics::AtomicRMWOperation Operation, Variable *Dest,
Variable *Src0, Variable *Src1);
void lowerIntrinsic(const InstIntrinsic *Instr) override;
void lowerInsertElement(const InstInsertElement *Instr) override;
void lowerLoad(const InstLoad *Instr) override;
void lowerPhi(const InstPhi *Instr) override;
void lowerRet(const InstRet *Instr) override;
void lowerSelect(const InstSelect *Instr) override;
void lowerShuffleVector(const InstShuffleVector *Instr) override;
void lowerStore(const InstStore *Instr) override;
void lowerSwitch(const InstSwitch *Instr) override;
void lowerUnreachable(const InstUnreachable *Instr) override;
void lowerOther(const Inst *Instr) override;
void prelowerPhis() override;
uint32_t getCallStackArgumentsSizeBytes(const InstCall *Instr) override;
void genTargetHelperCallFor(Inst *Instr) override;
void doAddressOptLoad() override;
void doAddressOptStore() override;
OperandMIPS32Mem *formMemoryOperand(Operand *Ptr, Type Ty);
class PostLoweringLegalizer {
PostLoweringLegalizer() = delete;
PostLoweringLegalizer(const PostLoweringLegalizer &) = delete;
PostLoweringLegalizer &operator=(const PostLoweringLegalizer &) = delete;
public:
explicit PostLoweringLegalizer(TargetMIPS32 *Target)
: Target(Target), StackOrFrameReg(Target->getPhysicalRegister(
Target->getFrameOrStackReg())) {}
/// Legalizes Mem. if Mem.Base is a rematerializable variable,
/// Mem.Offset is fixed up.
OperandMIPS32Mem *legalizeMemOperand(OperandMIPS32Mem *Mem);
/// Legalizes Immediate if larger value overflows range of 16 bits
Variable *legalizeImmediate(int32_t Imm);
/// Legalizes Mov if its Source (or Destination) is a spilled Variable, or
/// if its Source is a Rematerializable variable (this form is used in lieu
/// of lea, which is not available in MIPS.)
///
/// Moves to memory become store instructions, and moves from memory, loads.
void legalizeMov(InstMIPS32Mov *Mov);
void legalizeMovFp(InstMIPS32MovFP64ToI64 *MovInstr);
private:
/// Creates a new Base register centered around [Base, +/- Offset].
Variable *newBaseRegister(Variable *Base, int32_t Offset,
RegNumT ScratchRegNum);
TargetMIPS32 *const Target;
Variable *const StackOrFrameReg;
};
bool UsesFramePointer = false;
bool NeedsStackAlignment = false;
bool MaybeLeafFunc = true;
bool PrologEmitsFixedAllocas = false;
bool VariableAllocaUsed = false;
uint32_t MaxOutArgsSizeBytes = 0;
uint32_t TotalStackSizeBytes = 0;
uint32_t CurrentAllocaOffset = 0;
uint32_t VariableAllocaAlignBytes = 0;
static SmallBitVector TypeToRegisterSet[RCMIPS32_NUM];
static SmallBitVector TypeToRegisterSetUnfiltered[RCMIPS32_NUM];
static SmallBitVector RegisterAliases[RegMIPS32::Reg_NUM];
SmallBitVector RegsUsed;
VarList PhysicalRegisters[IceType_NUM];
VarList PreservedGPRs;
static constexpr uint32_t CHAR_BITS = 8;
static constexpr uint32_t INT32_BITS = 32;
size_t SpillAreaSizeBytes = 0;
size_t FixedAllocaSizeBytes = 0;
size_t FixedAllocaAlignBytes = 0;
size_t PreservedRegsSizeBytes = 0;
Variable *ImplicitRet = nullptr; /// Implicit return
private:
ENABLE_MAKE_UNIQUE;
OperandMIPS32Mem *formAddressingMode(Type Ty, Cfg *Func, const Inst *LdSt,
Operand *Base);
class ComputationTracker {
public:
ComputationTracker() = default;
~ComputationTracker() = default;
void forgetProducers() { KnownComputations.clear(); }
void recordProducers(CfgNode *Node);
const Inst *getProducerOf(const Operand *Opnd) const {
auto *Var = llvm::dyn_cast<Variable>(Opnd);
if (Var == nullptr) {
return nullptr;
}
auto Iter = KnownComputations.find(Var->getIndex());
if (Iter == KnownComputations.end()) {
return nullptr;
}
return Iter->second.Instr;
}
void dump(const Cfg *Func) const {
if (!BuildDefs::dump() || !Func->isVerbose(IceV_Folding))
return;
OstreamLocker L(Func->getContext());
Ostream &Str = Func->getContext()->getStrDump();
Str << "foldable producer:\n";
for (const auto &Computation : KnownComputations) {
Str << " ";
Computation.second.Instr->dump(Func);
Str << "\n";
}
Str << "\n";
}
private:
class ComputationEntry {
public:
ComputationEntry(Inst *I, Type Ty) : Instr(I), ComputationType(Ty) {}
Inst *const Instr;
// Boolean folding is disabled for variables whose live range is multi
// block. We conservatively initialize IsLiveOut to true, and set it to
// false once we find the end of the live range for the variable defined
// by this instruction. If liveness analysis is not performed (e.g., in
// Om1 mode) IsLiveOut will never be set to false, and folding will be
// disabled.
bool IsLiveOut = true;
int32_t NumUses = 0;
Type ComputationType;
};
// ComputationMap maps a Variable number to a payload identifying which
// instruction defined it.
using ComputationMap = CfgUnorderedMap<SizeT, ComputationEntry>;
ComputationMap KnownComputations;
};
ComputationTracker Computations;
};
class TargetDataMIPS32 final : public TargetDataLowering {
TargetDataMIPS32() = delete;
TargetDataMIPS32(const TargetDataMIPS32 &) = delete;
TargetDataMIPS32 &operator=(const TargetDataMIPS32 &) = delete;
public:
static std::unique_ptr<TargetDataLowering> create(GlobalContext *Ctx) {
return std::unique_ptr<TargetDataLowering>(new TargetDataMIPS32(Ctx));
}
void lowerGlobals(const VariableDeclarationList &Vars,
const std::string &SectionSuffix) override;
void lowerConstants() override;
void lowerJumpTables() override;
void emitTargetRODataSections() override;
protected:
explicit TargetDataMIPS32(GlobalContext *Ctx);
private:
~TargetDataMIPS32() override = default;
};
class TargetHeaderMIPS32 final : public TargetHeaderLowering {
TargetHeaderMIPS32() = delete;
TargetHeaderMIPS32(const TargetHeaderMIPS32 &) = delete;
TargetHeaderMIPS32 &operator=(const TargetHeaderMIPS32 &) = delete;
public:
static std::unique_ptr<TargetHeaderLowering> create(GlobalContext *Ctx) {
return std::unique_ptr<TargetHeaderLowering>(new TargetHeaderMIPS32(Ctx));
}
void lower() override;
protected:
explicit TargetHeaderMIPS32(GlobalContext *Ctx);
private:
~TargetHeaderMIPS32() = default;
};
// This structure (with some minor modifications) is copied from
// llvm/lib/Target/Mips/MCTargetDesc/MipsABIFlagsSection.h file.
struct MipsABIFlagsSection {
// Version of the MIPS.abiflags section
enum AFL_VERSION {
AFL_VERSION_V0 = 0 // Version 0
};
// The level of the ISA: 1-5, 32, 64.
enum AFL_ISA_LEVEL {
AFL_ISA_LEVEL_NONE = 0,
AFL_ISA_LEVEL_MIPS32 = 32, // MIPS32
};
// The revision of ISA: 0 for MIPS V and below, 1-n otherwise.
enum AFL_ISA_REV {
AFL_ISA_REV_NONE = 0,
AFL_ISA_REV_R1 = 1, // R1
};
// Values for the xxx_size bytes of an ABI flags structure.
enum AFL_REG {
AFL_REG_NONE = 0x00, // No registers.
AFL_REG_32 = 0x01, // 32-bit registers.
AFL_REG_64 = 0x02, // 64-bit registers.
AFL_REG_128 = 0x03 // 128-bit registers.
};
// Values for the fp_abi word of an ABI flags structure.
enum AFL_FP_ABI {
AFL_FP_ANY = 0,
AFL_FP_DOUBLE = 1,
AFL_FP_XX = 5,
AFL_FP_64 = 6,
AFL_FP_64A = 7
};
// Values for the isa_ext word of an ABI flags structure.
enum AFL_EXT {
AFL_EXT_NONE = 0,
AFL_EXT_XLR = 1, // RMI Xlr instruction.
AFL_EXT_OCTEON2 = 2, // Cavium Networks Octeon2.
AFL_EXT_OCTEONP = 3, // Cavium Networks OcteonP.
AFL_EXT_LOONGSON_3A = 4, // Loongson 3A.
AFL_EXT_OCTEON = 5, // Cavium Networks Octeon.
AFL_EXT_5900 = 6, // MIPS R5900 instruction.
AFL_EXT_4650 = 7, // MIPS R4650 instruction.
AFL_EXT_4010 = 8, // LSI R4010 instruction.
AFL_EXT_4100 = 9, // NEC VR4100 instruction.
AFL_EXT_3900 = 10, // Toshiba R3900 instruction.
AFL_EXT_10000 = 11, // MIPS R10000 instruction.
AFL_EXT_SB1 = 12, // Broadcom SB-1 instruction.
AFL_EXT_4111 = 13, // NEC VR4111/VR4181 instruction.
AFL_EXT_4120 = 14, // NEC VR4120 instruction.
AFL_EXT_5400 = 15, // NEC VR5400 instruction.
AFL_EXT_5500 = 16, // NEC VR5500 instruction.
AFL_EXT_LOONGSON_2E = 17, // ST Microelectronics Loongson 2E.
AFL_EXT_LOONGSON_2F = 18 // ST Microelectronics Loongson 2F.
};
// Masks for the ases word of an ABI flags structure.
enum AFL_ASE {
AFL_ASE_NONE = 0x00000000,
AFL_ASE_DSP = 0x00000001, // DSP ASE.
AFL_ASE_DSPR2 = 0x00000002, // DSP R2 ASE.
AFL_ASE_EVA = 0x00000004, // Enhanced VA Scheme.
AFL_ASE_MCU = 0x00000008, // MCU (MicroController) ASE.
AFL_ASE_MDMX = 0x00000010, // MDMX ASE.
AFL_ASE_MIPS3D = 0x00000020, // MIPS-3D ASE.
AFL_ASE_MT = 0x00000040, // MT ASE.
AFL_ASE_SMARTMIPS = 0x00000080, // SmartMIPS ASE.
AFL_ASE_VIRT = 0x00000100, // VZ ASE.
AFL_ASE_MSA = 0x00000200, // MSA ASE.
AFL_ASE_MIPS16 = 0x00000400, // MIPS16 ASE.
AFL_ASE_MICROMIPS = 0x00000800, // MICROMIPS ASE.
AFL_ASE_XPA = 0x00001000 // XPA ASE.
};
enum AFL_FLAGS1 { AFL_FLAGS1_NONE = 0, AFL_FLAGS1_ODDSPREG = 1 };
enum AFL_FLAGS2 { AFL_FLAGS2_NONE = 0 };
uint16_t Version = AFL_VERSION_V0;
uint8_t ISALevel = AFL_ISA_LEVEL_MIPS32;
uint8_t ISARevision = AFL_ISA_REV_R1;
uint8_t GPRSize = AFL_REG_32;
uint8_t CPR1Size = AFL_REG_32;
uint8_t CPR2Size = AFL_REG_NONE;
uint8_t FPABI = AFL_FP_DOUBLE;
uint32_t Extension = AFL_EXT_NONE;
uint32_t ASE = AFL_ASE_NONE;
uint32_t Flags1 = AFL_FLAGS1_ODDSPREG;
uint32_t Flags2 = AFL_FLAGS2_NONE;
MipsABIFlagsSection() = default;
};
} // end of namespace MIPS32
} // end of namespace Ice
#endif // SUBZERO_SRC_ICETARGETLOWERINGMIPS32_H