| //===-- VEISelLowering.h - VE DAG Lowering Interface ------------*- C++ -*-===// |
| // |
| // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| // See https://llvm.org/LICENSE.txt for license information. |
| // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| // |
| //===----------------------------------------------------------------------===// |
| // |
| // This file defines the interfaces that VE uses to lower LLVM code into a |
| // selection DAG. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #ifndef LLVM_LIB_TARGET_VE_VEISELLOWERING_H |
| #define LLVM_LIB_TARGET_VE_VEISELLOWERING_H |
| |
| #include "VE.h" |
| #include "llvm/CodeGen/TargetLowering.h" |
| |
| namespace llvm { |
| class VESubtarget; |
| |
| namespace VEISD { |
| enum NodeType : unsigned { |
| FIRST_NUMBER = ISD::BUILTIN_OP_END, |
| |
| CMPI, // Compare between two signed integer values. |
| CMPU, // Compare between two unsigned integer values. |
| CMPF, // Compare between two floating-point values. |
| CMPQ, // Compare between two quad floating-point values. |
| CMOV, // Select between two values using the result of comparison. |
| |
| CALL, // A call instruction. |
| EH_SJLJ_LONGJMP, // SjLj exception handling longjmp. |
| EH_SJLJ_SETJMP, // SjLj exception handling setjmp. |
| EH_SJLJ_SETUP_DISPATCH, // SjLj exception handling setup_dispatch. |
| GETFUNPLT, // Load function address through %plt insturction. |
| GETTLSADDR, // Load address for TLS access. |
| GETSTACKTOP, // Retrieve address of stack top (first address of |
| // locals and temporaries). |
| GLOBAL_BASE_REG, // Global base reg for PIC. |
| Hi, // Hi/Lo operations, typically on a global address. |
| Lo, // Hi/Lo operations, typically on a global address. |
| RET_FLAG, // Return with a flag operand. |
| TS1AM, // A TS1AM instruction used for 1/2 bytes swap. |
| VEC_UNPACK_LO, // unpack the lo v256 slice of a packed v512 vector. |
| VEC_UNPACK_HI, // unpack the hi v256 slice of a packed v512 vector. |
| // 0: v512 vector, 1: AVL |
| VEC_PACK, // pack a lo and a hi vector into one v512 vector |
| // 0: v256 lo vector, 1: v256 hi vector, 2: AVL |
| |
| VEC_BROADCAST, // A vector broadcast instruction. |
| // 0: scalar value, 1: VL |
| REPL_I32, |
| REPL_F32, // Replicate subregister to other half. |
| |
| // Annotation as a wrapper. LEGALAVL(VL) means that VL refers to 64bit of |
| // data, whereas the raw EVL coming in from VP nodes always refers to number |
| // of elements, regardless of their size. |
| LEGALAVL, |
| |
| // VVP_* nodes. |
| #define ADD_VVP_OP(VVP_NAME, ...) VVP_NAME, |
| #include "VVPNodes.def" |
| }; |
| } |
| |
| class VECustomDAG; |
| |
| class VETargetLowering : public TargetLowering { |
| const VESubtarget *Subtarget; |
| |
| void initRegisterClasses(); |
| void initSPUActions(); |
| void initVPUActions(); |
| |
| public: |
| VETargetLowering(const TargetMachine &TM, const VESubtarget &STI); |
| |
| const char *getTargetNodeName(unsigned Opcode) const override; |
| MVT getScalarShiftAmountTy(const DataLayout &, EVT) const override { |
| return MVT::i32; |
| } |
| |
| Register getRegisterByName(const char *RegName, LLT VT, |
| const MachineFunction &MF) const override; |
| |
| /// getSetCCResultType - Return the ISD::SETCC ValueType |
| EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Context, |
| EVT VT) const override; |
| |
| SDValue LowerFormalArguments(SDValue Chain, CallingConv::ID CallConv, |
| bool isVarArg, |
| const SmallVectorImpl<ISD::InputArg> &Ins, |
| const SDLoc &dl, SelectionDAG &DAG, |
| SmallVectorImpl<SDValue> &InVals) const override; |
| |
| SDValue LowerCall(TargetLowering::CallLoweringInfo &CLI, |
| SmallVectorImpl<SDValue> &InVals) const override; |
| |
| bool CanLowerReturn(CallingConv::ID CallConv, MachineFunction &MF, |
| bool isVarArg, |
| const SmallVectorImpl<ISD::OutputArg> &ArgsFlags, |
| LLVMContext &Context) const override; |
| SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool isVarArg, |
| const SmallVectorImpl<ISD::OutputArg> &Outs, |
| const SmallVectorImpl<SDValue> &OutVals, const SDLoc &dl, |
| SelectionDAG &DAG) const override; |
| |
| /// Helper functions for atomic operations. |
| bool shouldInsertFencesForAtomic(const Instruction *I) const override { |
| // VE uses release consistency, so need fence for each atomics. |
| return true; |
| } |
| Instruction *emitLeadingFence(IRBuilderBase &Builder, Instruction *Inst, |
| AtomicOrdering Ord) const override; |
| Instruction *emitTrailingFence(IRBuilderBase &Builder, Instruction *Inst, |
| AtomicOrdering Ord) const override; |
| TargetLoweringBase::AtomicExpansionKind |
| shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override; |
| ISD::NodeType getExtendForAtomicOps() const override { |
| return ISD::ANY_EXTEND; |
| } |
| |
| /// Custom Lower { |
| TargetLoweringBase::LegalizeAction |
| getCustomOperationAction(SDNode &) const override; |
| |
| SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override; |
| unsigned getJumpTableEncoding() const override; |
| const MCExpr *LowerCustomJumpTableEntry(const MachineJumpTableInfo *MJTI, |
| const MachineBasicBlock *MBB, |
| unsigned Uid, |
| MCContext &Ctx) const override; |
| SDValue getPICJumpTableRelocBase(SDValue Table, |
| SelectionDAG &DAG) const override; |
| // VE doesn't need getPICJumpTableRelocBaseExpr since it is used for only |
| // EK_LabelDifference32. |
| |
| SDValue lowerATOMIC_FENCE(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerATOMIC_SWAP(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerBlockAddress(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerConstantPool(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerEH_SJLJ_LONGJMP(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerEH_SJLJ_SETJMP(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerEH_SJLJ_SETUP_DISPATCH(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerGlobalAddress(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerGlobalTLSAddress(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerJumpTable(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerLOAD(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerSTORE(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerToTLSGeneralDynamicModel(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerVASTART(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerVAARG(SDValue Op, SelectionDAG &DAG) const; |
| |
| SDValue lowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const; |
| /// } Custom Lower |
| |
| /// Replace the results of node with an illegal result |
| /// type with new values built out of custom code. |
| /// |
| void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue> &Results, |
| SelectionDAG &DAG) const override; |
| |
| /// Custom Inserter { |
| MachineBasicBlock * |
| EmitInstrWithCustomInserter(MachineInstr &MI, |
| MachineBasicBlock *MBB) const override; |
| MachineBasicBlock *emitEHSjLjLongJmp(MachineInstr &MI, |
| MachineBasicBlock *MBB) const; |
| MachineBasicBlock *emitEHSjLjSetJmp(MachineInstr &MI, |
| MachineBasicBlock *MBB) const; |
| MachineBasicBlock *emitSjLjDispatchBlock(MachineInstr &MI, |
| MachineBasicBlock *BB) const; |
| |
| void setupEntryBlockForSjLj(MachineInstr &MI, MachineBasicBlock *MBB, |
| MachineBasicBlock *DispatchBB, int FI, |
| int Offset) const; |
| // Setup basic block address. |
| Register prepareMBB(MachineBasicBlock &MBB, MachineBasicBlock::iterator I, |
| MachineBasicBlock *TargetBB, const DebugLoc &DL) const; |
| // Prepare function/variable address. |
| Register prepareSymbol(MachineBasicBlock &MBB, MachineBasicBlock::iterator I, |
| StringRef Symbol, const DebugLoc &DL, bool IsLocal, |
| bool IsCall) const; |
| /// } Custom Inserter |
| |
| /// VVP Lowering { |
| SDValue lowerToVVP(SDValue Op, SelectionDAG &DAG) const; |
| SDValue lowerVVP_LOAD_STORE(SDValue Op, VECustomDAG &) const; |
| SDValue lowerVVP_GATHER_SCATTER(SDValue Op, VECustomDAG &) const; |
| |
| SDValue legalizeInternalVectorOp(SDValue Op, SelectionDAG &DAG) const; |
| SDValue legalizeInternalLoadStoreOp(SDValue Op, VECustomDAG &CDAG) const; |
| SDValue splitVectorOp(SDValue Op, VECustomDAG &CDAG) const; |
| SDValue splitPackedLoadStore(SDValue Op, VECustomDAG &CDAG) const; |
| SDValue legalizePackedAVL(SDValue Op, VECustomDAG &CDAG) const; |
| SDValue splitMaskArithmetic(SDValue Op, SelectionDAG &DAG) const; |
| /// } VVPLowering |
| |
| /// Custom DAGCombine { |
| SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override; |
| |
| SDValue combineSelect(SDNode *N, DAGCombinerInfo &DCI) const; |
| SDValue combineSelectCC(SDNode *N, DAGCombinerInfo &DCI) const; |
| SDValue combineTRUNCATE(SDNode *N, DAGCombinerInfo &DCI) const; |
| /// } Custom DAGCombine |
| |
| SDValue withTargetFlags(SDValue Op, unsigned TF, SelectionDAG &DAG) const; |
| SDValue makeHiLoPair(SDValue Op, unsigned HiTF, unsigned LoTF, |
| SelectionDAG &DAG) const; |
| SDValue makeAddress(SDValue Op, SelectionDAG &DAG) const; |
| |
| bool isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const override; |
| bool isFPImmLegal(const APFloat &Imm, EVT VT, |
| bool ForCodeSize) const override; |
| /// Returns true if the target allows unaligned memory accesses of the |
| /// specified type. |
| bool allowsMisalignedMemoryAccesses(EVT VT, unsigned AS, Align A, |
| MachineMemOperand::Flags Flags, |
| unsigned *Fast) const override; |
| |
| /// Inline Assembly { |
| |
| ConstraintType getConstraintType(StringRef Constraint) const override; |
| std::pair<unsigned, const TargetRegisterClass *> |
| getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI, |
| StringRef Constraint, MVT VT) const override; |
| |
| /// } Inline Assembly |
| |
| /// Target Optimization { |
| |
| // Return lower limit for number of blocks in a jump table. |
| unsigned getMinimumJumpTableEntries() const override; |
| |
| // SX-Aurora VE's s/udiv is 5-9 times slower than multiply. |
| bool isIntDivCheap(EVT, AttributeList) const override { return false; } |
| // VE doesn't have rem. |
| bool hasStandaloneRem(EVT) const override { return false; } |
| // VE LDZ instruction returns 64 if the input is zero. |
| bool isCheapToSpeculateCtlz(Type *) const override { return true; } |
| // VE LDZ instruction is fast. |
| bool isCtlzFast() const override { return true; } |
| // VE has NND instruction. |
| bool hasAndNot(SDValue Y) const override; |
| |
| /// } Target Optimization |
| }; |
| } // namespace llvm |
| |
| #endif // LLVM_LIB_TARGET_VE_VEISELLOWERING_H |