| //===-- VEISelLowering.h - VE DAG Lowering Interface ------------*- C++ -*-===// | 
 | // | 
 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | 
 | // See https://llvm.org/LICENSE.txt for license information. | 
 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | 
 | // | 
 | //===----------------------------------------------------------------------===// | 
 | // | 
 | // This file defines the interfaces that VE uses to lower LLVM code into a | 
 | // selection DAG. | 
 | // | 
 | //===----------------------------------------------------------------------===// | 
 |  | 
 | #ifndef LLVM_LIB_TARGET_VE_VEISELLOWERING_H | 
 | #define LLVM_LIB_TARGET_VE_VEISELLOWERING_H | 
 |  | 
 | #include "VE.h" | 
 | #include "llvm/CodeGen/TargetLowering.h" | 
 |  | 
 | namespace llvm { | 
 | class VESubtarget; | 
 |  | 
 | namespace VEISD { | 
 | enum NodeType : unsigned { | 
 |   FIRST_NUMBER = ISD::BUILTIN_OP_END, | 
 |  | 
 |   CMPI, // Compare between two signed integer values. | 
 |   CMPU, // Compare between two unsigned integer values. | 
 |   CMPF, // Compare between two floating-point values. | 
 |   CMPQ, // Compare between two quad floating-point values. | 
 |   CMOV, // Select between two values using the result of comparison. | 
 |  | 
 |   CALL,                   // A call instruction. | 
 |   EH_SJLJ_LONGJMP,        // SjLj exception handling longjmp. | 
 |   EH_SJLJ_SETJMP,         // SjLj exception handling setjmp. | 
 |   EH_SJLJ_SETUP_DISPATCH, // SjLj exception handling setup_dispatch. | 
 |   GETFUNPLT,              // Load function address through %plt insturction. | 
 |   GETTLSADDR,             // Load address for TLS access. | 
 |   GETSTACKTOP,            // Retrieve address of stack top (first address of | 
 |                           // locals and temporaries). | 
 |   GLOBAL_BASE_REG,        // Global base reg for PIC. | 
 |   Hi,                     // Hi/Lo operations, typically on a global address. | 
 |   Lo,                     // Hi/Lo operations, typically on a global address. | 
 |   RET_FLAG,               // Return with a flag operand. | 
 |   TS1AM,                  // A TS1AM instruction used for 1/2 bytes swap. | 
 |   VEC_UNPACK_LO,          // unpack the lo v256 slice of a packed v512 vector. | 
 |   VEC_UNPACK_HI,          // unpack the hi v256 slice of a packed v512 vector. | 
 |                           //    0: v512 vector, 1: AVL | 
 |   VEC_PACK,               // pack a lo and a hi vector into one v512 vector | 
 |                           //    0: v256 lo vector, 1: v256 hi vector, 2: AVL | 
 |  | 
 |   VEC_BROADCAST, // A vector broadcast instruction. | 
 |                  //   0: scalar value, 1: VL | 
 |   REPL_I32, | 
 |   REPL_F32, // Replicate subregister to other half. | 
 |  | 
 |   // Annotation as a wrapper. LEGALAVL(VL) means that VL refers to 64bit of | 
 |   // data, whereas the raw EVL coming in from VP nodes always refers to number | 
 |   // of elements, regardless of their size. | 
 |   LEGALAVL, | 
 |  | 
 | // VVP_* nodes. | 
 | #define ADD_VVP_OP(VVP_NAME, ...) VVP_NAME, | 
 | #include "VVPNodes.def" | 
 | }; | 
 | } | 
 |  | 
 | class VECustomDAG; | 
 |  | 
 | class VETargetLowering : public TargetLowering { | 
 |   const VESubtarget *Subtarget; | 
 |  | 
 |   void initRegisterClasses(); | 
 |   void initSPUActions(); | 
 |   void initVPUActions(); | 
 |  | 
 | public: | 
 |   VETargetLowering(const TargetMachine &TM, const VESubtarget &STI); | 
 |  | 
 |   const char *getTargetNodeName(unsigned Opcode) const override; | 
 |   MVT getScalarShiftAmountTy(const DataLayout &, EVT) const override { | 
 |     return MVT::i32; | 
 |   } | 
 |  | 
 |   Register getRegisterByName(const char *RegName, LLT VT, | 
 |                              const MachineFunction &MF) const override; | 
 |  | 
 |   /// getSetCCResultType - Return the ISD::SETCC ValueType | 
 |   EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Context, | 
 |                          EVT VT) const override; | 
 |  | 
 |   SDValue LowerFormalArguments(SDValue Chain, CallingConv::ID CallConv, | 
 |                                bool isVarArg, | 
 |                                const SmallVectorImpl<ISD::InputArg> &Ins, | 
 |                                const SDLoc &dl, SelectionDAG &DAG, | 
 |                                SmallVectorImpl<SDValue> &InVals) const override; | 
 |  | 
 |   SDValue LowerCall(TargetLowering::CallLoweringInfo &CLI, | 
 |                     SmallVectorImpl<SDValue> &InVals) const override; | 
 |  | 
 |   bool CanLowerReturn(CallingConv::ID CallConv, MachineFunction &MF, | 
 |                       bool isVarArg, | 
 |                       const SmallVectorImpl<ISD::OutputArg> &ArgsFlags, | 
 |                       LLVMContext &Context) const override; | 
 |   SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool isVarArg, | 
 |                       const SmallVectorImpl<ISD::OutputArg> &Outs, | 
 |                       const SmallVectorImpl<SDValue> &OutVals, const SDLoc &dl, | 
 |                       SelectionDAG &DAG) const override; | 
 |  | 
 |   /// Helper functions for atomic operations. | 
 |   bool shouldInsertFencesForAtomic(const Instruction *I) const override { | 
 |     // VE uses release consistency, so need fence for each atomics. | 
 |     return true; | 
 |   } | 
 |   Instruction *emitLeadingFence(IRBuilderBase &Builder, Instruction *Inst, | 
 |                                 AtomicOrdering Ord) const override; | 
 |   Instruction *emitTrailingFence(IRBuilderBase &Builder, Instruction *Inst, | 
 |                                  AtomicOrdering Ord) const override; | 
 |   TargetLoweringBase::AtomicExpansionKind | 
 |   shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override; | 
 |   ISD::NodeType getExtendForAtomicOps() const override { | 
 |     return ISD::ANY_EXTEND; | 
 |   } | 
 |  | 
 |   /// Custom Lower { | 
 |   TargetLoweringBase::LegalizeAction | 
 |   getCustomOperationAction(SDNode &) const override; | 
 |  | 
 |   SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override; | 
 |   unsigned getJumpTableEncoding() const override; | 
 |   const MCExpr *LowerCustomJumpTableEntry(const MachineJumpTableInfo *MJTI, | 
 |                                           const MachineBasicBlock *MBB, | 
 |                                           unsigned Uid, | 
 |                                           MCContext &Ctx) const override; | 
 |   SDValue getPICJumpTableRelocBase(SDValue Table, | 
 |                                    SelectionDAG &DAG) const override; | 
 |   // VE doesn't need getPICJumpTableRelocBaseExpr since it is used for only | 
 |   // EK_LabelDifference32. | 
 |  | 
 |   SDValue lowerATOMIC_FENCE(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerATOMIC_SWAP(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerBlockAddress(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerConstantPool(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerEH_SJLJ_LONGJMP(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerEH_SJLJ_SETJMP(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerEH_SJLJ_SETUP_DISPATCH(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerGlobalAddress(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerGlobalTLSAddress(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerJumpTable(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerLOAD(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerSTORE(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerToTLSGeneralDynamicModel(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerVASTART(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerVAARG(SDValue Op, SelectionDAG &DAG) const; | 
 |  | 
 |   SDValue lowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const; | 
 |   /// } Custom Lower | 
 |  | 
 |   /// Replace the results of node with an illegal result | 
 |   /// type with new values built out of custom code. | 
 |   /// | 
 |   void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue> &Results, | 
 |                           SelectionDAG &DAG) const override; | 
 |  | 
 |   /// Custom Inserter { | 
 |   MachineBasicBlock * | 
 |   EmitInstrWithCustomInserter(MachineInstr &MI, | 
 |                               MachineBasicBlock *MBB) const override; | 
 |   MachineBasicBlock *emitEHSjLjLongJmp(MachineInstr &MI, | 
 |                                        MachineBasicBlock *MBB) const; | 
 |   MachineBasicBlock *emitEHSjLjSetJmp(MachineInstr &MI, | 
 |                                       MachineBasicBlock *MBB) const; | 
 |   MachineBasicBlock *emitSjLjDispatchBlock(MachineInstr &MI, | 
 |                                            MachineBasicBlock *BB) const; | 
 |  | 
 |   void setupEntryBlockForSjLj(MachineInstr &MI, MachineBasicBlock *MBB, | 
 |                               MachineBasicBlock *DispatchBB, int FI, | 
 |                               int Offset) const; | 
 |   // Setup basic block address. | 
 |   Register prepareMBB(MachineBasicBlock &MBB, MachineBasicBlock::iterator I, | 
 |                       MachineBasicBlock *TargetBB, const DebugLoc &DL) const; | 
 |   // Prepare function/variable address. | 
 |   Register prepareSymbol(MachineBasicBlock &MBB, MachineBasicBlock::iterator I, | 
 |                          StringRef Symbol, const DebugLoc &DL, bool IsLocal, | 
 |                          bool IsCall) const; | 
 |   /// } Custom Inserter | 
 |  | 
 |   /// VVP Lowering { | 
 |   SDValue lowerToVVP(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue lowerVVP_LOAD_STORE(SDValue Op, VECustomDAG &) const; | 
 |   SDValue lowerVVP_GATHER_SCATTER(SDValue Op, VECustomDAG &) const; | 
 |  | 
 |   SDValue legalizeInternalVectorOp(SDValue Op, SelectionDAG &DAG) const; | 
 |   SDValue legalizeInternalLoadStoreOp(SDValue Op, VECustomDAG &CDAG) const; | 
 |   SDValue splitVectorOp(SDValue Op, VECustomDAG &CDAG) const; | 
 |   SDValue splitPackedLoadStore(SDValue Op, VECustomDAG &CDAG) const; | 
 |   SDValue legalizePackedAVL(SDValue Op, VECustomDAG &CDAG) const; | 
 |   SDValue splitMaskArithmetic(SDValue Op, SelectionDAG &DAG) const; | 
 |   /// } VVPLowering | 
 |  | 
 |   /// Custom DAGCombine { | 
 |   SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override; | 
 |  | 
 |   SDValue combineSelect(SDNode *N, DAGCombinerInfo &DCI) const; | 
 |   SDValue combineSelectCC(SDNode *N, DAGCombinerInfo &DCI) const; | 
 |   SDValue combineTRUNCATE(SDNode *N, DAGCombinerInfo &DCI) const; | 
 |   /// } Custom DAGCombine | 
 |  | 
 |   SDValue withTargetFlags(SDValue Op, unsigned TF, SelectionDAG &DAG) const; | 
 |   SDValue makeHiLoPair(SDValue Op, unsigned HiTF, unsigned LoTF, | 
 |                        SelectionDAG &DAG) const; | 
 |   SDValue makeAddress(SDValue Op, SelectionDAG &DAG) const; | 
 |  | 
 |   bool isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const override; | 
 |   bool isFPImmLegal(const APFloat &Imm, EVT VT, | 
 |                     bool ForCodeSize) const override; | 
 |   /// Returns true if the target allows unaligned memory accesses of the | 
 |   /// specified type. | 
 |   bool allowsMisalignedMemoryAccesses(EVT VT, unsigned AS, Align A, | 
 |                                       MachineMemOperand::Flags Flags, | 
 |                                       unsigned *Fast) const override; | 
 |  | 
 |   /// Inline Assembly { | 
 |  | 
 |   ConstraintType getConstraintType(StringRef Constraint) const override; | 
 |   std::pair<unsigned, const TargetRegisterClass *> | 
 |   getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI, | 
 |                                StringRef Constraint, MVT VT) const override; | 
 |  | 
 |   /// } Inline Assembly | 
 |  | 
 |   /// Target Optimization { | 
 |  | 
 |   // Return lower limit for number of blocks in a jump table. | 
 |   unsigned getMinimumJumpTableEntries() const override; | 
 |  | 
 |   // SX-Aurora VE's s/udiv is 5-9 times slower than multiply. | 
 |   bool isIntDivCheap(EVT, AttributeList) const override { return false; } | 
 |   // VE doesn't have rem. | 
 |   bool hasStandaloneRem(EVT) const override { return false; } | 
 |   // VE LDZ instruction returns 64 if the input is zero. | 
 |   bool isCheapToSpeculateCtlz(Type *) const override { return true; } | 
 |   // VE LDZ instruction is fast. | 
 |   bool isCtlzFast() const override { return true; } | 
 |   // VE has NND instruction. | 
 |   bool hasAndNot(SDValue Y) const override; | 
 |  | 
 |   /// } Target Optimization | 
 | }; | 
 | } // namespace llvm | 
 |  | 
 | #endif // LLVM_LIB_TARGET_VE_VEISELLOWERING_H |