|  | //===- subzero/src/IceAssemblerX86Base.h - base x86 assembler -*- C++ -*---===// | 
|  | // | 
|  | // Copyright (c) 2013, the Dart project authors.  Please see the AUTHORS file | 
|  | // for details. All rights reserved. Use of this source code is governed by a | 
|  | // BSD-style license that can be found in the LICENSE file. | 
|  | // | 
|  | // Modified by the Subzero authors. | 
|  | // | 
|  | //===----------------------------------------------------------------------===// | 
|  | // | 
|  | //                        The Subzero Code Generator | 
|  | // | 
|  | // This file is distributed under the University of Illinois Open Source | 
|  | // License. See LICENSE.TXT for details. | 
|  | // | 
|  | //===----------------------------------------------------------------------===// | 
|  | // | 
|  | /// \file | 
|  | /// \brief Defines the AssemblerX86 template class for x86, the base of all X86 | 
|  | /// assemblers. | 
|  | // | 
|  | //===----------------------------------------------------------------------===// | 
|  |  | 
|  | #ifndef SUBZERO_SRC_ICEASSEMBLERX86BASE_H | 
|  | #define SUBZERO_SRC_ICEASSEMBLERX86BASE_H | 
|  |  | 
|  | #include "IceAssembler.h" | 
|  | #include "IceDefs.h" | 
|  | #include "IceOperand.h" | 
|  | #include "IceTypes.h" | 
|  | #include "IceUtils.h" | 
|  |  | 
|  | namespace Ice { | 
|  |  | 
|  | #ifndef X86NAMESPACE | 
|  | #error "You must define the X86 Target namespace." | 
|  | #endif | 
|  |  | 
|  | namespace X86NAMESPACE { | 
|  |  | 
|  | template <typename TraitsType> | 
|  | class AssemblerX86Base : public ::Ice::Assembler { | 
|  | AssemblerX86Base(const AssemblerX86Base &) = delete; | 
|  | AssemblerX86Base &operator=(const AssemblerX86Base &) = delete; | 
|  |  | 
|  | protected: | 
|  | explicit AssemblerX86Base(bool EmitAddrSizeOverridePrefix = Traits::Is64Bit) | 
|  | : Assembler(Traits::AsmKind), | 
|  | EmitAddrSizeOverridePrefix(EmitAddrSizeOverridePrefix) { | 
|  | assert(Traits::Is64Bit || !EmitAddrSizeOverridePrefix); | 
|  | } | 
|  |  | 
|  | public: | 
|  | using Traits = TraitsType; | 
|  | using Address = typename Traits::Address; | 
|  | using ByteRegister = typename Traits::ByteRegister; | 
|  | using BrCond = typename Traits::Cond::BrCond; | 
|  | using CmppsCond = typename Traits::Cond::CmppsCond; | 
|  | using GPRRegister = typename Traits::GPRRegister; | 
|  | using Operand = typename Traits::Operand; | 
|  | using XmmRegister = typename Traits::XmmRegister; | 
|  |  | 
|  | static constexpr int MAX_NOP_SIZE = 8; | 
|  |  | 
|  | static bool classof(const Assembler *Asm) { | 
|  | return Asm->getKind() == Traits::AsmKind; | 
|  | } | 
|  |  | 
|  | class Immediate { | 
|  | Immediate(const Immediate &) = delete; | 
|  | Immediate &operator=(const Immediate &) = delete; | 
|  |  | 
|  | public: | 
|  | explicit Immediate(int32_t value) : value_(value) {} | 
|  |  | 
|  | explicit Immediate(AssemblerFixup *fixup) : fixup_(fixup) {} | 
|  |  | 
|  | int32_t value() const { return value_; } | 
|  | AssemblerFixup *fixup() const { return fixup_; } | 
|  |  | 
|  | bool is_int8() const { | 
|  | // We currently only allow 32-bit fixups, and they usually have value = 0, | 
|  | // so if fixup_ != nullptr, it shouldn't be classified as int8/16. | 
|  | return fixup_ == nullptr && Utils::IsInt(8, value_); | 
|  | } | 
|  | bool is_uint8() const { | 
|  | return fixup_ == nullptr && Utils::IsUint(8, value_); | 
|  | } | 
|  | bool is_uint16() const { | 
|  | return fixup_ == nullptr && Utils::IsUint(16, value_); | 
|  | } | 
|  |  | 
|  | private: | 
|  | const int32_t value_ = 0; | 
|  | AssemblerFixup *fixup_ = nullptr; | 
|  | }; | 
|  |  | 
|  | /// X86 allows near and far jumps. | 
|  | class Label final : public Ice::Label { | 
|  | Label(const Label &) = delete; | 
|  | Label &operator=(const Label &) = delete; | 
|  |  | 
|  | public: | 
|  | Label() = default; | 
|  | ~Label() = default; | 
|  |  | 
|  | void finalCheck() const override { | 
|  | Ice::Label::finalCheck(); | 
|  | assert(!hasNear()); | 
|  | } | 
|  |  | 
|  | /// Returns the position of an earlier branch instruction which assumes that | 
|  | /// this label is "near", and bumps iterator to the next near position. | 
|  | intptr_t getNearPosition() { | 
|  | assert(hasNear()); | 
|  | intptr_t Pos = UnresolvedNearPositions.back(); | 
|  | UnresolvedNearPositions.pop_back(); | 
|  | return Pos; | 
|  | } | 
|  |  | 
|  | bool hasNear() const { return !UnresolvedNearPositions.empty(); } | 
|  | bool isUnused() const override { | 
|  | return Ice::Label::isUnused() && !hasNear(); | 
|  | } | 
|  |  | 
|  | private: | 
|  | friend class AssemblerX86Base<TraitsType>; | 
|  |  | 
|  | void nearLinkTo(const Assembler &Asm, intptr_t position) { | 
|  | if (Asm.getPreliminary()) | 
|  | return; | 
|  | assert(!isBound()); | 
|  | UnresolvedNearPositions.push_back(position); | 
|  | } | 
|  |  | 
|  | llvm::SmallVector<intptr_t, 20> UnresolvedNearPositions; | 
|  | }; | 
|  |  | 
|  | public: | 
|  | ~AssemblerX86Base() override; | 
|  |  | 
|  | static const bool kNearJump = true; | 
|  | static const bool kFarJump = false; | 
|  |  | 
|  | void alignFunction() override; | 
|  |  | 
|  | SizeT getBundleAlignLog2Bytes() const override { return 5; } | 
|  |  | 
|  | const char *getAlignDirective() const override { return ".p2align"; } | 
|  |  | 
|  | llvm::ArrayRef<uint8_t> getNonExecBundlePadding() const override { | 
|  | static const uint8_t Padding[] = {0xF4}; | 
|  | return llvm::ArrayRef<uint8_t>(Padding, 1); | 
|  | } | 
|  |  | 
|  | void padWithNop(intptr_t Padding) override { | 
|  | while (Padding > MAX_NOP_SIZE) { | 
|  | nop(MAX_NOP_SIZE); | 
|  | Padding -= MAX_NOP_SIZE; | 
|  | } | 
|  | if (Padding) | 
|  | nop(Padding); | 
|  | } | 
|  |  | 
|  | Ice::Label *getCfgNodeLabel(SizeT NodeNumber) override; | 
|  | void bindCfgNodeLabel(const CfgNode *Node) override; | 
|  | Label *getOrCreateCfgNodeLabel(SizeT Number); | 
|  | Label *getOrCreateLocalLabel(SizeT Number); | 
|  | void bindLocalLabel(SizeT Number); | 
|  |  | 
|  | bool fixupIsPCRel(FixupKind Kind) const override { | 
|  | // Currently assuming this is the only PC-rel relocation type used. | 
|  | // TODO(jpp): Traits.PcRelTypes.count(Kind) != 0 | 
|  | return Kind == Traits::FK_PcRel; | 
|  | } | 
|  |  | 
|  | // Operations to emit GPR instructions (and dispatch on operand type). | 
|  | using TypedEmitGPR = void (AssemblerX86Base::*)(Type, GPRRegister); | 
|  | using TypedEmitAddr = void (AssemblerX86Base::*)(Type, const Address &); | 
|  | struct GPREmitterOneOp { | 
|  | TypedEmitGPR Reg; | 
|  | TypedEmitAddr Addr; | 
|  | }; | 
|  |  | 
|  | using TypedEmitGPRGPR = void (AssemblerX86Base::*)(Type, GPRRegister, | 
|  | GPRRegister); | 
|  | using TypedEmitGPRAddr = void (AssemblerX86Base::*)(Type, GPRRegister, | 
|  | const Address &); | 
|  | using TypedEmitGPRImm = void (AssemblerX86Base::*)(Type, GPRRegister, | 
|  | const Immediate &); | 
|  | struct GPREmitterRegOp { | 
|  | TypedEmitGPRGPR GPRGPR; | 
|  | TypedEmitGPRAddr GPRAddr; | 
|  | TypedEmitGPRImm GPRImm; | 
|  | }; | 
|  |  | 
|  | struct GPREmitterShiftOp { | 
|  | // Technically, Addr/GPR and Addr/Imm are also allowed, but */Addr are | 
|  | // not. In practice, we always normalize the Dest to a Register first. | 
|  | TypedEmitGPRGPR GPRGPR; | 
|  | TypedEmitGPRImm GPRImm; | 
|  | }; | 
|  |  | 
|  | using TypedEmitGPRGPRImm = void (AssemblerX86Base::*)(Type, GPRRegister, | 
|  | GPRRegister, | 
|  | const Immediate &); | 
|  | struct GPREmitterShiftD { | 
|  | // Technically AddrGPR and AddrGPRImm are also allowed, but in practice we | 
|  | // always normalize Dest to a Register first. | 
|  | TypedEmitGPRGPR GPRGPR; | 
|  | TypedEmitGPRGPRImm GPRGPRImm; | 
|  | }; | 
|  |  | 
|  | using TypedEmitAddrGPR = void (AssemblerX86Base::*)(Type, const Address &, | 
|  | GPRRegister); | 
|  | using TypedEmitAddrImm = void (AssemblerX86Base::*)(Type, const Address &, | 
|  | const Immediate &); | 
|  | struct GPREmitterAddrOp { | 
|  | TypedEmitAddrGPR AddrGPR; | 
|  | TypedEmitAddrImm AddrImm; | 
|  | }; | 
|  |  | 
|  | // Operations to emit XMM instructions (and dispatch on operand type). | 
|  | using TypedEmitXmmXmm = void (AssemblerX86Base::*)(Type, XmmRegister, | 
|  | XmmRegister); | 
|  | using TypedEmitXmmAddr = void (AssemblerX86Base::*)(Type, XmmRegister, | 
|  | const Address &); | 
|  | struct XmmEmitterRegOp { | 
|  | TypedEmitXmmXmm XmmXmm; | 
|  | TypedEmitXmmAddr XmmAddr; | 
|  | }; | 
|  |  | 
|  | using EmitXmmXmm = void (AssemblerX86Base::*)(XmmRegister, XmmRegister); | 
|  | using EmitXmmAddr = void (AssemblerX86Base::*)(XmmRegister, const Address &); | 
|  | using EmitAddrXmm = void (AssemblerX86Base::*)(const Address &, XmmRegister); | 
|  | struct XmmEmitterMovOps { | 
|  | EmitXmmXmm XmmXmm; | 
|  | EmitXmmAddr XmmAddr; | 
|  | EmitAddrXmm AddrXmm; | 
|  | }; | 
|  |  | 
|  | using TypedEmitXmmImm = void (AssemblerX86Base::*)(Type, XmmRegister, | 
|  | const Immediate &); | 
|  |  | 
|  | struct XmmEmitterShiftOp { | 
|  | TypedEmitXmmXmm XmmXmm; | 
|  | TypedEmitXmmAddr XmmAddr; | 
|  | TypedEmitXmmImm XmmImm; | 
|  | }; | 
|  |  | 
|  | // Cross Xmm/GPR cast instructions. | 
|  | template <typename DReg_t, typename SReg_t> struct CastEmitterRegOp { | 
|  | using TypedEmitRegs = void (AssemblerX86Base::*)(Type, DReg_t, Type, | 
|  | SReg_t); | 
|  | using TypedEmitAddr = void (AssemblerX86Base::*)(Type, DReg_t, Type, | 
|  | const Address &); | 
|  |  | 
|  | TypedEmitRegs RegReg; | 
|  | TypedEmitAddr RegAddr; | 
|  | }; | 
|  |  | 
|  | // Three operand (potentially) cross Xmm/GPR instructions. The last operand | 
|  | // must be an immediate. | 
|  | template <typename DReg_t, typename SReg_t> struct ThreeOpImmEmitter { | 
|  | using TypedEmitRegRegImm = void (AssemblerX86Base::*)(Type, DReg_t, SReg_t, | 
|  | const Immediate &); | 
|  | using TypedEmitRegAddrImm = void (AssemblerX86Base::*)(Type, DReg_t, | 
|  | const Address &, | 
|  | const Immediate &); | 
|  |  | 
|  | TypedEmitRegRegImm RegRegImm; | 
|  | TypedEmitRegAddrImm RegAddrImm; | 
|  | }; | 
|  |  | 
|  | /* | 
|  | * Emit Machine Instructions. | 
|  | */ | 
|  | void call(GPRRegister reg); | 
|  | void call(const Address &address); | 
|  | void call(const ConstantRelocatable *label); // not testable. | 
|  | void call(const Immediate &abs_address); | 
|  |  | 
|  | static const intptr_t kCallExternalLabelSize = 5; | 
|  |  | 
|  | void pushl(GPRRegister reg); | 
|  | void pushl(const Immediate &Imm); | 
|  | void pushl(const ConstantRelocatable *Label); | 
|  |  | 
|  | void popl(GPRRegister reg); | 
|  | void popl(const Address &address); | 
|  |  | 
|  | template <typename T = Traits, | 
|  | typename = typename std::enable_if<T::HasPusha>::type> | 
|  | void pushal(); | 
|  | template <typename T = Traits, | 
|  | typename = typename std::enable_if<T::HasPopa>::type> | 
|  | void popal(); | 
|  |  | 
|  | void setcc(BrCond condition, ByteRegister dst); | 
|  | void setcc(BrCond condition, const Address &address); | 
|  |  | 
|  | void mov(Type Ty, GPRRegister dst, const Immediate &src); | 
|  | void mov(Type Ty, GPRRegister dst, GPRRegister src); | 
|  | void mov(Type Ty, GPRRegister dst, const Address &src); | 
|  | void mov(Type Ty, const Address &dst, GPRRegister src); | 
|  | void mov(Type Ty, const Address &dst, const Immediate &imm); | 
|  |  | 
|  | template <typename T = Traits> | 
|  | typename std::enable_if<T::Is64Bit, void>::type movabs(const GPRRegister Dst, | 
|  | uint64_t Imm64); | 
|  | template <typename T = Traits> | 
|  | typename std::enable_if<!T::Is64Bit, void>::type movabs(const GPRRegister, | 
|  | uint64_t) { | 
|  | llvm::report_fatal_error("movabs is only supported in 64-bit x86 targets."); | 
|  | } | 
|  |  | 
|  | void movzx(Type Ty, GPRRegister dst, GPRRegister src); | 
|  | void movzx(Type Ty, GPRRegister dst, const Address &src); | 
|  | void movsx(Type Ty, GPRRegister dst, GPRRegister src); | 
|  | void movsx(Type Ty, GPRRegister dst, const Address &src); | 
|  |  | 
|  | void lea(Type Ty, GPRRegister dst, const Address &src); | 
|  |  | 
|  | void cmov(Type Ty, BrCond cond, GPRRegister dst, GPRRegister src); | 
|  | void cmov(Type Ty, BrCond cond, GPRRegister dst, const Address &src); | 
|  |  | 
|  | void rep_movsb(); | 
|  |  | 
|  | void movss(Type Ty, XmmRegister dst, const Address &src); | 
|  | void movss(Type Ty, const Address &dst, XmmRegister src); | 
|  | void movss(Type Ty, XmmRegister dst, XmmRegister src); | 
|  |  | 
|  | void movd(Type SrcTy, XmmRegister dst, GPRRegister src); | 
|  | void movd(Type SrcTy, XmmRegister dst, const Address &src); | 
|  | void movd(Type DestTy, GPRRegister dst, XmmRegister src); | 
|  | void movd(Type DestTy, const Address &dst, XmmRegister src); | 
|  |  | 
|  | void movq(XmmRegister dst, XmmRegister src); | 
|  | void movq(const Address &dst, XmmRegister src); | 
|  | void movq(XmmRegister dst, const Address &src); | 
|  |  | 
|  | void addss(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void addss(Type Ty, XmmRegister dst, const Address &src); | 
|  | void subss(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void subss(Type Ty, XmmRegister dst, const Address &src); | 
|  | void mulss(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void mulss(Type Ty, XmmRegister dst, const Address &src); | 
|  | void divss(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void divss(Type Ty, XmmRegister dst, const Address &src); | 
|  |  | 
|  | void movaps(XmmRegister dst, XmmRegister src); | 
|  |  | 
|  | void movups(XmmRegister dst, XmmRegister src); | 
|  | void movups(XmmRegister dst, const Address &src); | 
|  | void movups(const Address &dst, XmmRegister src); | 
|  |  | 
|  | void padd(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void padd(Type Ty, XmmRegister dst, const Address &src); | 
|  | void pand(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void pand(Type Ty, XmmRegister dst, const Address &src); | 
|  | void pandn(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void pandn(Type Ty, XmmRegister dst, const Address &src); | 
|  | void pmull(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void pmull(Type Ty, XmmRegister dst, const Address &src); | 
|  | void pmuludq(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void pmuludq(Type Ty, XmmRegister dst, const Address &src); | 
|  | void por(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void por(Type Ty, XmmRegister dst, const Address &src); | 
|  | void psub(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void psub(Type Ty, XmmRegister dst, const Address &src); | 
|  | void pxor(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void pxor(Type Ty, XmmRegister dst, const Address &src); | 
|  |  | 
|  | void psll(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void psll(Type Ty, XmmRegister dst, const Address &src); | 
|  | void psll(Type Ty, XmmRegister dst, const Immediate &src); | 
|  |  | 
|  | void psra(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void psra(Type Ty, XmmRegister dst, const Address &src); | 
|  | void psra(Type Ty, XmmRegister dst, const Immediate &src); | 
|  | void psrl(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void psrl(Type Ty, XmmRegister dst, const Address &src); | 
|  | void psrl(Type Ty, XmmRegister dst, const Immediate &src); | 
|  |  | 
|  | void addps(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void addps(Type Ty, XmmRegister dst, const Address &src); | 
|  | void subps(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void subps(Type Ty, XmmRegister dst, const Address &src); | 
|  | void divps(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void divps(Type Ty, XmmRegister dst, const Address &src); | 
|  | void mulps(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void mulps(Type Ty, XmmRegister dst, const Address &src); | 
|  | void minps(Type Ty, XmmRegister dst, const Address &src); | 
|  | void minps(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void minss(Type Ty, XmmRegister dst, const Address &src); | 
|  | void minss(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void maxps(Type Ty, XmmRegister dst, const Address &src); | 
|  | void maxps(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void maxss(Type Ty, XmmRegister dst, const Address &src); | 
|  | void maxss(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void andnps(Type Ty, XmmRegister dst, const Address &src); | 
|  | void andnps(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void andps(Type Ty, XmmRegister dst, const Address &src); | 
|  | void andps(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void orps(Type Ty, XmmRegister dst, const Address &src); | 
|  | void orps(Type Ty, XmmRegister dst, XmmRegister src); | 
|  |  | 
|  | void blendvps(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void blendvps(Type Ty, XmmRegister dst, const Address &src); | 
|  | void pblendvb(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void pblendvb(Type Ty, XmmRegister dst, const Address &src); | 
|  |  | 
|  | void cmpps(Type Ty, XmmRegister dst, XmmRegister src, CmppsCond CmpCondition); | 
|  | void cmpps(Type Ty, XmmRegister dst, const Address &src, | 
|  | CmppsCond CmpCondition); | 
|  |  | 
|  | void sqrtps(XmmRegister dst); | 
|  | void rsqrtps(XmmRegister dst); | 
|  | void reciprocalps(XmmRegister dst); | 
|  |  | 
|  | void movhlps(XmmRegister dst, XmmRegister src); | 
|  | void movlhps(XmmRegister dst, XmmRegister src); | 
|  | void unpcklps(XmmRegister dst, XmmRegister src); | 
|  | void unpckhps(XmmRegister dst, XmmRegister src); | 
|  | void unpcklpd(XmmRegister dst, XmmRegister src); | 
|  | void unpckhpd(XmmRegister dst, XmmRegister src); | 
|  |  | 
|  | void set1ps(XmmRegister dst, GPRRegister tmp, const Immediate &imm); | 
|  |  | 
|  | void sqrtpd(XmmRegister dst); | 
|  |  | 
|  | void pshufd(Type Ty, XmmRegister dst, XmmRegister src, const Immediate &mask); | 
|  | void pshufd(Type Ty, XmmRegister dst, const Address &src, | 
|  | const Immediate &mask); | 
|  | void shufps(Type Ty, XmmRegister dst, XmmRegister src, const Immediate &mask); | 
|  | void shufps(Type Ty, XmmRegister dst, const Address &src, | 
|  | const Immediate &mask); | 
|  |  | 
|  | void cvtdq2ps(Type, XmmRegister dst, XmmRegister src); | 
|  | void cvtdq2ps(Type, XmmRegister dst, const Address &src); | 
|  |  | 
|  | void cvttps2dq(Type, XmmRegister dst, XmmRegister src); | 
|  | void cvttps2dq(Type, XmmRegister dst, const Address &src); | 
|  |  | 
|  | void cvtsi2ss(Type DestTy, XmmRegister dst, Type SrcTy, GPRRegister src); | 
|  | void cvtsi2ss(Type DestTy, XmmRegister dst, Type SrcTy, const Address &src); | 
|  |  | 
|  | void cvtfloat2float(Type SrcTy, XmmRegister dst, XmmRegister src); | 
|  | void cvtfloat2float(Type SrcTy, XmmRegister dst, const Address &src); | 
|  |  | 
|  | void cvttss2si(Type DestTy, GPRRegister dst, Type SrcTy, XmmRegister src); | 
|  | void cvttss2si(Type DestTy, GPRRegister dst, Type SrcTy, const Address &src); | 
|  |  | 
|  | void ucomiss(Type Ty, XmmRegister a, XmmRegister b); | 
|  | void ucomiss(Type Ty, XmmRegister a, const Address &b); | 
|  |  | 
|  | void movmskpd(GPRRegister dst, XmmRegister src); | 
|  | void movmskps(GPRRegister dst, XmmRegister src); | 
|  |  | 
|  | void sqrtss(Type Ty, XmmRegister dst, const Address &src); | 
|  | void sqrtss(Type Ty, XmmRegister dst, XmmRegister src); | 
|  |  | 
|  | void xorps(Type Ty, XmmRegister dst, const Address &src); | 
|  | void xorps(Type Ty, XmmRegister dst, XmmRegister src); | 
|  |  | 
|  | void insertps(Type Ty, XmmRegister dst, XmmRegister src, | 
|  | const Immediate &imm); | 
|  | void insertps(Type Ty, XmmRegister dst, const Address &src, | 
|  | const Immediate &imm); | 
|  |  | 
|  | void pinsr(Type Ty, XmmRegister dst, GPRRegister src, const Immediate &imm); | 
|  | void pinsr(Type Ty, XmmRegister dst, const Address &src, | 
|  | const Immediate &imm); | 
|  |  | 
|  | void pextr(Type Ty, GPRRegister dst, XmmRegister src, const Immediate &imm); | 
|  |  | 
|  | void pmovsxdq(XmmRegister dst, XmmRegister src); | 
|  |  | 
|  | void pcmpeq(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void pcmpeq(Type Ty, XmmRegister dst, const Address &src); | 
|  | void pcmpgt(Type Ty, XmmRegister dst, XmmRegister src); | 
|  | void pcmpgt(Type Ty, XmmRegister dst, const Address &src); | 
|  |  | 
|  | enum RoundingMode { | 
|  | kRoundToNearest = 0x0, | 
|  | kRoundDown = 0x1, | 
|  | kRoundUp = 0x2, | 
|  | kRoundToZero = 0x3 | 
|  | }; | 
|  | void roundsd(XmmRegister dst, XmmRegister src, RoundingMode mode); | 
|  |  | 
|  | //---------------------------------------------------------------------------- | 
|  | // | 
|  | // Begin: X87 instructions. Only available when Traits::UsesX87. | 
|  | // | 
|  | //---------------------------------------------------------------------------- | 
|  | template <typename T = Traits, | 
|  | typename = typename std::enable_if<T::UsesX87>::type> | 
|  | void fld(Type Ty, const typename T::Address &src); | 
|  | template <typename T = Traits, | 
|  | typename = typename std::enable_if<T::UsesX87>::type> | 
|  | void fstp(Type Ty, const typename T::Address &dst); | 
|  | template <typename T = Traits, | 
|  | typename = typename std::enable_if<T::UsesX87>::type> | 
|  | void fstp(typename T::X87STRegister st); | 
|  |  | 
|  | template <typename T = Traits, | 
|  | typename = typename std::enable_if<T::UsesX87>::type> | 
|  | void fnstcw(const typename T::Address &dst); | 
|  | template <typename T = Traits, | 
|  | typename = typename std::enable_if<T::UsesX87>::type> | 
|  | void fldcw(const typename T::Address &src); | 
|  |  | 
|  | template <typename T = Traits, | 
|  | typename = typename std::enable_if<T::UsesX87>::type> | 
|  | void fistpl(const typename T::Address &dst); | 
|  | template <typename T = Traits, | 
|  | typename = typename std::enable_if<T::UsesX87>::type> | 
|  | void fistps(const typename T::Address &dst); | 
|  | template <typename T = Traits, | 
|  | typename = typename std::enable_if<T::UsesX87>::type> | 
|  | void fildl(const typename T::Address &src); | 
|  | template <typename T = Traits, | 
|  | typename = typename std::enable_if<T::UsesX87>::type> | 
|  | void filds(const typename T::Address &src); | 
|  |  | 
|  | template <typename T = Traits, | 
|  | typename = typename std::enable_if<T::UsesX87>::type> | 
|  | void fincstp(); | 
|  | //---------------------------------------------------------------------------- | 
|  | // | 
|  | // End: X87 instructions. | 
|  | // | 
|  | //---------------------------------------------------------------------------- | 
|  |  | 
|  | void cmp(Type Ty, GPRRegister reg0, GPRRegister reg1); | 
|  | void cmp(Type Ty, GPRRegister reg, const Address &address); | 
|  | void cmp(Type Ty, GPRRegister reg, const Immediate &imm); | 
|  | void cmp(Type Ty, const Address &address, GPRRegister reg); | 
|  | void cmp(Type Ty, const Address &address, const Immediate &imm); | 
|  |  | 
|  | void test(Type Ty, GPRRegister reg0, GPRRegister reg1); | 
|  | void test(Type Ty, GPRRegister reg, const Immediate &imm); | 
|  | void test(Type Ty, const Address &address, GPRRegister reg); | 
|  | void test(Type Ty, const Address &address, const Immediate &imm); | 
|  |  | 
|  | void And(Type Ty, GPRRegister dst, GPRRegister src); | 
|  | void And(Type Ty, GPRRegister dst, const Address &address); | 
|  | void And(Type Ty, GPRRegister dst, const Immediate &imm); | 
|  | void And(Type Ty, const Address &address, GPRRegister reg); | 
|  | void And(Type Ty, const Address &address, const Immediate &imm); | 
|  |  | 
|  | void Or(Type Ty, GPRRegister dst, GPRRegister src); | 
|  | void Or(Type Ty, GPRRegister dst, const Address &address); | 
|  | void Or(Type Ty, GPRRegister dst, const Immediate &imm); | 
|  | void Or(Type Ty, const Address &address, GPRRegister reg); | 
|  | void Or(Type Ty, const Address &address, const Immediate &imm); | 
|  |  | 
|  | void Xor(Type Ty, GPRRegister dst, GPRRegister src); | 
|  | void Xor(Type Ty, GPRRegister dst, const Address &address); | 
|  | void Xor(Type Ty, GPRRegister dst, const Immediate &imm); | 
|  | void Xor(Type Ty, const Address &address, GPRRegister reg); | 
|  | void Xor(Type Ty, const Address &address, const Immediate &imm); | 
|  |  | 
|  | void add(Type Ty, GPRRegister dst, GPRRegister src); | 
|  | void add(Type Ty, GPRRegister reg, const Address &address); | 
|  | void add(Type Ty, GPRRegister reg, const Immediate &imm); | 
|  | void add(Type Ty, const Address &address, GPRRegister reg); | 
|  | void add(Type Ty, const Address &address, const Immediate &imm); | 
|  |  | 
|  | void adc(Type Ty, GPRRegister dst, GPRRegister src); | 
|  | void adc(Type Ty, GPRRegister dst, const Address &address); | 
|  | void adc(Type Ty, GPRRegister reg, const Immediate &imm); | 
|  | void adc(Type Ty, const Address &address, GPRRegister reg); | 
|  | void adc(Type Ty, const Address &address, const Immediate &imm); | 
|  |  | 
|  | void sub(Type Ty, GPRRegister dst, GPRRegister src); | 
|  | void sub(Type Ty, GPRRegister reg, const Address &address); | 
|  | void sub(Type Ty, GPRRegister reg, const Immediate &imm); | 
|  | void sub(Type Ty, const Address &address, GPRRegister reg); | 
|  | void sub(Type Ty, const Address &address, const Immediate &imm); | 
|  |  | 
|  | void sbb(Type Ty, GPRRegister dst, GPRRegister src); | 
|  | void sbb(Type Ty, GPRRegister reg, const Address &address); | 
|  | void sbb(Type Ty, GPRRegister reg, const Immediate &imm); | 
|  | void sbb(Type Ty, const Address &address, GPRRegister reg); | 
|  | void sbb(Type Ty, const Address &address, const Immediate &imm); | 
|  |  | 
|  | void cbw(); | 
|  | void cwd(); | 
|  | void cdq(); | 
|  | template <typename T = Traits> | 
|  | typename std::enable_if<T::Is64Bit, void>::type cqo(); | 
|  | template <typename T = Traits> | 
|  | typename std::enable_if<!T::Is64Bit, void>::type cqo() { | 
|  | llvm::report_fatal_error("CQO is only available in 64-bit x86 backends."); | 
|  | } | 
|  |  | 
|  | void div(Type Ty, GPRRegister reg); | 
|  | void div(Type Ty, const Address &address); | 
|  |  | 
|  | void idiv(Type Ty, GPRRegister reg); | 
|  | void idiv(Type Ty, const Address &address); | 
|  |  | 
|  | void imul(Type Ty, GPRRegister dst, GPRRegister src); | 
|  | void imul(Type Ty, GPRRegister reg, const Immediate &imm); | 
|  | void imul(Type Ty, GPRRegister reg, const Address &address); | 
|  |  | 
|  | void imul(Type Ty, GPRRegister reg); | 
|  | void imul(Type Ty, const Address &address); | 
|  |  | 
|  | void imul(Type Ty, GPRRegister dst, GPRRegister src, const Immediate &imm); | 
|  | void imul(Type Ty, GPRRegister dst, const Address &address, | 
|  | const Immediate &imm); | 
|  |  | 
|  | void mul(Type Ty, GPRRegister reg); | 
|  | void mul(Type Ty, const Address &address); | 
|  |  | 
|  | template <class T = Traits, | 
|  | typename = typename std::enable_if<!T::Is64Bit>::type> | 
|  | void incl(GPRRegister reg); | 
|  | void incl(const Address &address); | 
|  |  | 
|  | template <class T = Traits, | 
|  | typename = typename std::enable_if<!T::Is64Bit>::type> | 
|  | void decl(GPRRegister reg); | 
|  | void decl(const Address &address); | 
|  |  | 
|  | void rol(Type Ty, GPRRegister reg, const Immediate &imm); | 
|  | void rol(Type Ty, GPRRegister operand, GPRRegister shifter); | 
|  | void rol(Type Ty, const Address &operand, GPRRegister shifter); | 
|  |  | 
|  | void shl(Type Ty, GPRRegister reg, const Immediate &imm); | 
|  | void shl(Type Ty, GPRRegister operand, GPRRegister shifter); | 
|  | void shl(Type Ty, const Address &operand, GPRRegister shifter); | 
|  |  | 
|  | void shr(Type Ty, GPRRegister reg, const Immediate &imm); | 
|  | void shr(Type Ty, GPRRegister operand, GPRRegister shifter); | 
|  | void shr(Type Ty, const Address &operand, GPRRegister shifter); | 
|  |  | 
|  | void sar(Type Ty, GPRRegister reg, const Immediate &imm); | 
|  | void sar(Type Ty, GPRRegister operand, GPRRegister shifter); | 
|  | void sar(Type Ty, const Address &address, GPRRegister shifter); | 
|  |  | 
|  | void shld(Type Ty, GPRRegister dst, GPRRegister src); | 
|  | void shld(Type Ty, GPRRegister dst, GPRRegister src, const Immediate &imm); | 
|  | void shld(Type Ty, const Address &operand, GPRRegister src); | 
|  | void shrd(Type Ty, GPRRegister dst, GPRRegister src); | 
|  | void shrd(Type Ty, GPRRegister dst, GPRRegister src, const Immediate &imm); | 
|  | void shrd(Type Ty, const Address &dst, GPRRegister src); | 
|  |  | 
|  | void neg(Type Ty, GPRRegister reg); | 
|  | void neg(Type Ty, const Address &addr); | 
|  | void notl(GPRRegister reg); | 
|  |  | 
|  | void bsf(Type Ty, GPRRegister dst, GPRRegister src); | 
|  | void bsf(Type Ty, GPRRegister dst, const Address &src); | 
|  | void bsr(Type Ty, GPRRegister dst, GPRRegister src); | 
|  | void bsr(Type Ty, GPRRegister dst, const Address &src); | 
|  |  | 
|  | void bswap(Type Ty, GPRRegister reg); | 
|  |  | 
|  | void bt(GPRRegister base, GPRRegister offset); | 
|  |  | 
|  | void ret(); | 
|  | void ret(const Immediate &imm); | 
|  |  | 
|  | // 'size' indicates size in bytes and must be in the range 1..8. | 
|  | void nop(int size = 1); | 
|  | void int3(); | 
|  | void hlt(); | 
|  | void ud2(); | 
|  |  | 
|  | // j(Label) is fully tested. | 
|  | void j(BrCond condition, Label *label, bool near = kFarJump); | 
|  | void j(BrCond condition, const ConstantRelocatable *label); // not testable. | 
|  |  | 
|  | void jmp(GPRRegister reg); | 
|  | void jmp(Label *label, bool near = kFarJump); | 
|  | void jmp(const ConstantRelocatable *label); // not testable. | 
|  | void jmp(const Immediate &abs_address); | 
|  |  | 
|  | void mfence(); | 
|  |  | 
|  | void lock(); | 
|  | void cmpxchg(Type Ty, const Address &address, GPRRegister reg, bool Locked); | 
|  | void cmpxchg8b(const Address &address, bool Locked); | 
|  | void xadd(Type Ty, const Address &address, GPRRegister reg, bool Locked); | 
|  | void xchg(Type Ty, GPRRegister reg0, GPRRegister reg1); | 
|  | void xchg(Type Ty, const Address &address, GPRRegister reg); | 
|  |  | 
|  | /// \name Intel Architecture Code Analyzer markers. | 
|  | /// @{ | 
|  | void iaca_start(); | 
|  | void iaca_end(); | 
|  | /// @} | 
|  |  | 
|  | void emitSegmentOverride(uint8_t prefix); | 
|  |  | 
|  | intptr_t preferredLoopAlignment() { return 16; } | 
|  | void align(intptr_t alignment, intptr_t offset); | 
|  | void bind(Label *label); | 
|  |  | 
|  | intptr_t CodeSize() const { return Buffer.size(); } | 
|  |  | 
|  | protected: | 
|  | inline void emitUint8(uint8_t value); | 
|  |  | 
|  | private: | 
|  | ENABLE_MAKE_UNIQUE; | 
|  |  | 
|  | // EmidAddrSizeOverridePrefix directs the emission of the 0x67 prefix to | 
|  | // force 32-bit registers when accessing memory. This is only used in native | 
|  | // 64-bit. | 
|  | const bool EmitAddrSizeOverridePrefix; | 
|  |  | 
|  | static constexpr Type RexTypeIrrelevant = IceType_i32; | 
|  | static constexpr Type RexTypeForceRexW = IceType_i64; | 
|  | static constexpr GPRRegister RexRegIrrelevant = | 
|  | Traits::GPRRegister::Encoded_Reg_eax; | 
|  |  | 
|  | inline void emitInt16(int16_t value); | 
|  | inline void emitInt32(int32_t value); | 
|  | inline void emitRegisterOperand(int rm, int reg); | 
|  | template <typename RegType, typename RmType> | 
|  | inline void emitXmmRegisterOperand(RegType reg, RmType rm); | 
|  | inline void emitOperandSizeOverride(); | 
|  |  | 
|  | void emitOperand(int rm, const Operand &operand, RelocOffsetT Addend = 0); | 
|  | void emitImmediate(Type ty, const Immediate &imm); | 
|  | void emitComplexI8(int rm, const Operand &operand, | 
|  | const Immediate &immediate); | 
|  | void emitComplex(Type Ty, int rm, const Operand &operand, | 
|  | const Immediate &immediate); | 
|  | void emitLabel(Label *label, intptr_t instruction_size); | 
|  | void emitLabelLink(Label *label); | 
|  | void emitNearLabelLink(Label *label); | 
|  |  | 
|  | void emitGenericShift(int rm, Type Ty, GPRRegister reg, const Immediate &imm); | 
|  | void emitGenericShift(int rm, Type Ty, const Operand &operand, | 
|  | GPRRegister shifter); | 
|  |  | 
|  | using LabelVector = std::vector<Label *>; | 
|  | // A vector of pool-allocated x86 labels for CFG nodes. | 
|  | LabelVector CfgNodeLabels; | 
|  | // A vector of pool-allocated x86 labels for Local labels. | 
|  | LabelVector LocalLabels; | 
|  |  | 
|  | Label *getOrCreateLabel(SizeT Number, LabelVector &Labels); | 
|  |  | 
|  | void emitAddrSizeOverridePrefix() { | 
|  | if (!Traits::Is64Bit || !EmitAddrSizeOverridePrefix) { | 
|  | return; | 
|  | } | 
|  | static constexpr uint8_t AddrSizeOverridePrefix = 0x67; | 
|  | emitUint8(AddrSizeOverridePrefix); | 
|  | } | 
|  |  | 
|  | // The arith_int() methods factor out the commonality between the encodings | 
|  | // of add(), Or(), adc(), sbb(), And(), sub(), Xor(), and cmp(). The Tag | 
|  | // parameter is statically asserted to be less than 8. | 
|  | template <uint32_t Tag> | 
|  | void arith_int(Type Ty, GPRRegister reg, const Immediate &imm); | 
|  |  | 
|  | template <uint32_t Tag> | 
|  | void arith_int(Type Ty, GPRRegister reg0, GPRRegister reg1); | 
|  |  | 
|  | template <uint32_t Tag> | 
|  | void arith_int(Type Ty, GPRRegister reg, const Address &address); | 
|  |  | 
|  | template <uint32_t Tag> | 
|  | void arith_int(Type Ty, const Address &address, GPRRegister reg); | 
|  |  | 
|  | template <uint32_t Tag> | 
|  | void arith_int(Type Ty, const Address &address, const Immediate &imm); | 
|  |  | 
|  | // gprEncoding returns Reg encoding for operand emission. For x86-64 we mask | 
|  | // out the 4th bit as it is encoded in the REX.[RXB] bits. No other bits are | 
|  | // touched because we don't want to mask errors. | 
|  | template <typename RegType, typename T = Traits> | 
|  | typename std::enable_if<T::Is64Bit, typename T::GPRRegister>::type | 
|  | gprEncoding(const RegType Reg) { | 
|  | return static_cast<GPRRegister>(static_cast<uint8_t>(Reg) & ~0x08); | 
|  | } | 
|  |  | 
|  | template <typename RegType, typename T = Traits> | 
|  | typename std::enable_if<!T::Is64Bit, typename T::GPRRegister>::type | 
|  | gprEncoding(const RegType Reg) { | 
|  | return static_cast<typename T::GPRRegister>(Reg); | 
|  | } | 
|  |  | 
|  | template <typename RegType> | 
|  | bool is8BitRegisterRequiringRex(const Type Ty, const RegType Reg) { | 
|  | static constexpr bool IsGPR = | 
|  | std::is_same<typename std::decay<RegType>::type, ByteRegister>::value || | 
|  | std::is_same<typename std::decay<RegType>::type, GPRRegister>::value; | 
|  |  | 
|  | // At this point in the assembler, we have encoded regs, so it is not | 
|  | // possible to distinguish between the "new" low byte registers introduced | 
|  | // in x86-64 and the legacy [abcd]h registers. Because x86, we may still | 
|  | // see ah (div) in the assembler, so we whitelist it here. | 
|  | // | 
|  | // The "local" uint32_t Encoded_Reg_ah is needed because RegType is an | 
|  | // enum that is not necessarily the same type of | 
|  | // Traits::RegisterSet::Encoded_Reg_ah. | 
|  | constexpr uint32_t Encoded_Reg_ah = Traits::RegisterSet::Encoded_Reg_ah; | 
|  | return IsGPR && (Reg & 0x04) != 0 && (Reg & 0x08) == 0 && | 
|  | isByteSizedType(Ty) && (Reg != Encoded_Reg_ah); | 
|  | } | 
|  |  | 
|  | // assembleAndEmitRex is used for determining which (if any) rex prefix | 
|  | // should be emitted for the current instruction. It allows different types | 
|  | // for Reg and Rm because they could be of different types (e.g., in | 
|  | // mov[sz]x instructions.) If Addr is not nullptr, then Rm is ignored, and | 
|  | // Rex.B is determined by Addr instead. TyRm is still used to determine | 
|  | // Addr's size. | 
|  | template <typename RegType, typename RmType, typename T = Traits> | 
|  | typename std::enable_if<T::Is64Bit, void>::type | 
|  | assembleAndEmitRex(const Type TyReg, const RegType Reg, const Type TyRm, | 
|  | const RmType Rm, | 
|  | const typename T::Address *Addr = nullptr) { | 
|  | const uint8_t W = (TyReg == IceType_i64 || TyRm == IceType_i64) | 
|  | ? T::Operand::RexW | 
|  | : T::Operand::RexNone; | 
|  | const uint8_t R = (Reg & 0x08) ? T::Operand::RexR : T::Operand::RexNone; | 
|  | const uint8_t X = (Addr != nullptr) | 
|  | ? (typename T::Operand::RexBits)Addr->rexX() | 
|  | : T::Operand::RexNone; | 
|  | const uint8_t B = | 
|  | (Addr != nullptr) | 
|  | ? (typename T::Operand::RexBits)Addr->rexB() | 
|  | : (Rm & 0x08) ? T::Operand::RexB : T::Operand::RexNone; | 
|  | const uint8_t Prefix = W | R | X | B; | 
|  | if (Prefix != T::Operand::RexNone) { | 
|  | emitUint8(Prefix); | 
|  | } else if (is8BitRegisterRequiringRex(TyReg, Reg) || | 
|  | (Addr == nullptr && is8BitRegisterRequiringRex(TyRm, Rm))) { | 
|  | emitUint8(T::Operand::RexBase); | 
|  | } | 
|  | } | 
|  |  | 
|  | template <typename RegType, typename RmType, typename T = Traits> | 
|  | typename std::enable_if<!T::Is64Bit, void>::type | 
|  | assembleAndEmitRex(const Type, const RegType, const Type, const RmType, | 
|  | const typename T::Address * = nullptr) {} | 
|  |  | 
|  | // emitRexRB is used for emitting a Rex prefix instructions with two | 
|  | // explicit register operands in its mod-rm byte. | 
|  | template <typename RegType, typename RmType> | 
|  | void emitRexRB(const Type Ty, const RegType Reg, const RmType Rm) { | 
|  | assembleAndEmitRex(Ty, Reg, Ty, Rm); | 
|  | } | 
|  |  | 
|  | template <typename RegType, typename RmType> | 
|  | void emitRexRB(const Type TyReg, const RegType Reg, const Type TyRm, | 
|  | const RmType Rm) { | 
|  | assembleAndEmitRex(TyReg, Reg, TyRm, Rm); | 
|  | } | 
|  |  | 
|  | // emitRexB is used for emitting a Rex prefix if one is needed on encoding | 
|  | // the Reg field in an x86 instruction. It is invoked by the template when | 
|  | // Reg is the single register operand in the instruction (e.g., push Reg.) | 
|  | template <typename RmType> void emitRexB(const Type Ty, const RmType Rm) { | 
|  | emitRexRB(Ty, RexRegIrrelevant, Ty, Rm); | 
|  | } | 
|  |  | 
|  | // emitRex is used for emitting a Rex prefix for an address and a GPR. The | 
|  | // address may contain zero, one, or two registers. | 
|  | template <typename RegType> | 
|  | void emitRex(const Type Ty, const Address &Addr, const RegType Reg) { | 
|  | assembleAndEmitRex(Ty, Reg, Ty, RexRegIrrelevant, &Addr); | 
|  | } | 
|  |  | 
|  | template <typename RegType> | 
|  | void emitRex(const Type AddrTy, const Address &Addr, const Type TyReg, | 
|  | const RegType Reg) { | 
|  | assembleAndEmitRex(TyReg, Reg, AddrTy, RexRegIrrelevant, &Addr); | 
|  | } | 
|  | }; | 
|  |  | 
|  | template <typename TraitsType> | 
|  | inline void AssemblerX86Base<TraitsType>::emitUint8(uint8_t value) { | 
|  | Buffer.emit<uint8_t>(value); | 
|  | } | 
|  |  | 
|  | template <typename TraitsType> | 
|  | inline void AssemblerX86Base<TraitsType>::emitInt16(int16_t value) { | 
|  | Buffer.emit<int16_t>(value); | 
|  | } | 
|  |  | 
|  | template <typename TraitsType> | 
|  | inline void AssemblerX86Base<TraitsType>::emitInt32(int32_t value) { | 
|  | Buffer.emit<int32_t>(value); | 
|  | } | 
|  |  | 
|  | template <typename TraitsType> | 
|  | inline void AssemblerX86Base<TraitsType>::emitRegisterOperand(int reg, int rm) { | 
|  | assert(reg >= 0 && reg < 8); | 
|  | assert(rm >= 0 && rm < 8); | 
|  | Buffer.emit<uint8_t>(0xC0 + (reg << 3) + rm); | 
|  | } | 
|  |  | 
|  | template <typename TraitsType> | 
|  | template <typename RegType, typename RmType> | 
|  | inline void AssemblerX86Base<TraitsType>::emitXmmRegisterOperand(RegType reg, | 
|  | RmType rm) { | 
|  | emitRegisterOperand(gprEncoding(reg), gprEncoding(rm)); | 
|  | } | 
|  |  | 
|  | template <typename TraitsType> | 
|  | inline void AssemblerX86Base<TraitsType>::emitOperandSizeOverride() { | 
|  | emitUint8(0x66); | 
|  | } | 
|  |  | 
|  | } // end of namespace X86NAMESPACE | 
|  |  | 
|  | } // end of namespace Ice | 
|  |  | 
|  | #include "IceAssemblerX86BaseImpl.h" | 
|  |  | 
|  | #endif // SUBZERO_SRC_ICEASSEMBLERX86BASE_H |