//===- subzero/src/IceAssemblerX86Base.h - base x86 assembler -*- C++ -*---===// // // Copyright (c) 2013, the Dart project authors. Please see the AUTHORS file // for details. All rights reserved. Use of this source code is governed by a // BSD-style license that can be found in the LICENSE file. // // Modified by the Subzero authors. // //===----------------------------------------------------------------------===// // // The Subzero Code Generator // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // /// \file /// \brief Defines the AssemblerX86 template class for x86, the base of all X86 /// assemblers. // //===----------------------------------------------------------------------===// #ifndef SUBZERO_SRC_ICEASSEMBLERX86BASE_H #define SUBZERO_SRC_ICEASSEMBLERX86BASE_H #include "IceAssembler.h" #include "IceDefs.h" #include "IceOperand.h" #include "IceTypes.h" #include "IceUtils.h" namespace Ice { #ifndef X86NAMESPACE #error "You must define the X86 Target namespace." #endif namespace X86NAMESPACE { template <typename TraitsType> class AssemblerX86Base : public ::Ice::Assembler { AssemblerX86Base(const AssemblerX86Base &) = delete; AssemblerX86Base &operator=(const AssemblerX86Base &) = delete; protected: explicit AssemblerX86Base( bool EmitAddrSizeOverridePrefix = TraitsType::Is64Bit) : Assembler(Traits::AsmKind), EmitAddrSizeOverridePrefix(EmitAddrSizeOverridePrefix) { assert(Traits::Is64Bit || !EmitAddrSizeOverridePrefix); } public: using Traits = TraitsType; using Address = typename Traits::Address; using ByteRegister = typename Traits::ByteRegister; using BrCond = typename Traits::Cond::BrCond; using CmppsCond = typename Traits::Cond::CmppsCond; using GPRRegister = typename Traits::GPRRegister; using Operand = typename Traits::Operand; using XmmRegister = typename Traits::XmmRegister; static constexpr int MAX_NOP_SIZE = 8; static bool classof(const Assembler *Asm) { return Asm->getKind() == Traits::AsmKind; } class Immediate { Immediate(const Immediate &) = delete; Immediate &operator=(const Immediate &) = delete; public: explicit Immediate(int32_t value) : value_(value) {} explicit Immediate(AssemblerFixup *fixup) : fixup_(fixup) {} int32_t value() const { return value_; } AssemblerFixup *fixup() const { return fixup_; } bool is_int8() const { // We currently only allow 32-bit fixups, and they usually have value = 0, // so if fixup_ != nullptr, it shouldn't be classified as int8/16. return fixup_ == nullptr && Utils::IsInt(8, value_); } bool is_uint8() const { return fixup_ == nullptr && Utils::IsUint(8, value_); } bool is_uint16() const { return fixup_ == nullptr && Utils::IsUint(16, value_); } private: const int32_t value_ = 0; AssemblerFixup *fixup_ = nullptr; }; /// X86 allows near and far jumps. class Label final : public Ice::Label { Label(const Label &) = delete; Label &operator=(const Label &) = delete; public: Label() = default; ~Label() = default; void finalCheck() const override { Ice::Label::finalCheck(); assert(!hasNear()); } /// Returns the position of an earlier branch instruction which assumes that /// this label is "near", and bumps iterator to the next near position. intptr_t getNearPosition() { assert(hasNear()); intptr_t Pos = UnresolvedNearPositions.back(); UnresolvedNearPositions.pop_back(); return Pos; } bool hasNear() const { return !UnresolvedNearPositions.empty(); } bool isUnused() const override { return Ice::Label::isUnused() && !hasNear(); } private: friend class AssemblerX86Base<TraitsType>; void nearLinkTo(const Assembler &Asm, intptr_t position) { if (Asm.getPreliminary()) return; assert(!isBound()); UnresolvedNearPositions.push_back(position); } llvm::SmallVector<intptr_t, 20> UnresolvedNearPositions; }; public: ~AssemblerX86Base() override; static const bool kNearJump = true; static const bool kFarJump = false; void alignFunction() override; SizeT getBundleAlignLog2Bytes() const override { return 5; } const char *getAlignDirective() const override { return ".p2align"; } llvm::ArrayRef<uint8_t> getNonExecBundlePadding() const override { static const uint8_t Padding[] = {0xF4}; return llvm::ArrayRef<uint8_t>(Padding, 1); } void padWithNop(intptr_t Padding) override { while (Padding > MAX_NOP_SIZE) { nop(MAX_NOP_SIZE); Padding -= MAX_NOP_SIZE; } if (Padding) nop(Padding); } Ice::Label *getCfgNodeLabel(SizeT NodeNumber) override; void bindCfgNodeLabel(const CfgNode *Node) override; Label *getOrCreateCfgNodeLabel(SizeT Number); Label *getOrCreateLocalLabel(SizeT Number); void bindLocalLabel(SizeT Number); bool fixupIsPCRel(FixupKind Kind) const override { // Currently assuming this is the only PC-rel relocation type used. // TODO(jpp): Traits.PcRelTypes.count(Kind) != 0 return Kind == Traits::FK_PcRel; } // Operations to emit GPR instructions (and dispatch on operand type). using TypedEmitGPR = void (AssemblerX86Base::*)(Type, GPRRegister); using TypedEmitAddr = void (AssemblerX86Base::*)(Type, const Address &); struct GPREmitterOneOp { TypedEmitGPR Reg; TypedEmitAddr Addr; }; using TypedEmitGPRGPR = void (AssemblerX86Base::*)(Type, GPRRegister, GPRRegister); using TypedEmitGPRAddr = void (AssemblerX86Base::*)(Type, GPRRegister, const Address &); using TypedEmitGPRImm = void (AssemblerX86Base::*)(Type, GPRRegister, const Immediate &); struct GPREmitterRegOp { TypedEmitGPRGPR GPRGPR; TypedEmitGPRAddr GPRAddr; TypedEmitGPRImm GPRImm; }; struct GPREmitterShiftOp { // Technically, Addr/GPR and Addr/Imm are also allowed, but */Addr are // not. In practice, we always normalize the Dest to a Register first. TypedEmitGPRGPR GPRGPR; TypedEmitGPRImm GPRImm; }; using TypedEmitGPRGPRImm = void (AssemblerX86Base::*)(Type, GPRRegister, GPRRegister, const Immediate &); struct GPREmitterShiftD { // Technically AddrGPR and AddrGPRImm are also allowed, but in practice we // always normalize Dest to a Register first. TypedEmitGPRGPR GPRGPR; TypedEmitGPRGPRImm GPRGPRImm; }; using TypedEmitAddrGPR = void (AssemblerX86Base::*)(Type, const Address &, GPRRegister); using TypedEmitAddrImm = void (AssemblerX86Base::*)(Type, const Address &, const Immediate &); struct GPREmitterAddrOp { TypedEmitAddrGPR AddrGPR; TypedEmitAddrImm AddrImm; }; // Operations to emit XMM instructions (and dispatch on operand type). using TypedEmitXmmXmm = void (AssemblerX86Base::*)(Type, XmmRegister, XmmRegister); using TypedEmitXmmAddr = void (AssemblerX86Base::*)(Type, XmmRegister, const Address &); struct XmmEmitterRegOp { TypedEmitXmmXmm XmmXmm; TypedEmitXmmAddr XmmAddr; }; using EmitXmmXmm = void (AssemblerX86Base::*)(XmmRegister, XmmRegister); using EmitXmmAddr = void (AssemblerX86Base::*)(XmmRegister, const Address &); using EmitAddrXmm = void (AssemblerX86Base::*)(const Address &, XmmRegister); struct XmmEmitterMovOps { EmitXmmXmm XmmXmm; EmitXmmAddr XmmAddr; EmitAddrXmm AddrXmm; }; using TypedEmitXmmImm = void (AssemblerX86Base::*)(Type, XmmRegister, const Immediate &); struct XmmEmitterShiftOp { TypedEmitXmmXmm XmmXmm; TypedEmitXmmAddr XmmAddr; TypedEmitXmmImm XmmImm; }; // Cross Xmm/GPR cast instructions. template <typename DReg_t, typename SReg_t> struct CastEmitterRegOp { using TypedEmitRegs = void (AssemblerX86Base::*)(Type, DReg_t, Type, SReg_t); using TypedEmitAddr = void (AssemblerX86Base::*)(Type, DReg_t, Type, const Address &); TypedEmitRegs RegReg; TypedEmitAddr RegAddr; }; // Three operand (potentially) cross Xmm/GPR instructions. The last operand // must be an immediate. template <typename DReg_t, typename SReg_t> struct ThreeOpImmEmitter { using TypedEmitRegRegImm = void (AssemblerX86Base::*)(Type, DReg_t, SReg_t, const Immediate &); using TypedEmitRegAddrImm = void (AssemblerX86Base::*)(Type, DReg_t, const Address &, const Immediate &); TypedEmitRegRegImm RegRegImm; TypedEmitRegAddrImm RegAddrImm; }; /* * Emit Machine Instructions. */ void call(GPRRegister reg); void call(const Address &address); void call(const ConstantRelocatable *label); // not testable. void call(const Immediate &abs_address); static const intptr_t kCallExternalLabelSize = 5; void pushl(GPRRegister reg); void pushl(const Immediate &Imm); void pushl(const ConstantRelocatable *Label); void popl(GPRRegister reg); void popl(const Address &address); template <typename T = Traits, typename = typename std::enable_if<T::HasPusha>::type> void pushal(); template <typename T = Traits, typename = typename std::enable_if<T::HasPopa>::type> void popal(); void setcc(BrCond condition, ByteRegister dst); void setcc(BrCond condition, const Address &address); void mov(Type Ty, GPRRegister dst, const Immediate &src); void mov(Type Ty, GPRRegister dst, GPRRegister src); void mov(Type Ty, GPRRegister dst, const Address &src); void mov(Type Ty, const Address &dst, GPRRegister src); void mov(Type Ty, const Address &dst, const Immediate &imm); template <typename T = Traits> typename std::enable_if<T::Is64Bit, void>::type movabs(const GPRRegister Dst, uint64_t Imm64); template <typename T = Traits> typename std::enable_if<!T::Is64Bit, void>::type movabs(const GPRRegister, uint64_t) { llvm::report_fatal_error("movabs is only supported in 64-bit x86 targets."); } void movzx(Type Ty, GPRRegister dst, GPRRegister src); void movzx(Type Ty, GPRRegister dst, const Address &src); void movsx(Type Ty, GPRRegister dst, GPRRegister src); void movsx(Type Ty, GPRRegister dst, const Address &src); void lea(Type Ty, GPRRegister dst, const Address &src); void cmov(Type Ty, BrCond cond, GPRRegister dst, GPRRegister src); void cmov(Type Ty, BrCond cond, GPRRegister dst, const Address &src); void rep_movsb(); void movss(Type Ty, XmmRegister dst, const Address &src); void movss(Type Ty, const Address &dst, XmmRegister src); void movss(Type Ty, XmmRegister dst, XmmRegister src); void movd(Type SrcTy, XmmRegister dst, GPRRegister src); void movd(Type SrcTy, XmmRegister dst, const Address &src); void movd(Type DestTy, GPRRegister dst, XmmRegister src); void movd(Type DestTy, const Address &dst, XmmRegister src); void movq(XmmRegister dst, XmmRegister src); void movq(const Address &dst, XmmRegister src); void movq(XmmRegister dst, const Address &src); void addss(Type Ty, XmmRegister dst, XmmRegister src); void addss(Type Ty, XmmRegister dst, const Address &src); void subss(Type Ty, XmmRegister dst, XmmRegister src); void subss(Type Ty, XmmRegister dst, const Address &src); void mulss(Type Ty, XmmRegister dst, XmmRegister src); void mulss(Type Ty, XmmRegister dst, const Address &src); void divss(Type Ty, XmmRegister dst, XmmRegister src); void divss(Type Ty, XmmRegister dst, const Address &src); void movaps(XmmRegister dst, XmmRegister src); void movups(XmmRegister dst, XmmRegister src); void movups(XmmRegister dst, const Address &src); void movups(const Address &dst, XmmRegister src); void padd(Type Ty, XmmRegister dst, XmmRegister src); void padd(Type Ty, XmmRegister dst, const Address &src); void padds(Type Ty, XmmRegister dst, XmmRegister src); void padds(Type Ty, XmmRegister dst, const Address &src); void paddus(Type Ty, XmmRegister dst, XmmRegister src); void paddus(Type Ty, XmmRegister dst, const Address &src); void pand(Type Ty, XmmRegister dst, XmmRegister src); void pand(Type Ty, XmmRegister dst, const Address &src); void pandn(Type Ty, XmmRegister dst, XmmRegister src); void pandn(Type Ty, XmmRegister dst, const Address &src); void pmull(Type Ty, XmmRegister dst, XmmRegister src); void pmull(Type Ty, XmmRegister dst, const Address &src); void pmulhw(Type Ty, XmmRegister dst, XmmRegister src); void pmulhw(Type Ty, XmmRegister dst, const Address &src); void pmulhuw(Type Ty, XmmRegister dst, XmmRegister src); void pmulhuw(Type Ty, XmmRegister dst, const Address &src); void pmaddwd(Type Ty, XmmRegister dst, XmmRegister src); void pmaddwd(Type Ty, XmmRegister dst, const Address &src); void pmuludq(Type Ty, XmmRegister dst, XmmRegister src); void pmuludq(Type Ty, XmmRegister dst, const Address &src); void por(Type Ty, XmmRegister dst, XmmRegister src); void por(Type Ty, XmmRegister dst, const Address &src); void psub(Type Ty, XmmRegister dst, XmmRegister src); void psub(Type Ty, XmmRegister dst, const Address &src); void psubs(Type Ty, XmmRegister dst, XmmRegister src); void psubs(Type Ty, XmmRegister dst, const Address &src); void psubus(Type Ty, XmmRegister dst, XmmRegister src); void psubus(Type Ty, XmmRegister dst, const Address &src); void pxor(Type Ty, XmmRegister dst, XmmRegister src); void pxor(Type Ty, XmmRegister dst, const Address &src); void psll(Type Ty, XmmRegister dst, XmmRegister src); void psll(Type Ty, XmmRegister dst, const Address &src); void psll(Type Ty, XmmRegister dst, const Immediate &src); void psra(Type Ty, XmmRegister dst, XmmRegister src); void psra(Type Ty, XmmRegister dst, const Address &src); void psra(Type Ty, XmmRegister dst, const Immediate &src); void psrl(Type Ty, XmmRegister dst, XmmRegister src); void psrl(Type Ty, XmmRegister dst, const Address &src); void psrl(Type Ty, XmmRegister dst, const Immediate &src); void addps(Type Ty, XmmRegister dst, XmmRegister src); void addps(Type Ty, XmmRegister dst, const Address &src); void subps(Type Ty, XmmRegister dst, XmmRegister src); void subps(Type Ty, XmmRegister dst, const Address &src); void divps(Type Ty, XmmRegister dst, XmmRegister src); void divps(Type Ty, XmmRegister dst, const Address &src); void mulps(Type Ty, XmmRegister dst, XmmRegister src); void mulps(Type Ty, XmmRegister dst, const Address &src); void minps(Type Ty, XmmRegister dst, const Address &src); void minps(Type Ty, XmmRegister dst, XmmRegister src); void minss(Type Ty, XmmRegister dst, const Address &src); void minss(Type Ty, XmmRegister dst, XmmRegister src); void maxps(Type Ty, XmmRegister dst, const Address &src); void maxps(Type Ty, XmmRegister dst, XmmRegister src); void maxss(Type Ty, XmmRegister dst, const Address &src); void maxss(Type Ty, XmmRegister dst, XmmRegister src); void andnps(Type Ty, XmmRegister dst, const Address &src); void andnps(Type Ty, XmmRegister dst, XmmRegister src); void andps(Type Ty, XmmRegister dst, const Address &src); void andps(Type Ty, XmmRegister dst, XmmRegister src); void orps(Type Ty, XmmRegister dst, const Address &src); void orps(Type Ty, XmmRegister dst, XmmRegister src); void blendvps(Type Ty, XmmRegister dst, XmmRegister src); void blendvps(Type Ty, XmmRegister dst, const Address &src); void pblendvb(Type Ty, XmmRegister dst, XmmRegister src); void pblendvb(Type Ty, XmmRegister dst, const Address &src); void cmpps(Type Ty, XmmRegister dst, XmmRegister src, CmppsCond CmpCondition); void cmpps(Type Ty, XmmRegister dst, const Address &src, CmppsCond CmpCondition); void sqrtps(XmmRegister dst); void rsqrtps(XmmRegister dst); void reciprocalps(XmmRegister dst); void movhlps(XmmRegister dst, XmmRegister src); void movlhps(XmmRegister dst, XmmRegister src); void unpcklps(XmmRegister dst, XmmRegister src); void unpckhps(XmmRegister dst, XmmRegister src); void unpcklpd(XmmRegister dst, XmmRegister src); void unpckhpd(XmmRegister dst, XmmRegister src); void set1ps(XmmRegister dst, GPRRegister tmp, const Immediate &imm); void sqrtpd(XmmRegister dst); void pshufb(Type Ty, XmmRegister dst, XmmRegister src); void pshufb(Type Ty, XmmRegister dst, const Address &src); void pshufd(Type Ty, XmmRegister dst, XmmRegister src, const Immediate &mask); void pshufd(Type Ty, XmmRegister dst, const Address &src, const Immediate &mask); void punpckl(Type Ty, XmmRegister Dst, XmmRegister Src); void punpckl(Type Ty, XmmRegister Dst, const Address &Src); void punpckh(Type Ty, XmmRegister Dst, XmmRegister Src); void punpckh(Type Ty, XmmRegister Dst, const Address &Src); void packss(Type Ty, XmmRegister Dst, XmmRegister Src); void packss(Type Ty, XmmRegister Dst, const Address &Src); void packus(Type Ty, XmmRegister Dst, XmmRegister Src); void packus(Type Ty, XmmRegister Dst, const Address &Src); void shufps(Type Ty, XmmRegister dst, XmmRegister src, const Immediate &mask); void shufps(Type Ty, XmmRegister dst, const Address &src, const Immediate &mask); void cvtdq2ps(Type, XmmRegister dst, XmmRegister src); void cvtdq2ps(Type, XmmRegister dst, const Address &src); void cvttps2dq(Type, XmmRegister dst, XmmRegister src); void cvttps2dq(Type, XmmRegister dst, const Address &src); void cvtps2dq(Type, XmmRegister dst, XmmRegister src); void cvtps2dq(Type, XmmRegister dst, const Address &src); void cvtsi2ss(Type DestTy, XmmRegister dst, Type SrcTy, GPRRegister src); void cvtsi2ss(Type DestTy, XmmRegister dst, Type SrcTy, const Address &src); void cvtfloat2float(Type SrcTy, XmmRegister dst, XmmRegister src); void cvtfloat2float(Type SrcTy, XmmRegister dst, const Address &src); void cvttss2si(Type DestTy, GPRRegister dst, Type SrcTy, XmmRegister src); void cvttss2si(Type DestTy, GPRRegister dst, Type SrcTy, const Address &src); void cvtss2si(Type DestTy, GPRRegister dst, Type SrcTy, XmmRegister src); void cvtss2si(Type DestTy, GPRRegister dst, Type SrcTy, const Address &src); void ucomiss(Type Ty, XmmRegister a, XmmRegister b); void ucomiss(Type Ty, XmmRegister a, const Address &b); void movmsk(Type Ty, GPRRegister dst, XmmRegister src); void sqrt(Type Ty, XmmRegister dst, const Address &src); void sqrt(Type Ty, XmmRegister dst, XmmRegister src); void xorps(Type Ty, XmmRegister dst, const Address &src); void xorps(Type Ty, XmmRegister dst, XmmRegister src); void insertps(Type Ty, XmmRegister dst, XmmRegister src, const Immediate &imm); void insertps(Type Ty, XmmRegister dst, const Address &src, const Immediate &imm); void pinsr(Type Ty, XmmRegister dst, GPRRegister src, const Immediate &imm); void pinsr(Type Ty, XmmRegister dst, const Address &src, const Immediate &imm); void pextr(Type Ty, GPRRegister dst, XmmRegister src, const Immediate &imm); void pmovsxdq(XmmRegister dst, XmmRegister src); void pcmpeq(Type Ty, XmmRegister dst, XmmRegister src); void pcmpeq(Type Ty, XmmRegister dst, const Address &src); void pcmpgt(Type Ty, XmmRegister dst, XmmRegister src); void pcmpgt(Type Ty, XmmRegister dst, const Address &src); enum RoundingMode { kRoundToNearest = 0x0, kRoundDown = 0x1, kRoundUp = 0x2, kRoundToZero = 0x3 }; void round(Type Ty, XmmRegister dst, XmmRegister src, const Immediate &mode); void round(Type Ty, XmmRegister dst, const Address &src, const Immediate &mode); //---------------------------------------------------------------------------- // // Begin: X87 instructions. Only available when Traits::UsesX87. // //---------------------------------------------------------------------------- template <typename T = Traits, typename = typename std::enable_if<T::UsesX87>::type> void fld(Type Ty, const typename T::Address &src); template <typename T = Traits, typename = typename std::enable_if<T::UsesX87>::type> void fstp(Type Ty, const typename T::Address &dst); template <typename T = Traits, typename = typename std::enable_if<T::UsesX87>::type> void fstp(typename T::X87STRegister st); template <typename T = Traits, typename = typename std::enable_if<T::UsesX87>::type> void fnstcw(const typename T::Address &dst); template <typename T = Traits, typename = typename std::enable_if<T::UsesX87>::type> void fldcw(const typename T::Address &src); template <typename T = Traits, typename = typename std::enable_if<T::UsesX87>::type> void fistpl(const typename T::Address &dst); template <typename T = Traits, typename = typename std::enable_if<T::UsesX87>::type> void fistps(const typename T::Address &dst); template <typename T = Traits, typename = typename std::enable_if<T::UsesX87>::type> void fildl(const typename T::Address &src); template <typename T = Traits, typename = typename std::enable_if<T::UsesX87>::type> void filds(const typename T::Address &src); template <typename T = Traits, typename = typename std::enable_if<T::UsesX87>::type> void fincstp(); //---------------------------------------------------------------------------- // // End: X87 instructions. // //---------------------------------------------------------------------------- void cmp(Type Ty, GPRRegister reg0, GPRRegister reg1); void cmp(Type Ty, GPRRegister reg, const Address &address); void cmp(Type Ty, GPRRegister reg, const Immediate &imm); void cmp(Type Ty, const Address &address, GPRRegister reg); void cmp(Type Ty, const Address &address, const Immediate &imm); void test(Type Ty, GPRRegister reg0, GPRRegister reg1); void test(Type Ty, GPRRegister reg, const Immediate &imm); void test(Type Ty, const Address &address, GPRRegister reg); void test(Type Ty, const Address &address, const Immediate &imm); void And(Type Ty, GPRRegister dst, GPRRegister src); void And(Type Ty, GPRRegister dst, const Address &address); void And(Type Ty, GPRRegister dst, const Immediate &imm); void And(Type Ty, const Address &address, GPRRegister reg); void And(Type Ty, const Address &address, const Immediate &imm); void Or(Type Ty, GPRRegister dst, GPRRegister src); void Or(Type Ty, GPRRegister dst, const Address &address); void Or(Type Ty, GPRRegister dst, const Immediate &imm); void Or(Type Ty, const Address &address, GPRRegister reg); void Or(Type Ty, const Address &address, const Immediate &imm); void Xor(Type Ty, GPRRegister dst, GPRRegister src); void Xor(Type Ty, GPRRegister dst, const Address &address); void Xor(Type Ty, GPRRegister dst, const Immediate &imm); void Xor(Type Ty, const Address &address, GPRRegister reg); void Xor(Type Ty, const Address &address, const Immediate &imm); void add(Type Ty, GPRRegister dst, GPRRegister src); void add(Type Ty, GPRRegister reg, const Address &address); void add(Type Ty, GPRRegister reg, const Immediate &imm); void add(Type Ty, const Address &address, GPRRegister reg); void add(Type Ty, const Address &address, const Immediate &imm); void adc(Type Ty, GPRRegister dst, GPRRegister src); void adc(Type Ty, GPRRegister dst, const Address &address); void adc(Type Ty, GPRRegister reg, const Immediate &imm); void adc(Type Ty, const Address &address, GPRRegister reg); void adc(Type Ty, const Address &address, const Immediate &imm); void sub(Type Ty, GPRRegister dst, GPRRegister src); void sub(Type Ty, GPRRegister reg, const Address &address); void sub(Type Ty, GPRRegister reg, const Immediate &imm); void sub(Type Ty, const Address &address, GPRRegister reg); void sub(Type Ty, const Address &address, const Immediate &imm); void sbb(Type Ty, GPRRegister dst, GPRRegister src); void sbb(Type Ty, GPRRegister reg, const Address &address); void sbb(Type Ty, GPRRegister reg, const Immediate &imm); void sbb(Type Ty, const Address &address, GPRRegister reg); void sbb(Type Ty, const Address &address, const Immediate &imm); void cbw(); void cwd(); void cdq(); template <typename T = Traits> typename std::enable_if<T::Is64Bit, void>::type cqo(); template <typename T = Traits> typename std::enable_if<!T::Is64Bit, void>::type cqo() { llvm::report_fatal_error("CQO is only available in 64-bit x86 backends."); } void div(Type Ty, GPRRegister reg); void div(Type Ty, const Address &address); void idiv(Type Ty, GPRRegister reg); void idiv(Type Ty, const Address &address); void imul(Type Ty, GPRRegister dst, GPRRegister src); void imul(Type Ty, GPRRegister reg, const Immediate &imm); void imul(Type Ty, GPRRegister reg, const Address &address); void imul(Type Ty, GPRRegister reg); void imul(Type Ty, const Address &address); void imul(Type Ty, GPRRegister dst, GPRRegister src, const Immediate &imm); void imul(Type Ty, GPRRegister dst, const Address &address, const Immediate &imm); void mul(Type Ty, GPRRegister reg); void mul(Type Ty, const Address &address); template <class T = Traits, typename = typename std::enable_if<!T::Is64Bit>::type> void incl(GPRRegister reg); void incl(const Address &address); template <class T = Traits, typename = typename std::enable_if<!T::Is64Bit>::type> void decl(GPRRegister reg); void decl(const Address &address); void rol(Type Ty, GPRRegister reg, const Immediate &imm); void rol(Type Ty, GPRRegister operand, GPRRegister shifter); void rol(Type Ty, const Address &operand, GPRRegister shifter); void shl(Type Ty, GPRRegister reg, const Immediate &imm); void shl(Type Ty, GPRRegister operand, GPRRegister shifter); void shl(Type Ty, const Address &operand, GPRRegister shifter); void shr(Type Ty, GPRRegister reg, const Immediate &imm); void shr(Type Ty, GPRRegister operand, GPRRegister shifter); void shr(Type Ty, const Address &operand, GPRRegister shifter); void sar(Type Ty, GPRRegister reg, const Immediate &imm); void sar(Type Ty, GPRRegister operand, GPRRegister shifter); void sar(Type Ty, const Address &address, GPRRegister shifter); void shld(Type Ty, GPRRegister dst, GPRRegister src); void shld(Type Ty, GPRRegister dst, GPRRegister src, const Immediate &imm); void shld(Type Ty, const Address &operand, GPRRegister src); void shrd(Type Ty, GPRRegister dst, GPRRegister src); void shrd(Type Ty, GPRRegister dst, GPRRegister src, const Immediate &imm); void shrd(Type Ty, const Address &dst, GPRRegister src); void neg(Type Ty, GPRRegister reg); void neg(Type Ty, const Address &addr); void notl(GPRRegister reg); void bsf(Type Ty, GPRRegister dst, GPRRegister src); void bsf(Type Ty, GPRRegister dst, const Address &src); void bsr(Type Ty, GPRRegister dst, GPRRegister src); void bsr(Type Ty, GPRRegister dst, const Address &src); void bswap(Type Ty, GPRRegister reg); void bt(GPRRegister base, GPRRegister offset); void ret(); void ret(const Immediate &imm); // 'size' indicates size in bytes and must be in the range 1..8. void nop(int size = 1); void int3(); void hlt(); void ud2(); // j(Label) is fully tested. void j(BrCond condition, Label *label, bool near = kFarJump); void j(BrCond condition, const ConstantRelocatable *label); // not testable. void jmp(GPRRegister reg); void jmp(Label *label, bool near = kFarJump); void jmp(const ConstantRelocatable *label); // not testable. void jmp(const Immediate &abs_address); void mfence(); void lock(); void cmpxchg(Type Ty, const Address &address, GPRRegister reg, bool Locked); void cmpxchg8b(const Address &address, bool Locked); void xadd(Type Ty, const Address &address, GPRRegister reg, bool Locked); void xchg(Type Ty, GPRRegister reg0, GPRRegister reg1); void xchg(Type Ty, const Address &address, GPRRegister reg); /// \name Intel Architecture Code Analyzer markers. /// @{ void iaca_start(); void iaca_end(); /// @} void emitSegmentOverride(uint8_t prefix); intptr_t preferredLoopAlignment() { return 16; } void align(intptr_t alignment, intptr_t offset); void bind(Label *label); intptr_t CodeSize() const { return Buffer.size(); } protected: inline void emitUint8(uint8_t value); private: ENABLE_MAKE_UNIQUE; // EmidAddrSizeOverridePrefix directs the emission of the 0x67 prefix to // force 32-bit registers when accessing memory. This is only used in native // 64-bit. const bool EmitAddrSizeOverridePrefix; static constexpr Type RexTypeIrrelevant = IceType_i32; static constexpr Type RexTypeForceRexW = IceType_i64; static constexpr GPRRegister RexRegIrrelevant = Traits::GPRRegister::Encoded_Reg_eax; inline void emitInt16(int16_t value); inline void emitInt32(int32_t value); inline void emitRegisterOperand(int rm, int reg); template <typename RegType, typename RmType> inline void emitXmmRegisterOperand(RegType reg, RmType rm); inline void emitOperandSizeOverride(); void emitOperand(int rm, const Operand &operand, RelocOffsetT Addend = 0); void emitImmediate(Type ty, const Immediate &imm); void emitComplexI8(int rm, const Operand &operand, const Immediate &immediate); void emitComplex(Type Ty, int rm, const Operand &operand, const Immediate &immediate); void emitLabel(Label *label, intptr_t instruction_size); void emitLabelLink(Label *label); void emitNearLabelLink(Label *label); void emitGenericShift(int rm, Type Ty, GPRRegister reg, const Immediate &imm); void emitGenericShift(int rm, Type Ty, const Operand &operand, GPRRegister shifter); using LabelVector = std::vector<Label *>; // A vector of pool-allocated x86 labels for CFG nodes. LabelVector CfgNodeLabels; // A vector of pool-allocated x86 labels for Local labels. LabelVector LocalLabels; Label *getOrCreateLabel(SizeT Number, LabelVector &Labels); void emitAddrSizeOverridePrefix() { if (!Traits::Is64Bit || !EmitAddrSizeOverridePrefix) { return; } static constexpr uint8_t AddrSizeOverridePrefix = 0x67; emitUint8(AddrSizeOverridePrefix); } // The arith_int() methods factor out the commonality between the encodings // of add(), Or(), adc(), sbb(), And(), sub(), Xor(), and cmp(). The Tag // parameter is statically asserted to be less than 8. template <uint32_t Tag> void arith_int(Type Ty, GPRRegister reg, const Immediate &imm); template <uint32_t Tag> void arith_int(Type Ty, GPRRegister reg0, GPRRegister reg1); template <uint32_t Tag> void arith_int(Type Ty, GPRRegister reg, const Address &address); template <uint32_t Tag> void arith_int(Type Ty, const Address &address, GPRRegister reg); template <uint32_t Tag> void arith_int(Type Ty, const Address &address, const Immediate &imm); // gprEncoding returns Reg encoding for operand emission. For x86-64 we mask // out the 4th bit as it is encoded in the REX.[RXB] bits. No other bits are // touched because we don't want to mask errors. template <typename RegType, typename T = Traits> typename std::enable_if<T::Is64Bit, typename T::GPRRegister>::type gprEncoding(const RegType Reg) { return static_cast<GPRRegister>(static_cast<uint8_t>(Reg) & ~0x08); } template <typename RegType, typename T = Traits> typename std::enable_if<!T::Is64Bit, typename T::GPRRegister>::type gprEncoding(const RegType Reg) { return static_cast<typename T::GPRRegister>(Reg); } template <typename RegType> bool is8BitRegisterRequiringRex(const Type Ty, const RegType Reg) { static constexpr bool IsGPR = std::is_same<typename std::decay<RegType>::type, ByteRegister>::value || std::is_same<typename std::decay<RegType>::type, GPRRegister>::value; // At this point in the assembler, we have encoded regs, so it is not // possible to distinguish between the "new" low byte registers introduced // in x86-64 and the legacy [abcd]h registers. Because x86, we may still // see ah (div) in the assembler, so we whitelist it here. // // The "local" uint32_t Encoded_Reg_ah is needed because RegType is an // enum that is not necessarily the same type of // Traits::RegisterSet::Encoded_Reg_ah. constexpr uint32_t Encoded_Reg_ah = Traits::RegisterSet::Encoded_Reg_ah; return IsGPR && (Reg & 0x04) != 0 && (Reg & 0x08) == 0 && isByteSizedType(Ty) && (Reg != Encoded_Reg_ah); } // assembleAndEmitRex is used for determining which (if any) rex prefix // should be emitted for the current instruction. It allows different types // for Reg and Rm because they could be of different types (e.g., in // mov[sz]x instructions.) If Addr is not nullptr, then Rm is ignored, and // Rex.B is determined by Addr instead. TyRm is still used to determine // Addr's size. template <typename RegType, typename RmType, typename T = Traits> typename std::enable_if<T::Is64Bit, void>::type assembleAndEmitRex(const Type TyReg, const RegType Reg, const Type TyRm, const RmType Rm, const typename T::Address *Addr = nullptr) { const uint8_t W = (TyReg == IceType_i64 || TyRm == IceType_i64) ? T::Operand::RexW : T::Operand::RexNone; const uint8_t R = (Reg & 0x08) ? T::Operand::RexR : T::Operand::RexNone; const uint8_t X = (Addr != nullptr) ? (typename T::Operand::RexBits)Addr->rexX() : T::Operand::RexNone; const uint8_t B = (Addr != nullptr) ? (typename T::Operand::RexBits)Addr->rexB() : (Rm & 0x08) ? T::Operand::RexB : T::Operand::RexNone; const uint8_t Prefix = W | R | X | B; if (Prefix != T::Operand::RexNone) { emitUint8(Prefix); } else if (is8BitRegisterRequiringRex(TyReg, Reg) || (Addr == nullptr && is8BitRegisterRequiringRex(TyRm, Rm))) { emitUint8(T::Operand::RexBase); } } template <typename RegType, typename RmType, typename T = Traits> typename std::enable_if<!T::Is64Bit, void>::type assembleAndEmitRex(const Type, const RegType, const Type, const RmType, const typename T::Address * = nullptr) {} // emitRexRB is used for emitting a Rex prefix instructions with two // explicit register operands in its mod-rm byte. template <typename RegType, typename RmType> void emitRexRB(const Type Ty, const RegType Reg, const RmType Rm) { assembleAndEmitRex(Ty, Reg, Ty, Rm); } template <typename RegType, typename RmType> void emitRexRB(const Type TyReg, const RegType Reg, const Type TyRm, const RmType Rm) { assembleAndEmitRex(TyReg, Reg, TyRm, Rm); } // emitRexB is used for emitting a Rex prefix if one is needed on encoding // the Reg field in an x86 instruction. It is invoked by the template when // Reg is the single register operand in the instruction (e.g., push Reg.) template <typename RmType> void emitRexB(const Type Ty, const RmType Rm) { emitRexRB(Ty, RexRegIrrelevant, Ty, Rm); } // emitRex is used for emitting a Rex prefix for an address and a GPR. The // address may contain zero, one, or two registers. template <typename RegType> void emitRex(const Type Ty, const Address &Addr, const RegType Reg) { assembleAndEmitRex(Ty, Reg, Ty, RexRegIrrelevant, &Addr); } template <typename RegType> void emitRex(const Type AddrTy, const Address &Addr, const Type TyReg, const RegType Reg) { assembleAndEmitRex(TyReg, Reg, AddrTy, RexRegIrrelevant, &Addr); } }; template <typename TraitsType> inline void AssemblerX86Base<TraitsType>::emitUint8(uint8_t value) { Buffer.emit<uint8_t>(value); } template <typename TraitsType> inline void AssemblerX86Base<TraitsType>::emitInt16(int16_t value) { Buffer.emit<int16_t>(value); } template <typename TraitsType> inline void AssemblerX86Base<TraitsType>::emitInt32(int32_t value) { Buffer.emit<int32_t>(value); } template <typename TraitsType> inline void AssemblerX86Base<TraitsType>::emitRegisterOperand(int reg, int rm) { assert(reg >= 0 && reg < 8); assert(rm >= 0 && rm < 8); Buffer.emit<uint8_t>(0xC0 + (reg << 3) + rm); } template <typename TraitsType> template <typename RegType, typename RmType> inline void AssemblerX86Base<TraitsType>::emitXmmRegisterOperand(RegType reg, RmType rm) { emitRegisterOperand(gprEncoding(reg), gprEncoding(rm)); } template <typename TraitsType> inline void AssemblerX86Base<TraitsType>::emitOperandSizeOverride() { emitUint8(0x66); } } // end of namespace X86NAMESPACE } // end of namespace Ice #include "IceAssemblerX86BaseImpl.h" #endif // SUBZERO_SRC_ICEASSEMBLERX86BASE_H