/*
* Copyright (C) 2011 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#ifndef ART_RUNTIME_DEX_INSTRUCTION_H_
#define ART_RUNTIME_DEX_INSTRUCTION_H_
#include "base/logging.h"
#include "base/macros.h"
#include "globals.h"
typedef uint8_t uint4_t;
typedef int8_t int4_t;
namespace art {
class DexFile;
enum {
kNumPackedOpcodes = 0x100
};
class Instruction {
public:
// NOP-encoded switch-statement signatures.
enum Signatures {
kPackedSwitchSignature = 0x0100,
kSparseSwitchSignature = 0x0200,
kArrayDataSignature = 0x0300,
};
struct PACKED(4) PackedSwitchPayload {
const uint16_t ident;
const uint16_t case_count;
const int32_t first_key;
const int32_t targets[];
private:
DISALLOW_COPY_AND_ASSIGN(PackedSwitchPayload);
};
struct PACKED(4) SparseSwitchPayload {
const uint16_t ident;
const uint16_t case_count;
const int32_t keys_and_targets[];
public:
const int32_t* GetKeys() const {
return keys_and_targets;
}
const int32_t* GetTargets() const {
return keys_and_targets + case_count;
}
private:
DISALLOW_COPY_AND_ASSIGN(SparseSwitchPayload);
};
struct PACKED(4) ArrayDataPayload {
const uint16_t ident;
const uint16_t element_width;
const uint32_t element_count;
const uint8_t data[];
private:
DISALLOW_COPY_AND_ASSIGN(ArrayDataPayload);
};
enum Code { // private marker to avoid generate-operator-out.py from processing.
#define INSTRUCTION_ENUM(opcode, cname, p, f, r, i, a, v) cname = opcode,
#include "dex_instruction_list.h"
DEX_INSTRUCTION_LIST(INSTRUCTION_ENUM)
#undef DEX_INSTRUCTION_LIST
#undef INSTRUCTION_ENUM
RSUB_INT_LIT16 = RSUB_INT,
};
enum Format {
k10x, // op
k12x, // op vA, vB
k11n, // op vA, #+B
k11x, // op vAA
k10t, // op +AA
k20t, // op +AAAA
k22x, // op vAA, vBBBB
k21t, // op vAA, +BBBB
k21s, // op vAA, #+BBBB
k21h, // op vAA, #+BBBB00000[00000000]
k21c, // op vAA, thing@BBBB
k23x, // op vAA, vBB, vCC
k22b, // op vAA, vBB, #+CC
k22t, // op vA, vB, +CCCC
k22s, // op vA, vB, #+CCCC
k22c, // op vA, vB, thing@CCCC
k32x, // op vAAAA, vBBBB
k30t, // op +AAAAAAAA
k31t, // op vAA, +BBBBBBBB
k31i, // op vAA, #+BBBBBBBB
k31c, // op vAA, thing@BBBBBBBB
k35c, // op {vC, vD, vE, vF, vG}, thing@BBBB (B: count, A: vG)
k3rc, // op {vCCCC .. v(CCCC+AA-1)}, meth@BBBB
k51l, // op vAA, #+BBBBBBBBBBBBBBBB
};
enum Flags {
kBranch = 0x000001, // conditional or unconditional branch
kContinue = 0x000002, // flow can continue to next statement
kSwitch = 0x000004, // switch statement
kThrow = 0x000008, // could cause an exception to be thrown
kReturn = 0x000010, // returns, no additional statements
kInvoke = 0x000020, // a flavor of invoke
kUnconditional = 0x000040, // unconditional branch
kAdd = 0x000080, // addition
kSubtract = 0x000100, // subtract
kMultiply = 0x000200, // multiply
kDivide = 0x000400, // division
kRemainder = 0x000800, // remainder
kAnd = 0x001000, // and
kOr = 0x002000, // or
kXor = 0x004000, // xor
kShl = 0x008000, // shl
kShr = 0x010000, // shr
kUshr = 0x020000, // ushr
kCast = 0x040000, // cast
kStore = 0x080000, // store opcode
kLoad = 0x100000, // load opcode
kClobber = 0x200000, // clobbers memory in a big way (not just a write)
kRegCFieldOrConstant = 0x400000, // is the third virtual register a field or literal constant (vC)
kRegBFieldOrConstant = 0x800000, // is the second virtual register a field or literal constant (vB)
};
enum VerifyFlag {
kVerifyNone = 0x000000,
kVerifyRegA = 0x000001,
kVerifyRegAWide = 0x000002,
kVerifyRegB = 0x000004,
kVerifyRegBField = 0x000008,
kVerifyRegBMethod = 0x000010,
kVerifyRegBNewInstance = 0x000020,
kVerifyRegBString = 0x000040,
kVerifyRegBType = 0x000080,
kVerifyRegBWide = 0x000100,
kVerifyRegC = 0x000200,
kVerifyRegCField = 0x000400,
kVerifyRegCNewArray = 0x000800,
kVerifyRegCType = 0x001000,
kVerifyRegCWide = 0x002000,
kVerifyArrayData = 0x004000,
kVerifyBranchTarget = 0x008000,
kVerifySwitchTargets = 0x010000,
kVerifyVarArg = 0x020000,
kVerifyVarArgNonZero = 0x040000,
kVerifyVarArgRange = 0x080000,
kVerifyVarArgRangeNonZero = 0x100000,
kVerifyRuntimeOnly = 0x200000,
kVerifyError = 0x400000,
};
static constexpr uint32_t kMaxVarArgRegs = 5;
// Returns the size (in 2 byte code units) of this instruction.
size_t SizeInCodeUnits() const {
int result = kInstructionSizeInCodeUnits[Opcode()];
if (UNLIKELY(result < 0)) {
return SizeInCodeUnitsComplexOpcode();
} else {
return static_cast<size_t>(result);
}
}
// Reads an instruction out of the stream at the specified address.
static const Instruction* At(const uint16_t* code) {
DCHECK(code != nullptr);
return reinterpret_cast<const Instruction*>(code);
}
// Reads an instruction out of the stream from the current address plus an offset.
const Instruction* RelativeAt(int32_t offset) const WARN_UNUSED {
return At(reinterpret_cast<const uint16_t*>(this) + offset);
}
// Returns a pointer to the next instruction in the stream.
const Instruction* Next() const {
return RelativeAt(SizeInCodeUnits());
}
// Returns a pointer to the instruction after this 1xx instruction in the stream.
const Instruction* Next_1xx() const {
DCHECK(FormatOf(Opcode()) >= k10x && FormatOf(Opcode()) <= k10t);
return RelativeAt(1);
}
// Returns a pointer to the instruction after this 2xx instruction in the stream.
const Instruction* Next_2xx() const {
DCHECK(FormatOf(Opcode()) >= k20t && FormatOf(Opcode()) <= k22c);
return RelativeAt(2);
}
// Returns a pointer to the instruction after this 3xx instruction in the stream.
const Instruction* Next_3xx() const {
DCHECK(FormatOf(Opcode()) >= k32x && FormatOf(Opcode()) <= k3rc);
return RelativeAt(3);
}
// Returns a pointer to the instruction after this 51l instruction in the stream.
const Instruction* Next_51l() const {
DCHECK(FormatOf(Opcode()) == k51l);
return RelativeAt(5);
}
// Returns the name of this instruction's opcode.
const char* Name() const {
return Instruction::Name(Opcode());
}
// Returns the name of the given opcode.
static const char* Name(Code opcode) {
return kInstructionNames[opcode];
}
// VRegA
bool HasVRegA() const;
int32_t VRegA() const;
int8_t VRegA_10t() const {
return VRegA_10t(Fetch16(0));
}
uint8_t VRegA_10x() const {
return VRegA_10x(Fetch16(0));
}
uint4_t VRegA_11n() const {
return VRegA_11n(Fetch16(0));
}
uint8_t VRegA_11x() const {
return VRegA_11x(Fetch16(0));
}
uint4_t VRegA_12x() const {
return VRegA_12x(Fetch16(0));
}
int16_t VRegA_20t() const;
uint8_t VRegA_21c() const {
return VRegA_21c(Fetch16(0));
}
uint8_t VRegA_21h() const {
return VRegA_21h(Fetch16(0));
}
uint8_t VRegA_21s() const {
return VRegA_21s(Fetch16(0));
}
uint8_t VRegA_21t() const {
return VRegA_21t(Fetch16(0));
}
uint8_t VRegA_22b() const {
return VRegA_22b(Fetch16(0));
}
uint4_t VRegA_22c() const {
return VRegA_22c(Fetch16(0));
}
uint4_t VRegA_22s() const {
return VRegA_22s(Fetch16(0));
}
uint4_t VRegA_22t() const {
return VRegA_22t(Fetch16(0));
}
uint8_t VRegA_22x() const {
return VRegA_22x(Fetch16(0));
}
uint8_t VRegA_23x() const {
return VRegA_23x(Fetch16(0));
}
int32_t VRegA_30t() const;
uint8_t VRegA_31c() const {
return VRegA_31c(Fetch16(0));
}
uint8_t VRegA_31i() const {
return VRegA_31i(Fetch16(0));
}
uint8_t VRegA_31t() const {
return VRegA_31t(Fetch16(0));
}
uint16_t VRegA_32x() const;
uint4_t VRegA_35c() const {
return VRegA_35c(Fetch16(0));
}
uint8_t VRegA_3rc() const {
return VRegA_3rc(Fetch16(0));
}
uint8_t VRegA_51l() const {
return VRegA_51l(Fetch16(0));
}
// The following methods return the vA operand for various instruction formats. The "inst_data"
// parameter holds the first 16 bits of instruction which the returned value is decoded from.
int8_t VRegA_10t(uint16_t inst_data) const;
uint8_t VRegA_10x(uint16_t inst_data) const;
uint4_t VRegA_11n(uint16_t inst_data) const;
uint8_t VRegA_11x(uint16_t inst_data) const;
uint4_t VRegA_12x(uint16_t inst_data) const;
uint8_t VRegA_21c(uint16_t inst_data) const;
uint8_t VRegA_21h(uint16_t inst_data) const;
uint8_t VRegA_21s(uint16_t inst_data) const;
uint8_t VRegA_21t(uint16_t inst_data) const;
uint8_t VRegA_22b(uint16_t inst_data) const;
uint4_t VRegA_22c(uint16_t inst_data) const;
uint4_t VRegA_22s(uint16_t inst_data) const;
uint4_t VRegA_22t(uint16_t inst_data) const;
uint8_t VRegA_22x(uint16_t inst_data) const;
uint8_t VRegA_23x(uint16_t inst_data) const;
uint8_t VRegA_31c(uint16_t inst_data) const;
uint8_t VRegA_31i(uint16_t inst_data) const;
uint8_t VRegA_31t(uint16_t inst_data) const;
uint4_t VRegA_35c(uint16_t inst_data) const;
uint8_t VRegA_3rc(uint16_t inst_data) const;
uint8_t VRegA_51l(uint16_t inst_data) const;
// VRegB
bool HasVRegB() const;
int32_t VRegB() const;
bool HasWideVRegB() const;
uint64_t WideVRegB() const;
int4_t VRegB_11n() const {
return VRegB_11n(Fetch16(0));
}
uint4_t VRegB_12x() const {
return VRegB_12x(Fetch16(0));
}
uint16_t VRegB_21c() const;
uint16_t VRegB_21h() const;
int16_t VRegB_21s() const;
int16_t VRegB_21t() const;
uint8_t VRegB_22b() const;
uint4_t VRegB_22c() const {
return VRegB_22c(Fetch16(0));
}
uint4_t VRegB_22s() const {
return VRegB_22s(Fetch16(0));
}
uint4_t VRegB_22t() const {
return VRegB_22t(Fetch16(0));
}
uint16_t VRegB_22x() const;
uint8_t VRegB_23x() const;
uint32_t VRegB_31c() const;
int32_t VRegB_31i() const;
int32_t VRegB_31t() const;
uint16_t VRegB_32x() const;
uint16_t VRegB_35c() const;
uint16_t VRegB_3rc() const;
uint64_t VRegB_51l() const; // vB_wide
// The following methods return the vB operand for all instruction formats where it is encoded in
// the first 16 bits of instruction. The "inst_data" parameter holds these 16 bits. The returned
// value is decoded from it.
int4_t VRegB_11n(uint16_t inst_data) const;
uint4_t VRegB_12x(uint16_t inst_data) const;
uint4_t VRegB_22c(uint16_t inst_data) const;
uint4_t VRegB_22s(uint16_t inst_data) const;
uint4_t VRegB_22t(uint16_t inst_data) const;
// VRegC
bool HasVRegC() const;
int32_t VRegC() const;
int8_t VRegC_22b() const;
uint16_t VRegC_22c() const;
int16_t VRegC_22s() const;
int16_t VRegC_22t() const;
uint8_t VRegC_23x() const;
uint4_t VRegC_35c() const;
uint16_t VRegC_3rc() const;
// Fills the given array with the 'arg' array of the instruction.
bool HasVarArgs() const;
void GetVarArgs(uint32_t args[kMaxVarArgRegs], uint16_t inst_data) const;
void GetVarArgs(uint32_t args[kMaxVarArgRegs]) const {
return GetVarArgs(args, Fetch16(0));
}
// Returns the opcode field of the instruction. The given "inst_data" parameter must be the first
// 16 bits of instruction.
Code Opcode(uint16_t inst_data) const {
DCHECK_EQ(inst_data, Fetch16(0));
return static_cast<Code>(inst_data & 0xFF);
}
// Returns the opcode field of the instruction from the first 16 bits of instruction.
Code Opcode() const {
return Opcode(Fetch16(0));
}
void SetOpcode(Code opcode) {
DCHECK_LT(static_cast<uint16_t>(opcode), 256u);
uint16_t* insns = reinterpret_cast<uint16_t*>(this);
insns[0] = (insns[0] & 0xff00) | static_cast<uint16_t>(opcode);
}
void SetVRegA_10x(uint8_t val) {
DCHECK(FormatOf(Opcode()) == k10x);
uint16_t* insns = reinterpret_cast<uint16_t*>(this);
insns[0] = (val << 8) | (insns[0] & 0x00ff);
}
void SetVRegB_3rc(uint16_t val) {
DCHECK(FormatOf(Opcode()) == k3rc);
uint16_t* insns = reinterpret_cast<uint16_t*>(this);
insns[1] = val;
}
void SetVRegB_35c(uint16_t val) {
DCHECK(FormatOf(Opcode()) == k35c);
uint16_t* insns = reinterpret_cast<uint16_t*>(this);
insns[1] = val;
}
void SetVRegC_22c(uint16_t val) {
DCHECK(FormatOf(Opcode()) == k22c);
uint16_t* insns = reinterpret_cast<uint16_t*>(this);
insns[1] = val;
}
// Returns the format of the given opcode.
static Format FormatOf(Code opcode) {
return kInstructionFormats[opcode];
}
// Returns the flags for the given opcode.
static int FlagsOf(Code opcode) {
return kInstructionFlags[opcode];
}
// Return the verify flags for the given opcode.
static int VerifyFlagsOf(Code opcode) {
return kInstructionVerifyFlags[opcode];
}
// Returns true if this instruction is a branch.
bool IsBranch() const {
return (kInstructionFlags[Opcode()] & kBranch) != 0;
}
// Returns true if this instruction is a unconditional branch.
bool IsUnconditional() const {
return (kInstructionFlags[Opcode()] & kUnconditional) != 0;
}
// Returns the branch offset if this instruction is a branch.
int32_t GetTargetOffset() const;
// Returns true if the instruction allows control flow to go to the following instruction.
bool CanFlowThrough() const;
// Returns true if this instruction is a switch.
bool IsSwitch() const {
return (kInstructionFlags[Opcode()] & kSwitch) != 0;
}
// Returns true if this instruction can throw.
bool IsThrow() const {
return (kInstructionFlags[Opcode()] & kThrow) != 0;
}
// Determine if the instruction is any of 'return' instructions.
bool IsReturn() const {
return (kInstructionFlags[Opcode()] & kReturn) != 0;
}
// Determine if this instruction ends execution of its basic block.
bool IsBasicBlockEnd() const {
return IsBranch() || IsReturn() || Opcode() == THROW;
}
// Determine if this instruction is an invoke.
bool IsInvoke() const {
return (kInstructionFlags[Opcode()] & kInvoke) != 0;
}
int GetVerifyTypeArgumentA() const {
return (kInstructionVerifyFlags[Opcode()] & (kVerifyRegA | kVerifyRegAWide));
}
int GetVerifyTypeArgumentB() const {
return (kInstructionVerifyFlags[Opcode()] & (kVerifyRegB | kVerifyRegBField |
kVerifyRegBMethod | kVerifyRegBNewInstance | kVerifyRegBString | kVerifyRegBType |
kVerifyRegBWide));
}
int GetVerifyTypeArgumentC() const {
return (kInstructionVerifyFlags[Opcode()] & (kVerifyRegC | kVerifyRegCField |
kVerifyRegCNewArray | kVerifyRegCType | kVerifyRegCWide));
}
int GetVerifyExtraFlags() const {
return (kInstructionVerifyFlags[Opcode()] & (kVerifyArrayData | kVerifyBranchTarget |
kVerifySwitchTargets | kVerifyVarArg | kVerifyVarArgNonZero | kVerifyVarArgRange |
kVerifyVarArgRangeNonZero | kVerifyError));
}
bool GetVerifyIsRuntimeOnly() const {
return (kInstructionVerifyFlags[Opcode()] & kVerifyRuntimeOnly) != 0;
}
// Get the dex PC of this instruction as a offset in code units from the beginning of insns.
uint32_t GetDexPc(const uint16_t* insns) const {
return (reinterpret_cast<const uint16_t*>(this) - insns);
}
// Dump decoded version of instruction
std::string DumpString(const DexFile*) const;
// Dump code_units worth of this instruction, padding to code_units for shorter instructions
std::string DumpHex(size_t code_units) const;
// Little-endian dump code_units worth of this instruction, padding to code_units for
// shorter instructions
std::string DumpHexLE(size_t instr_code_units) const;
uint16_t Fetch16(size_t offset) const {
const uint16_t* insns = reinterpret_cast<const uint16_t*>(this);
return insns[offset];
}
private:
size_t SizeInCodeUnitsComplexOpcode() const;
uint32_t Fetch32(size_t offset) const {
return (Fetch16(offset) | ((uint32_t) Fetch16(offset + 1) << 16));
}
uint4_t InstA() const {
return InstA(Fetch16(0));
}
uint4_t InstB() const {
return InstB(Fetch16(0));
}
uint8_t InstAA() const {
return InstAA(Fetch16(0));
}
uint4_t InstA(uint16_t inst_data) const {
DCHECK_EQ(inst_data, Fetch16(0));
return static_cast<uint4_t>((inst_data >> 8) & 0x0f);
}
uint4_t InstB(uint16_t inst_data) const {
DCHECK_EQ(inst_data, Fetch16(0));
return static_cast<uint4_t>(inst_data >> 12);
}
uint8_t InstAA(uint16_t inst_data) const {
DCHECK_EQ(inst_data, Fetch16(0));
return static_cast<uint8_t>(inst_data >> 8);
}
static const char* const kInstructionNames[];
static Format const kInstructionFormats[];
static int const kInstructionFlags[];
static int const kInstructionVerifyFlags[];
static int const kInstructionSizeInCodeUnits[];
DISALLOW_IMPLICIT_CONSTRUCTORS(Instruction);
};
std::ostream& operator<<(std::ostream& os, const Instruction::Code& code);
std::ostream& operator<<(std::ostream& os, const Instruction::Format& format);
std::ostream& operator<<(std::ostream& os, const Instruction::Flags& flags);
std::ostream& operator<<(std::ostream& os, const Instruction::VerifyFlag& vflags);
} // namespace art
#endif // ART_RUNTIME_DEX_INSTRUCTION_H_