diff options
Diffstat (limited to 'capstone/arch/ARM/ARMBaseInfo.h')
-rw-r--r-- | capstone/arch/ARM/ARMBaseInfo.h | 486 |
1 files changed, 486 insertions, 0 deletions
diff --git a/capstone/arch/ARM/ARMBaseInfo.h b/capstone/arch/ARM/ARMBaseInfo.h new file mode 100644 index 000000000..b7279569f --- /dev/null +++ b/capstone/arch/ARM/ARMBaseInfo.h @@ -0,0 +1,486 @@ +//===-- ARMBaseInfo.h - Top level definitions for ARM -------- --*- C++ -*-===// +// +// The LLVM Compiler Infrastructure +// +// This file is distributed under the University of Illinois Open Source +// License. See LICENSE.TXT for details. +// +//===----------------------------------------------------------------------===// +// +// This file contains small standalone helper functions and enum definitions for +// the ARM target useful for the compiler back-end and the MC libraries. +// As such, it deliberately does not include references to LLVM core +// code gen types, passes, etc.. +// +//===----------------------------------------------------------------------===// + +/* Capstone Disassembly Engine */ +/* By Nguyen Anh Quynh <aquynh@gmail.com>, 2013-2019 */ + +#ifndef CS_ARMBASEINFO_H +#define CS_ARMBASEINFO_H + +#include "capstone/arm.h" + +// Defines symbolic names for ARM registers. This defines a mapping from +// register name to register number. +// +#define GET_REGINFO_ENUM +#include "ARMGenRegisterInfo.inc" + +// Enums corresponding to ARM condition codes +// The CondCodes constants map directly to the 4-bit encoding of the +// condition field for predicated instructions. +typedef enum ARMCC_CondCodes { // Meaning (integer) Meaning (floating-point) + ARMCC_EQ, // Equal Equal + ARMCC_NE, // Not equal Not equal, or unordered + ARMCC_HS, // Carry set >, ==, or unordered + ARMCC_LO, // Carry clear Less than + ARMCC_MI, // Minus, negative Less than + ARMCC_PL, // Plus, positive or zero >, ==, or unordered + ARMCC_VS, // Overflow Unordered + ARMCC_VC, // No overflow Not unordered + ARMCC_HI, // Unsigned higher Greater than, or unordered + ARMCC_LS, // Unsigned lower or same Less than or equal + ARMCC_GE, // Greater than or equal Greater than or equal + ARMCC_LT, // Less than Less than, or unordered + ARMCC_GT, // Greater than Greater than + ARMCC_LE, // Less than or equal <, ==, or unordered + ARMCC_AL // Always (unconditional) Always (unconditional) +} ARMCC_CondCodes; + +inline static ARMCC_CondCodes ARMCC_getOppositeCondition(ARMCC_CondCodes CC) +{ + switch (CC) { + case ARMCC_EQ: return ARMCC_NE; + case ARMCC_NE: return ARMCC_EQ; + case ARMCC_HS: return ARMCC_LO; + case ARMCC_LO: return ARMCC_HS; + case ARMCC_MI: return ARMCC_PL; + case ARMCC_PL: return ARMCC_MI; + case ARMCC_VS: return ARMCC_VC; + case ARMCC_VC: return ARMCC_VS; + case ARMCC_HI: return ARMCC_LS; + case ARMCC_LS: return ARMCC_HI; + case ARMCC_GE: return ARMCC_LT; + case ARMCC_LT: return ARMCC_GE; + case ARMCC_GT: return ARMCC_LE; + case ARMCC_LE: return ARMCC_GT; + default: return ARMCC_AL; + } +} + +inline static const char *ARMCC_ARMCondCodeToString(ARMCC_CondCodes CC) +{ + switch (CC) { + case ARMCC_EQ: return "eq"; + case ARMCC_NE: return "ne"; + case ARMCC_HS: return "hs"; + case ARMCC_LO: return "lo"; + case ARMCC_MI: return "mi"; + case ARMCC_PL: return "pl"; + case ARMCC_VS: return "vs"; + case ARMCC_VC: return "vc"; + case ARMCC_HI: return "hi"; + case ARMCC_LS: return "ls"; + case ARMCC_GE: return "ge"; + case ARMCC_LT: return "lt"; + case ARMCC_GT: return "gt"; + case ARMCC_LE: return "le"; + case ARMCC_AL: return "al"; + default: return ""; + } +} + +inline static const char *ARM_PROC_IFlagsToString(unsigned val) +{ + switch (val) { + case ARM_CPSFLAG_F: return "f"; + case ARM_CPSFLAG_I: return "i"; + case ARM_CPSFLAG_A: return "a"; + default: return ""; + } +} + +inline static const char *ARM_PROC_IModToString(unsigned val) +{ + switch (val) { + case ARM_CPSMODE_IE: return "ie"; + case ARM_CPSMODE_ID: return "id"; + default: return ""; + } +} + +inline static const char *ARM_MB_MemBOptToString(unsigned val, bool HasV8) +{ + // TODO: add details + switch (val + 1) { + default: return "BUGBUG"; + case ARM_MB_SY: return "sy"; + case ARM_MB_ST: return "st"; + case ARM_MB_LD: return HasV8 ? "ld" : "#0xd"; + case ARM_MB_RESERVED_12: return "#0xc"; + case ARM_MB_ISH: return "ish"; + case ARM_MB_ISHST: return "ishst"; + case ARM_MB_ISHLD: return HasV8 ? "ishld" : "#9"; + case ARM_MB_RESERVED_8: return "#8"; + case ARM_MB_NSH: return "nsh"; + case ARM_MB_NSHST: return "nshst"; + case ARM_MB_NSHLD: return HasV8 ? "nshld" : "#5"; + case ARM_MB_RESERVED_4: return "#4"; + case ARM_MB_OSH: return "osh"; + case ARM_MB_OSHST: return "oshst"; + case ARM_MB_OSHLD: return HasV8 ? "oshld" : "#1"; + case ARM_MB_RESERVED_0: return "#0"; + } +} + +enum ARM_ISB_InstSyncBOpt { + ARM_ISB_RESERVED_0 = 0, + ARM_ISB_RESERVED_1 = 1, + ARM_ISB_RESERVED_2 = 2, + ARM_ISB_RESERVED_3 = 3, + ARM_ISB_RESERVED_4 = 4, + ARM_ISB_RESERVED_5 = 5, + ARM_ISB_RESERVED_6 = 6, + ARM_ISB_RESERVED_7 = 7, + ARM_ISB_RESERVED_8 = 8, + ARM_ISB_RESERVED_9 = 9, + ARM_ISB_RESERVED_10 = 10, + ARM_ISB_RESERVED_11 = 11, + ARM_ISB_RESERVED_12 = 12, + ARM_ISB_RESERVED_13 = 13, + ARM_ISB_RESERVED_14 = 14, + ARM_ISB_SY = 15 +}; + +inline static const char *ARM_ISB_InstSyncBOptToString(unsigned val) +{ + switch (val) { + default: // never reach + case ARM_ISB_RESERVED_0: return "#0x0"; + case ARM_ISB_RESERVED_1: return "#0x1"; + case ARM_ISB_RESERVED_2: return "#0x2"; + case ARM_ISB_RESERVED_3: return "#0x3"; + case ARM_ISB_RESERVED_4: return "#0x4"; + case ARM_ISB_RESERVED_5: return "#0x5"; + case ARM_ISB_RESERVED_6: return "#0x6"; + case ARM_ISB_RESERVED_7: return "#0x7"; + case ARM_ISB_RESERVED_8: return "#0x8"; + case ARM_ISB_RESERVED_9: return "#0x9"; + case ARM_ISB_RESERVED_10: return "#0xa"; + case ARM_ISB_RESERVED_11: return "#0xb"; + case ARM_ISB_RESERVED_12: return "#0xc"; + case ARM_ISB_RESERVED_13: return "#0xd"; + case ARM_ISB_RESERVED_14: return "#0xe"; + case ARM_ISB_SY: return "sy"; + } +} + +/// isARMLowRegister - Returns true if the register is a low register (r0-r7). +/// +static inline bool isARMLowRegister(unsigned Reg) +{ + //using namespace ARM; + switch (Reg) { + case ARM_R0: case ARM_R1: case ARM_R2: case ARM_R3: + case ARM_R4: case ARM_R5: case ARM_R6: case ARM_R7: + return true; + default: + return false; + } +} + +/// ARMII - This namespace holds all of the target specific flags that +/// instruction info tracks. +/// +/// ARM Index Modes +enum ARMII_IndexMode { + ARMII_IndexModeNone = 0, + ARMII_IndexModePre = 1, + ARMII_IndexModePost = 2, + ARMII_IndexModeUpd = 3 +}; + +/// ARM Addressing Modes +typedef enum ARMII_AddrMode { + ARMII_AddrModeNone = 0, + ARMII_AddrMode1 = 1, + ARMII_AddrMode2 = 2, + ARMII_AddrMode3 = 3, + ARMII_AddrMode4 = 4, + ARMII_AddrMode5 = 5, + ARMII_AddrMode6 = 6, + ARMII_AddrModeT1_1 = 7, + ARMII_AddrModeT1_2 = 8, + ARMII_AddrModeT1_4 = 9, + ARMII_AddrModeT1_s = 10, // i8 * 4 for pc and sp relative data + ARMII_AddrModeT2_i12 = 11, + ARMII_AddrModeT2_i8 = 12, + ARMII_AddrModeT2_so = 13, + ARMII_AddrModeT2_pc = 14, // +/- i12 for pc relative data + ARMII_AddrModeT2_i8s4 = 15, // i8 * 4 + ARMII_AddrMode_i12 = 16 +} ARMII_AddrMode; + +inline static const char *ARMII_AddrModeToString(ARMII_AddrMode addrmode) +{ + switch (addrmode) { + case ARMII_AddrModeNone: return "AddrModeNone"; + case ARMII_AddrMode1: return "AddrMode1"; + case ARMII_AddrMode2: return "AddrMode2"; + case ARMII_AddrMode3: return "AddrMode3"; + case ARMII_AddrMode4: return "AddrMode4"; + case ARMII_AddrMode5: return "AddrMode5"; + case ARMII_AddrMode6: return "AddrMode6"; + case ARMII_AddrModeT1_1: return "AddrModeT1_1"; + case ARMII_AddrModeT1_2: return "AddrModeT1_2"; + case ARMII_AddrModeT1_4: return "AddrModeT1_4"; + case ARMII_AddrModeT1_s: return "AddrModeT1_s"; + case ARMII_AddrModeT2_i12: return "AddrModeT2_i12"; + case ARMII_AddrModeT2_i8: return "AddrModeT2_i8"; + case ARMII_AddrModeT2_so: return "AddrModeT2_so"; + case ARMII_AddrModeT2_pc: return "AddrModeT2_pc"; + case ARMII_AddrModeT2_i8s4: return "AddrModeT2_i8s4"; + case ARMII_AddrMode_i12: return "AddrMode_i12"; + } +} + +/// Target Operand Flag enum. +enum ARMII_TOF { + //===------------------------------------------------------------------===// + // ARM Specific MachineOperand flags. + + ARMII_MO_NO_FLAG, + + /// MO_LO16 - On a symbol operand, this represents a relocation containing + /// lower 16 bit of the address. Used only via movw instruction. + ARMII_MO_LO16, + + /// MO_HI16 - On a symbol operand, this represents a relocation containing + /// higher 16 bit of the address. Used only via movt instruction. + ARMII_MO_HI16, + + /// MO_LO16_NONLAZY - On a symbol operand "FOO", this represents a + /// relocation containing lower 16 bit of the non-lazy-ptr indirect symbol, + /// i.e. "FOO$non_lazy_ptr". + /// Used only via movw instruction. + ARMII_MO_LO16_NONLAZY, + + /// MO_HI16_NONLAZY - On a symbol operand "FOO", this represents a + /// relocation containing lower 16 bit of the non-lazy-ptr indirect symbol, + /// i.e. "FOO$non_lazy_ptr". Used only via movt instruction. + ARMII_MO_HI16_NONLAZY, + + /// MO_LO16_NONLAZY_PIC - On a symbol operand "FOO", this represents a + /// relocation containing lower 16 bit of the PC relative address of the + /// non-lazy-ptr indirect symbol, i.e. "FOO$non_lazy_ptr - LABEL". + /// Used only via movw instruction. + ARMII_MO_LO16_NONLAZY_PIC, + + /// MO_HI16_NONLAZY_PIC - On a symbol operand "FOO", this represents a + /// relocation containing lower 16 bit of the PC relative address of the + /// non-lazy-ptr indirect symbol, i.e. "FOO$non_lazy_ptr - LABEL". + /// Used only via movt instruction. + ARMII_MO_HI16_NONLAZY_PIC, + + /// MO_PLT - On a symbol operand, this represents an ELF PLT reference on a + /// call operand. + ARMII_MO_PLT +}; + +enum { + //===------------------------------------------------------------------===// + // Instruction Flags. + + //===------------------------------------------------------------------===// + // This four-bit field describes the addressing mode used. + ARMII_AddrModeMask = 0x1f, // The AddrMode enums are declared in ARMBaseInfo.h + + // IndexMode - Unindex, pre-indexed, or post-indexed are valid for load + // and store ops only. Generic "updating" flag is used for ld/st multiple. + // The index mode enums are declared in ARMBaseInfo.h + ARMII_IndexModeShift = 5, + ARMII_IndexModeMask = 3 << ARMII_IndexModeShift, + + //===------------------------------------------------------------------===// + // Instruction encoding formats. + // + ARMII_FormShift = 7, + ARMII_FormMask = 0x3f << ARMII_FormShift, + + // Pseudo instructions + ARMII_Pseudo = 0 << ARMII_FormShift, + + // Multiply instructions + ARMII_MulFrm = 1 << ARMII_FormShift, + + // Branch instructions + ARMII_BrFrm = 2 << ARMII_FormShift, + ARMII_BrMiscFrm = 3 << ARMII_FormShift, + + // Data Processing instructions + ARMII_DPFrm = 4 << ARMII_FormShift, + ARMII_DPSoRegFrm = 5 << ARMII_FormShift, + + // Load and Store + ARMII_LdFrm = 6 << ARMII_FormShift, + ARMII_StFrm = 7 << ARMII_FormShift, + ARMII_LdMiscFrm = 8 << ARMII_FormShift, + ARMII_StMiscFrm = 9 << ARMII_FormShift, + ARMII_LdStMulFrm = 10 << ARMII_FormShift, + + ARMII_LdStExFrm = 11 << ARMII_FormShift, + + // Miscellaneous arithmetic instructions + ARMII_ArithMiscFrm = 12 << ARMII_FormShift, + ARMII_SatFrm = 13 << ARMII_FormShift, + + // Extend instructions + ARMII_ExtFrm = 14 << ARMII_FormShift, + + // VFP formats + ARMII_VFPUnaryFrm = 15 << ARMII_FormShift, + ARMII_VFPBinaryFrm = 16 << ARMII_FormShift, + ARMII_VFPConv1Frm = 17 << ARMII_FormShift, + ARMII_VFPConv2Frm = 18 << ARMII_FormShift, + ARMII_VFPConv3Frm = 19 << ARMII_FormShift, + ARMII_VFPConv4Frm = 20 << ARMII_FormShift, + ARMII_VFPConv5Frm = 21 << ARMII_FormShift, + ARMII_VFPLdStFrm = 22 << ARMII_FormShift, + ARMII_VFPLdStMulFrm = 23 << ARMII_FormShift, + ARMII_VFPMiscFrm = 24 << ARMII_FormShift, + + // Thumb format + ARMII_ThumbFrm = 25 << ARMII_FormShift, + + // Miscelleaneous format + ARMII_MiscFrm = 26 << ARMII_FormShift, + + // NEON formats + ARMII_NGetLnFrm = 27 << ARMII_FormShift, + ARMII_NSetLnFrm = 28 << ARMII_FormShift, + ARMII_NDupFrm = 29 << ARMII_FormShift, + ARMII_NLdStFrm = 30 << ARMII_FormShift, + ARMII_N1RegModImmFrm= 31 << ARMII_FormShift, + ARMII_N2RegFrm = 32 << ARMII_FormShift, + ARMII_NVCVTFrm = 33 << ARMII_FormShift, + ARMII_NVDupLnFrm = 34 << ARMII_FormShift, + ARMII_N2RegVShLFrm = 35 << ARMII_FormShift, + ARMII_N2RegVShRFrm = 36 << ARMII_FormShift, + ARMII_N3RegFrm = 37 << ARMII_FormShift, + ARMII_N3RegVShFrm = 38 << ARMII_FormShift, + ARMII_NVExtFrm = 39 << ARMII_FormShift, + ARMII_NVMulSLFrm = 40 << ARMII_FormShift, + ARMII_NVTBLFrm = 41 << ARMII_FormShift, + + //===------------------------------------------------------------------===// + // Misc flags. + + // UnaryDP - Indicates this is a unary data processing instruction, i.e. + // it doesn't have a Rn operand. + ARMII_UnaryDP = 1 << 13, + + // Xform16Bit - Indicates this Thumb2 instruction may be transformed into + // a 16-bit Thumb instruction if certain conditions are met. + ARMII_Xform16Bit = 1 << 14, + + // ThumbArithFlagSetting - The instruction is a 16-bit flag setting Thumb + // instruction. Used by the parser to determine whether to require the 'S' + // suffix on the mnemonic (when not in an IT block) or preclude it (when + // in an IT block). + ARMII_ThumbArithFlagSetting = 1 << 18, + + //===------------------------------------------------------------------===// + // Code domain. + ARMII_DomainShift = 15, + ARMII_DomainMask = 7 << ARMII_DomainShift, + ARMII_DomainGeneral = 0 << ARMII_DomainShift, + ARMII_DomainVFP = 1 << ARMII_DomainShift, + ARMII_DomainNEON = 2 << ARMII_DomainShift, + ARMII_DomainNEONA8 = 4 << ARMII_DomainShift, + + //===------------------------------------------------------------------===// + // Field shifts - such shifts are used to set field while generating + // machine instructions. + // + // FIXME: This list will need adjusting/fixing as the MC code emitter + // takes shape and the ARMCodeEmitter.cpp bits go away. + ARMII_ShiftTypeShift = 4, + + ARMII_M_BitShift = 5, + ARMII_ShiftImmShift = 5, + ARMII_ShiftShift = 7, + ARMII_N_BitShift = 7, + ARMII_ImmHiShift = 8, + ARMII_SoRotImmShift = 8, + ARMII_RegRsShift = 8, + ARMII_ExtRotImmShift = 10, + ARMII_RegRdLoShift = 12, + ARMII_RegRdShift = 12, + ARMII_RegRdHiShift = 16, + ARMII_RegRnShift = 16, + ARMII_S_BitShift = 20, + ARMII_W_BitShift = 21, + ARMII_AM3_I_BitShift = 22, + ARMII_D_BitShift = 22, + ARMII_U_BitShift = 23, + ARMII_P_BitShift = 24, + ARMII_I_BitShift = 25, + ARMII_CondShift = 28 +}; + +typedef struct MClassSysReg { + const char *Name; + arm_sysreg sysreg; + uint16_t M1Encoding12; + uint16_t M2M3Encoding8; + uint16_t Encoding; + int FeaturesRequired[2]; // 2 is enough for MClassSysRegsList +} MClassSysReg; + +enum TraceSyncBOpt { + CSYNC = 0 +}; + +const MClassSysReg *lookupMClassSysRegByM2M3Encoding8(uint16_t encoding); +const MClassSysReg *lookupMClassSysRegByM1Encoding12(uint16_t M1Encoding12); + +// returns APSR with _<bits> qualifier. +// Note: ARMv7-M deprecates using MSR APSR without a _<bits> qualifier +static inline const MClassSysReg *lookupMClassSysRegAPSRNonDeprecated(unsigned SYSm) +{ + return lookupMClassSysRegByM2M3Encoding8((1<<9) | (SYSm & 0xFF)); +} + +static inline const MClassSysReg *lookupMClassSysRegBy8bitSYSmValue(unsigned SYSm) +{ + return lookupMClassSysRegByM2M3Encoding8((1<<8) | (SYSm & 0xFF)); +} + +// returns true if TestFeatures are all present in FeaturesRequired +static inline bool MClassSysReg_isInRequiredFeatures(const MClassSysReg *TheReg, int TestFeatures) +{ + return (TheReg->FeaturesRequired[0] == TestFeatures || TheReg->FeaturesRequired[1] == TestFeatures); +} + +// lookup system register using 12-bit SYSm value. +// Note: the search is uniqued using M1 mask +static inline const MClassSysReg *lookupMClassSysRegBy12bitSYSmValue(unsigned SYSm) +{ + return lookupMClassSysRegByM1Encoding12(SYSm); +} + +static inline const char *ARM_TSB_TraceSyncBOptToString(unsigned val) +{ + switch (val) { + default: + // llvm_unreachable("Unknown trace synchronization barrier operation"); + return NULL; + + case CSYNC: + return "csync"; + } +} + +#endif |