Blame - utils/TableGen/X86RecognizableInstr.h - platform_external_llvm

2009-12-19 02:59:52 +0000

[diff] [blame]

1

//===- X86RecognizableInstr.h - Disassembler instruction spec ----*- C++ -*-===//

2

//

3

// The LLVM Compiler Infrastructure

4

//

5

// This file is distributed under the University of Illinois Open Source

6

// License. See LICENSE.TXT for details.

7

//

8

//===----------------------------------------------------------------------===//

9

//

10

// This file is part of the X86 Disassembler Emitter.

11

// It contains the interface of a single recognizable instruction.

12

// Documentation for the disassembler emitter in general can be found in

Hiroshi Inoue

b08063c

2017-07-04 13:09:29 +0000

[diff] [blame]

13

// X86DisassemblerEmitter.h.

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

14

//

15

//===----------------------------------------------------------------------===//

16

Benjamin Kramer

00e08fc

2014-08-13 16:26:38 +0000

[diff] [blame]

17

#ifndef LLVM_UTILS_TABLEGEN_X86RECOGNIZABLEINSTR_H

18

#define LLVM_UTILS_TABLEGEN_X86RECOGNIZABLEINSTR_H

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

19

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

20

#include "CodeGenTarget.h"

Chandler Carruth

4ffd89f

2012-12-04 10:37:14 +0000

[diff] [blame]

21

#include "X86DisassemblerTables.h"

Chandler Carruth

4ffd89f

2012-12-04 10:37:14 +0000

[diff] [blame]

22

#include "llvm/Support/DataTypes.h"

23

#include "llvm/TableGen/Record.h"

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

namespace llvm {

Ayman Musa

2017-05-11 11:51:12 +0000

[diff] [blame]

27

// X-macro list of the MRM_XX forms. Each MAP(XX, N) entry pairs a two-digit
// hexadecimal suffix XX (C0 through FF) with the value N (64 through 127), so
// that N == 0xXX - 0x80 for every entry. To use the list, define
// MAP(from, to), expand X86_INSTR_MRM_MAPPING, then #undef MAP.
//
// Every line except the last must end in a backslash that is immediately
// followed by the next entry; a blank line would terminate the macro early.
#define X86_INSTR_MRM_MAPPING                                                  \
  MAP(C0, 64)  MAP(C1, 65)  MAP(C2, 66)  MAP(C3, 67)                           \
  MAP(C4, 68)  MAP(C5, 69)  MAP(C6, 70)  MAP(C7, 71)                           \
  MAP(C8, 72)  MAP(C9, 73)  MAP(CA, 74)  MAP(CB, 75)                           \
  MAP(CC, 76)  MAP(CD, 77)  MAP(CE, 78)  MAP(CF, 79)                           \
  MAP(D0, 80)  MAP(D1, 81)  MAP(D2, 82)  MAP(D3, 83)                           \
  MAP(D4, 84)  MAP(D5, 85)  MAP(D6, 86)  MAP(D7, 87)                           \
  MAP(D8, 88)  MAP(D9, 89)  MAP(DA, 90)  MAP(DB, 91)                           \
  MAP(DC, 92)  MAP(DD, 93)  MAP(DE, 94)  MAP(DF, 95)                           \
  MAP(E0, 96)  MAP(E1, 97)  MAP(E2, 98)  MAP(E3, 99)                           \
  MAP(E4, 100) MAP(E5, 101) MAP(E6, 102) MAP(E7, 103)                          \
  MAP(E8, 104) MAP(E9, 105) MAP(EA, 106) MAP(EB, 107)                          \
  MAP(EC, 108) MAP(ED, 109) MAP(EE, 110) MAP(EF, 111)                          \
  MAP(F0, 112) MAP(F1, 113) MAP(F2, 114) MAP(F3, 115)                          \
  MAP(F4, 116) MAP(F5, 117) MAP(F6, 118) MAP(F7, 119)                          \
  MAP(F8, 120) MAP(F9, 121) MAP(FA, 122) MAP(FB, 123)                          \
  MAP(FC, 124) MAP(FD, 125) MAP(FE, 126) MAP(FF, 127)

// A clone of X86 since we can't depend on something that is generated.
namespace X86Local {
  // Instruction form codes.
  // NOTE(review): presumably the values held in RecognizableInstr::Form and
  // kept in sync with the generated X86 definitions -- confirm.
  enum {
    Pseudo         = 0,
    RawFrm         = 1,
    AddRegFrm      = 2,
    RawFrmMemOffs  = 3,
    RawFrmSrc      = 4,
    RawFrmDst      = 5,
    RawFrmDstSrc   = 6,
    RawFrmImm8     = 7,
    RawFrmImm16    = 8,
    MRMDestMem     = 32,
    MRMSrcMem      = 33,
    MRMSrcMem4VOp3 = 34,
    MRMSrcMemOp4   = 35,
    MRMXm = 39,
    MRM0m = 40, MRM1m = 41, MRM2m = 42, MRM3m = 43,
    MRM4m = 44, MRM5m = 45, MRM6m = 46, MRM7m = 47,
    MRMDestReg     = 48,
    MRMSrcReg      = 49,
    MRMSrcReg4VOp3 = 50,
    MRMSrcRegOp4   = 51,
    MRMXr = 55,
    MRM0r = 56, MRM1r = 57, MRM2r = 58, MRM3r = 59,
    MRM4r = 60, MRM5r = 61, MRM6r = 62, MRM7r = 63,
    // Appends one MRM_<suffix> enumerator per entry of X86_INSTR_MRM_MAPPING,
    // each set to the value given in that entry.
#define MAP(from, to) MRM_##from = to,
    X86_INSTR_MRM_MAPPING
#undef MAP
  };

  // NOTE(review): presumably the values of the record's OpMap field -- confirm.
  enum {
    OB = 0, TB = 1, T8 = 2, TA = 3, XOP8 = 4, XOP9 = 5, XOPA = 6, ThreeDNow = 7
  };

  // NOTE(review): presumably the values of the record's OpPrefix field --
  // confirm. Note that there is no enumerator for 0.
  enum {
    PD = 1, XS = 2, XD = 3, PS = 4
  };

  // NOTE(review): presumably the values of the record's Encoding field --
  // confirm.
  enum {
    VEX = 1, XOP = 2, EVEX = 3
  };

  // NOTE(review): presumably the values of the record's OpSize field --
  // confirm.
  enum {
    OpSize16 = 1, OpSize32 = 2
  };

  // NOTE(review): presumably the values of the record's AdSize field --
  // confirm.
  enum {
    AdSize16 = 1, AdSize32 = 2, AdSize64 = 3
  };

  // NOTE(review): presumably the values of the record's VEX_WPrefix field --
  // confirm.
  enum {
    VEX_W0 = 0, VEX_W1 = 1, VEX_WIG = 2, VEX_W1X = 3
  };
} // namespace X86Local

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

149

namespace X86Disassembler {

150

151

/// RecognizableInstr - Encapsulates all information required to decode a single

152

/// instruction, as extracted from the LLVM instruction tables. Has methods

153

/// to interpret the information available in the LLVM tables, and to emit the

154

/// instruction into DisassemblerTables.

155

class RecognizableInstr {

156

private:

157

/// The opcode of the instruction, as used in an MCInst

158

InstrUID UID;

159

/// The record from the .td files corresponding to this instruction

160

const Record* Rec;

Craig Topper

f0b161d

2014-01-31 08:47:06 +0000

[diff] [blame]

161

/// The OpPrefix field from the record

162

uint8_t OpPrefix;

163

/// The OpMap field from the record

164

uint8_t OpMap;

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

165

/// The opcode field from the record; this is the opcode used in the Intel

166

/// encoding and therefore distinct from the UID

167

uint8_t Opcode;

168

/// The form field from the record

169

uint8_t Form;

Craig Topper

1415ca1

2014-02-02 07:08:01 +0000

[diff] [blame]

170

// The encoding field from the record

171

uint8_t Encoding;

Craig Topper

2014-02-02 09:25:09 +0000

[diff] [blame]

172

/// The OpSize field from the record

173

uint8_t OpSize;

Craig Topper

3bc4397

2014-12-24 06:05:22 +0000

[diff] [blame]

174

/// The AdSize field from the record

175

uint8_t AdSize;

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

176

/// The hasREX_WPrefix field from the record

177

bool HasREX_WPrefix;

Craig Topper

1415ca1

2014-02-02 07:08:01 +0000

[diff] [blame]

178

/// The hasVEX_4V field from the record

179

bool HasVEX_4V;

Ayman Musa

5cb2278

2017-02-20 08:27:54 +0000

[diff] [blame]

180

/// The VEX_WPrefix field from the record

181

uint8_t VEX_WPrefix;

Sean Callanan

a21e2ea

2011-03-15 01:23:15 +0000

[diff] [blame]

182

/// Inferred from the operands; indicates whether the L bit in the VEX prefix is set

183

bool HasVEX_LPrefix;

Craig Topper

e6a3a29

2011-12-30 05:20:36 +0000

[diff] [blame]

184

/// The ignoreVEX_L field from the record

Craig Topper

6744a17

2011-10-04 06:30:42 +0000

[diff] [blame]

185

bool IgnoresVEX_L;

Elena Demikhovsky

c18f4ef

2013-07-28 08:28:38 +0000

[diff] [blame]

186

/// The hasEVEX_L2Prefix field from the record

187

bool HasEVEX_L2Prefix;

188

/// The hasEVEX_K field from the record

189

bool HasEVEX_K;

Elena Demikhovsky

633f98b

2013-11-03 13:46:31 +0000

[diff] [blame]

190

/// The hasEVEX_KZ field from the record

191

bool HasEVEX_KZ;

Elena Demikhovsky

c18f4ef

2013-07-28 08:28:38 +0000

[diff] [blame]

192

/// The hasEVEX_B field from the record

193

bool HasEVEX_B;

Craig Topper

0f7dce5

2017-10-23 02:26:24 +0000

[diff] [blame]

194

/// Indicates that the instruction uses the L and L' fields for RC.

195

bool EncodeRC;

Craig Topper

527f132

2014-01-05 04:17:28 +0000

[diff] [blame]

196

/// The isCodeGenOnly field from the record

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

197

bool IsCodeGenOnly;

Craig Topper

527f132

2014-01-05 04:17:28 +0000

[diff] [blame]

198

/// The ForceDisassemble field from the record

199

bool ForceDisassemble;

Adam Nemet

6ae2941

2014-07-17 17:04:56 +0000

[diff] [blame]

200

// The CD8_Scale field from the record

201

uint8_t CD8_Scale;

Craig Topper

4da632e

2011-09-23 06:57:25 +0000

[diff] [blame]

202

// Whether the instruction has the predicate "In64BitMode"

Eli Friedman

7105259

2011-07-16 02:41:28 +0000

[diff] [blame]

203

bool Is64Bit;

Craig Topper

4da632e

2011-09-23 06:57:25 +0000

[diff] [blame]

204

// Whether the instruction has the predicate "In32BitMode"

205

bool Is32Bit;

Craig Topper

1773084

2011-10-16 03:51:13 +0000

[diff] [blame]

206

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

207

/// The instruction name as listed in the tables

208

std::string Name;

Craig Topper

38e6f73

2014-01-15 05:02:02 +0000

[diff] [blame]

209

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

210

/// Indicates whether the instruction should be emitted into the decode

211

/// tables; regardless, it will be emitted into the instruction info table

212

bool ShouldBeEmitted;

Rafael Auler

2018-02-15 21:20:31 +0000

[diff] [blame]

213

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

214

/// The operands of the instruction, as listed in the CodeGenInstruction.

215

/// They are not one-to-one with operands listed in the MCInst; for example,

216

/// memory operands expand to 5 operands in the MCInst

Chris Lattner

c240bb0

2010-11-01 04:03:32 +0000

[diff] [blame]

217

const std::vector<CGIOperandList::OperandInfo>* Operands;

Rafael Auler

2018-02-15 21:20:31 +0000

[diff] [blame]

218

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

219

/// The description of the instruction that is emitted into the instruction

220

/// info table

221

InstructionSpecifier* Spec;

222

223

/// insnContext - Returns the primary context in which the instruction is

224

/// valid.

225

///

226

/// @return - The context in which the instruction is valid.

227

InstructionContext insnContext() const;

Sean Callanan

a21e2ea

2011-03-15 01:23:15 +0000

[diff] [blame]

228

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

229

/// typeFromString - Translates an operand type from the string provided in

230

/// the LLVM tables to an OperandType for use in the operand specifier.

231

///

232

/// @param s - The string, as extracted by calling Rec->getName()

233

/// on a CodeGenInstruction::OperandInfo.

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

234

/// @param hasREX_WPrefix - Indicates whether the instruction has a REX.W

235

/// prefix. If it does, 32-bit register operands stay

236

/// 32-bit regardless of the operand size.

Craig Topper

2014-02-02 09:25:09 +0000

[diff] [blame]

237

/// @param OpSize Indicates the operand size of the instruction.

238

/// If register size does not match OpSize, then

239

/// register sizes keep their size.

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

240

/// @return - The operand's type.

Craig Topper

2014-02-02 09:25:09 +0000

[diff] [blame]

241

static OperandType typeFromString(const std::string& s,

242

bool hasREX_WPrefix, uint8_t OpSize);

243

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

244

/// immediateEncodingFromString - Translates an immediate encoding from the

245

/// string provided in the LLVM tables to an OperandEncoding for use in

246

/// the operand specifier.

247

///

Craig Topper

2014-02-02 09:25:09 +0000

[diff] [blame]

248

/// @param s - See typeFromString().

249

/// @param OpSize - Indicates whether this is an OpSize16 instruction.

250

/// If it is not, then 16-bit immediate operands stay 16-bit.

251

/// @return - The operand's encoding.

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

252

static OperandEncoding immediateEncodingFromString(const std::string &s,

Craig Topper

2014-02-02 09:25:09 +0000

[diff] [blame]

253

uint8_t OpSize);

254

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

255

/// rmRegisterEncodingFromString - Like immediateEncodingFromString, but

256

/// handles operands that are in the REG field of the ModR/M byte.

257

static OperandEncoding rmRegisterEncodingFromString(const std::string &s,

Craig Topper

2014-02-02 09:25:09 +0000

[diff] [blame]

258

uint8_t OpSize);

259

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

260

/// rmRegisterEncodingFromString - Like immediateEncodingFromString, but

261

/// handles operands that are in the REG field of the ModR/M byte.

262

static OperandEncoding roRegisterEncodingFromString(const std::string &s,

Craig Topper

2014-02-02 09:25:09 +0000

[diff] [blame]

263

uint8_t OpSize);

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

264

static OperandEncoding memoryEncodingFromString(const std::string &s,

Craig Topper

2014-02-02 09:25:09 +0000

[diff] [blame]

265

uint8_t OpSize);

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

266

static OperandEncoding relocationEncodingFromString(const std::string &s,

Craig Topper

2014-02-02 09:25:09 +0000

[diff] [blame]

267

uint8_t OpSize);

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

268

static OperandEncoding opcodeModifierEncodingFromString(const std::string &s,

Craig Topper

2014-02-02 09:25:09 +0000

[diff] [blame]

269

uint8_t OpSize);

Sean Callanan

a21e2ea

2011-03-15 01:23:15 +0000

[diff] [blame]

270

static OperandEncoding vvvvRegisterEncodingFromString(const std::string &s,

Craig Topper

2014-02-02 09:25:09 +0000

[diff] [blame]

271

uint8_t OpSize);

Elena Demikhovsky

c18f4ef

2013-07-28 08:28:38 +0000

[diff] [blame]

272

static OperandEncoding writemaskRegisterEncodingFromString(const std::string &s,

Craig Topper

2014-02-02 09:25:09 +0000

[diff] [blame]

273

uint8_t OpSize);

274

Adrian Prantl

26b584c

2018-05-01 15:54:18 +0000

[diff] [blame]

275

/// Adjust the encoding type for an operand based on the instruction.

Adam Nemet

6ae2941

2014-07-17 17:04:56 +0000

[diff] [blame]

276

void adjustOperandEncoding(OperandEncoding &encoding);

277

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

278

/// handleOperand - Converts a single operand from the LLVM table format to

279

/// the emitted table format, handling any duplicate operands it encounters

280

/// and then one non-duplicate.

281

///

282

/// @param optional - Determines whether to assert that the

283

/// operand exists.

284

/// @param operandIndex - The index into the generated operand table.

285

/// Incremented by this function one or more

Rafael Auler

2018-02-15 21:20:31 +0000

[diff] [blame]

286

/// times to reflect possible duplicate

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

287

/// operands).

288

/// @param physicalOperandIndex - The index of the current operand into the

289

/// set of non-duplicate ('physical') operands.

290

/// Incremented by this function once.

291

/// @param numPhysicalOperands - The number of non-duplicate operands in the

292

/// instructions.

293

/// @param operandMapping - The operand mapping, which has an entry for

294

/// each operand that indicates whether it is a

295

/// duplicate, and of what.

296

void handleOperand(bool optional,

297

unsigned &operandIndex,

298

unsigned &physicalOperandIndex,

Craig Topper

69dced0

2016-02-16 04:24:56 +0000

[diff] [blame]

299

unsigned numPhysicalOperands,

Craig Topper

5aba78b

2012-07-12 06:52:41 +0000

[diff] [blame]

300

const unsigned *operandMapping,

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

301

OperandEncoding (*encodingFromString)

302

(const std::string&,

Craig Topper

2014-02-02 09:25:09 +0000

[diff] [blame]

303

uint8_t OpSize));

304

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

305

/// shouldBeEmitted - Returns the shouldBeEmitted field. Although filter()

306

/// filters out many instructions, at various points in decoding we

307

/// determine that the instruction should not actually be decodable. In

308

/// particular, MMX MOV instructions aren't emitted, but they're only

309

/// identified during operand parsing.

310

///

311

/// @return - true if at this point we believe the instruction should be

312

/// emitted; false if not. This will return false if filter() returns false

313

/// once emitInstructionSpecifier() has been called.

314

bool shouldBeEmitted() const {

315

return ShouldBeEmitted;

316

}

Rafael Auler

2018-02-15 21:20:31 +0000

[diff] [blame]

317

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

318

/// emitInstructionSpecifier - Loads the instruction specifier for the current

319

/// instruction into a DisassemblerTables.

320

///

Craig Topper

e61c70a

2014-01-02 03:58:45 +0000

[diff] [blame]

321

void emitInstructionSpecifier();

Rafael Auler

2018-02-15 21:20:31 +0000

[diff] [blame]

322

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

323

/// emitDecodePath - Populates the proper fields in the decode tables

324

/// corresponding to the decode paths for this instruction.

325

///

Dmitri Gribenko

2012-09-13 12:34:29 +0000

[diff] [blame]

326

/// \param tables The DisassemblerTables to populate with the decode

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

327

/// decode information for the current instruction.

328

void emitDecodePath(DisassemblerTables &tables) const;

329

330

/// Constructor - Initializes a RecognizableInstr with the appropriate fields

331

/// from a CodeGenInstruction.

332

///

Dmitri Gribenko

2012-09-13 12:34:29 +0000

[diff] [blame]

333

/// \param tables The DisassemblerTables that the specifier will be added to.

334

/// \param insn The CodeGenInstruction to extract information from.

335

/// \param uid The unique ID of the current instruction.

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

336

RecognizableInstr(DisassemblerTables &tables,

337

const CodeGenInstruction &insn,

338

InstrUID uid);

339

public:

340

/// processInstr - Accepts a CodeGenInstruction and loads decode information

341

/// for it into a DisassemblerTables if appropriate.

342

///

Dmitri Gribenko

2012-09-13 12:34:29 +0000

[diff] [blame]

343

/// \param tables The DiassemblerTables to be populated with decode

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

344

/// information.

Dmitri Gribenko

2012-09-13 12:34:29 +0000

[diff] [blame]

345

/// \param insn The CodeGenInstruction to be used as a source for this

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

346

/// information.

Dmitri Gribenko

2012-09-13 12:34:29 +0000

[diff] [blame]

347

/// \param uid The unique ID of the instruction.

Sean Callanan

2009-12-19 02:59:52 +0000

[diff] [blame]

348

static void processInstr(DisassemblerTables &tables,

349

const CodeGenInstruction &insn,

350

InstrUID uid);

351

};

Rafael Auler

2018-02-15 21:20:31 +0000

[diff] [blame]

352

Sean Callanan