CoCalc -- X86DisassemblerTables.h

GitHub Repository: freebsd/freebsd-src
Path: blob/main/contrib/llvm-project/llvm/utils/TableGen/X86DisassemblerTables.h
³⁵²⁵⁸ views
1
//===- X86DisassemblerTables.h - Disassembler tables ------------*- C++ -*-===//
2
//
3
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4
// See https://llvm.org/LICENSE.txt for license information.
5
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6
//
7
//===----------------------------------------------------------------------===//
8
//
9
// This file is part of the X86 Disassembler Emitter.
10
// It contains the interface of the disassembler tables.
11
// Documentation for the disassembler emitter in general can be found in
12
//  X86DisassemblerEmitter.h.
13
//
14
//===----------------------------------------------------------------------===//
15

16
#ifndef LLVM_UTILS_TABLEGEN_X86DISASSEMBLERTABLES_H
17
#define LLVM_UTILS_TABLEGEN_X86DISASSEMBLERTABLES_H
18

19
#include "X86DisassemblerShared.h"
20
#include "llvm/Support/X86DisassemblerDecoderCommon.h"
21
#include <map>
22
#include <memory>
23
#include <vector>
24

25
namespace llvm {
26
class raw_ostream;
27

28
namespace X86Disassembler {
29

30
class ModRMFilter;
31

32
/// DisassemblerTables - Encapsulates all the decode tables being generated by
33
///   the table emitter.  Contains functions to populate the tables as well as
34
///   to emit them as hierarchical C structures suitable for consumption by the
35
///   runtime.
36
class DisassemblerTables {
37
private:
38
  /// The decoder tables.  There is one for each opcode type:
39
  /// [0] one-byte opcodes
40
  /// [1] two-byte opcodes of the form 0f __
41
  /// [2] three-byte opcodes of the form 0f 38 __
42
  /// [3] three-byte opcodes of the form 0f 3a __
43
  /// [4] XOP8 map opcode
44
  /// [5] XOP9 map opcode
45
  /// [6] XOPA map opcode
46
  /// [7] 3dnow map opcode
47
  /// [8] fixed length MAP4 opcode
48
  /// [9] fixed length MAP5 opcode
49
  /// [10] fixed length MAP6 opcode
50
  /// [11] fixed length MAP7 opcode
51
  std::unique_ptr<ContextDecision> Tables[12];
52

53
  // Table of ModRM encodings.
54
  typedef std::map<std::vector<unsigned>, unsigned> ModRMMapTy;
55
  mutable ModRMMapTy ModRMTable;
56

57
  /// The instruction information table
58
  std::vector<InstructionSpecifier> InstructionSpecifiers;
59

60
  /// True if there are primary decode conflicts in the instruction set
61
  bool HasConflicts;
62

63
  /// emitModRMDecision - Emits a table of entries corresponding to a single
64
  ///   ModR/M decision.  Compacts the ModR/M decision if possible.  ModR/M
65
  ///   decisions are printed as:
66
  ///
67
  ///   { /* struct ModRMDecision */
68
  ///     TYPE,
69
  ///     modRMTablennnn
70
  ///   }
71
  ///
72
  ///   where nnnn is a unique ID for the corresponding table of IDs.
73
  ///   TYPE indicates whether the table has one entry that is the same
74
  ///   regardless of ModR/M byte, two entries - one for bytes 0x00-0xbf and one
75
  ///   for bytes 0xc0-0xff -, or 256 entries, one for each possible byte.
76
  ///   nnnn is the number of a table for looking up these values.  The tables
77
  ///   are written separately so that tables consisting entirely of zeros will
78
  ///   not be duplicated.  (These all have the name modRMEmptyTable.)  A table
79
  ///   is printed as:
80
  ///
81
  ///   InstrUID modRMTablennnn[k] = {
82
  ///     nnnn, /* MNEMONIC */
83
  ///     ...
84
  ///     nnnn /* MNEMONIC */
85
  ///   };
86
  ///
87
  /// @param o1       - The output stream to print the ID table to.
88
  /// @param o2       - The output stream to print the decision structure to.
89
  /// @param i1       - The indentation level to use with stream o1.
90
  /// @param i2       - The indentation level to use with stream o2.
91
  /// @param ModRMTableNum - next table number for adding to ModRMTable.
92
  /// @param decision - The ModR/M decision to emit.  This decision has 256
93
  ///                   entries - emitModRMDecision decides how to compact it.
94
  void emitModRMDecision(raw_ostream &o1, raw_ostream &o2, unsigned &i1,
95
                         unsigned &i2, unsigned &ModRMTableNum,
96
                         ModRMDecision &decision) const;
97

98
  /// emitOpcodeDecision - Emits an OpcodeDecision and all its subsidiary ModR/M
99
  ///   decisions.  An OpcodeDecision is printed as:
100
  ///
101
  ///   { /* struct OpcodeDecision */
102
  ///     /* 0x00 */
103
  ///     { /* struct ModRMDecision */
104
  ///       ...
105
  ///     }
106
  ///     ...
107
  ///   }
108
  ///
109
  ///   where the ModRMDecision structure is printed as described in the
110
  ///   documentation for emitModRMDecision().  emitOpcodeDecision() passes on a
111
  ///   stream and indent level for the UID tables generated by
112
  ///   emitModRMDecision(), but does not use them itself.
113
  ///
114
  /// @param o1       - The output stream to print the ID tables generated by
115
  ///                   emitModRMDecision() to.
116
  /// @param o2       - The output stream for the decision structure itself.
117
  /// @param i1       - The indent level to use with stream o1.
118
  /// @param i2       - The indent level to use with stream o2.
119
  /// @param ModRMTableNum - next table number for adding to ModRMTable.
120
  /// @param decision - The OpcodeDecision to emit along with its subsidiary
121
  ///                    structures.
122
  void emitOpcodeDecision(raw_ostream &o1, raw_ostream &o2, unsigned &i1,
123
                          unsigned &i2, unsigned &ModRMTableNum,
124
                          OpcodeDecision &decision) const;
125

126
  /// emitContextDecision - Emits a ContextDecision and all its subsidiary
127
  ///   Opcode and ModRMDecisions.  A ContextDecision is printed as:
128
  ///
129
  ///   struct ContextDecision NAME = {
130
  ///     { /* OpcodeDecisions */
131
  ///       /* IC */
132
  ///       { /* struct OpcodeDecision */
133
  ///         ...
134
  ///       },
135
  ///       ...
136
  ///     }
137
  ///   }
138
  ///
139
  ///   NAME is the name of the ContextDecision (typically one of the four names
140
  ///   ONEBYTE_SYM, TWOBYTE_SYM, THREEBYTE38_SYM, THREEBYTE3A_SYM from
141
  ///   X86DisassemblerDecoderCommon.h).
142
  ///   IC is one of the contexts in InstructionContext.  There is an opcode
143
  ///   decision for each possible context.
144
  ///   The OpcodeDecision structures are printed as described in the
145
  ///   documentation for emitOpcodeDecision.
146
  ///
147
  /// @param o1       - The output stream to print the ID tables generated by
148
  ///                   emitModRMDecision() to.
149
  /// @param o2       - The output stream to print the decision structure to.
150
  /// @param i1       - The indent level to use with stream o1.
151
  /// @param i2       - The indent level to use with stream o2.
152
  /// @param ModRMTableNum - next table number for adding to ModRMTable.
153
  /// @param decision - The ContextDecision to emit along with its subsidiary
154
  ///                   structures.
155
  /// @param name     - The name for the ContextDecision.
156
  void emitContextDecision(raw_ostream &o1, raw_ostream &o2, unsigned &i1,
157
                           unsigned &i2, unsigned &ModRMTableNum,
158
                           ContextDecision &decision, const char *name) const;
159

160
  /// emitInstructionInfo - Prints the instruction specifier table, which has
161
  ///   one entry for each instruction, and contains name and operand
162
  ///   information.  This table is printed as:
163
  ///
164
  ///   struct InstructionSpecifier CONTEXTS_SYM[k] = {
165
  ///     {
166
  ///       /* nnnn */
167
  ///       "MNEMONIC",
168
  ///       0xnn,
169
  ///       {
170
  ///         {
171
  ///           ENCODING,
172
  ///           TYPE
173
  ///         },
174
  ///         ...
175
  ///       }
176
  ///     },
177
  ///   };
178
  ///
179
  ///   k is the total number of instructions.
180
  ///   nnnn is the ID of the current instruction (0-based).  This table
181
  ///   includes entries for non-instructions like PHINODE.
182
  ///   0xnn is the lowest possible opcode for the current instruction, used for
183
  ///   AddRegFrm instructions to compute the operand's value.
184
  ///   ENCODING and TYPE describe the encoding and type for a single operand.
185
  ///
186
  /// @param o  - The output stream to which the instruction table should be
187
  ///             written.
188
  /// @param i  - The indent level for use with the stream.
189
  void emitInstructionInfo(raw_ostream &o, unsigned &i) const;
190

191
  /// emitContextTable - Prints the table that is used to translate from an
192
  ///   instruction attribute mask to an instruction context.  This table is
193
  ///   printed as:
194
  ///
195
  ///   InstructionContext CONTEXTS_STR[256] = {
196
  ///     IC, /* 0x00 */
197
  ///     ...
198
  ///   };
199
  ///
200
  ///   IC is the context corresponding to the mask 0x00, and there are 256
201
  ///   possible masks.
202
  ///
203
  /// @param o  - The output stream to which the context table should be
204
  /// written.
205
  /// @param i  - The indent level for use with the stream.
206
  void emitContextTable(raw_ostream &o, uint32_t &i) const;
207

208
  /// emitContextDecisions - Prints all four ContextDecision structures using
209
  ///   emitContextDecision().
210
  ///
211
  /// @param o1 - The output stream to print the ID tables generated by
212
  ///             emitModRMDecision() to.
213
  /// @param o2 - The output stream to print the decision structures to.
214
  /// @param i1 - The indent level to use with stream o1.
215
  /// @param i2 - The indent level to use with stream o2.
216
  /// @param ModRMTableNum - next table number for adding to ModRMTable.
217
  void emitContextDecisions(raw_ostream &o1, raw_ostream &o2, unsigned &i1,
218
                            unsigned &i2, unsigned &ModRMTableNum) const;
219

220
  /// setTableFields - Uses a ModRMFilter to set the appropriate entries in a
221
  ///   ModRMDecision to refer to a particular instruction ID.
222
  ///
223
  /// @param decision - The ModRMDecision to populate.
224
  /// @param filter   - The filter to use in deciding which entries to populate.
225
  /// @param uid      - The unique ID to set matching entries to.
226
  /// @param opcode   - The opcode of the instruction, for error reporting.
227
  void setTableFields(ModRMDecision &decision, const ModRMFilter &filter,
228
                      InstrUID uid, uint8_t opcode);
229

230
public:
231
  /// Constructor - Allocates space for the class decisions and clears them.
232
  DisassemblerTables();
233

234
  ~DisassemblerTables();
235

236
  /// emit - Emits the instruction table, context table, and class decisions.
237
  ///
238
  /// @param o  - The output stream to print the tables to.
239
  void emit(raw_ostream &o) const;
240

241
  /// setTableFields - Uses the opcode type, instruction context, opcode, and a
242
  ///   ModRMFilter as criteria to set a particular set of entries in the
243
  ///   decode tables to point to a specific uid.
244
  ///
245
  /// @param type         - The opcode type (ONEBYTE, TWOBYTE, etc.)
246
  /// @param insnContext  - The context to use (IC, IC_64BIT, etc.)
247
  /// @param opcode       - The last byte of the opcode (not counting any escape
248
  ///                       or extended opcodes).
249
  /// @param filter       - The ModRMFilter that decides which ModR/M byte
250
  /// values
251
  ///                       correspond to the desired instruction.
252
  /// @param uid          - The unique ID of the instruction.
253
  /// @param is32bit      - Instructon is only 32-bit
254
  /// @param noPrefix     - Instruction record has no prefix.
255
  /// @param ignoresVEX_L - Instruction ignores VEX.L
256
  /// @param ignoresVEX_W - Instruction ignores VEX.W
257
  /// @param AddrSize     - Instructions address size 16/32/64. 0 is unspecified
258
  void setTableFields(OpcodeType type, InstructionContext insnContext,
259
                      uint8_t opcode, const ModRMFilter &filter, InstrUID uid,
260
                      bool is32bit, bool noPrefix, bool ignoresVEX_L,
261
                      bool ignoresVEX_W, unsigned AddrSize);
262

263
  /// specForUID - Returns the instruction specifier for a given unique
264
  ///   instruction ID.  Used when resolving collisions.
265
  ///
266
  /// @param uid  - The unique ID of the instruction.
267
  /// @return     - A reference to the instruction specifier.
268
  InstructionSpecifier &specForUID(InstrUID uid) {
269
    if (uid >= InstructionSpecifiers.size())
270
      InstructionSpecifiers.resize(uid + 1);
271

272
    return InstructionSpecifiers[uid];
273
  }
274

275
  // hasConflicts - Reports whether there were primary decode conflicts
276
  //   from any instructions added to the tables.
277
  // @return  - true if there were; false otherwise.
278

279
  bool hasConflicts() { return HasConflicts; }
280
};
281

282
} // namespace X86Disassembler
283

284
} // namespace llvm
285

286
#endif
287

288
Product

Resources

Company