1 //===- X86DisassemblerTables.h - Disassembler tables ------------*- C++ -*-===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // This file is part of the X86 Disassembler Emitter.
11 // It contains the interface of the disassembler tables.
12 // Documentation for the disassembler emitter in general can be found in
13 // X86DisassemblerEmitter.h.
15 //===----------------------------------------------------------------------===//
17 #ifndef X86DISASSEMBLERTABLES_H
18 #define X86DISASSEMBLERTABLES_H
20 #include "X86DisassemblerShared.h"
21 #include "X86ModRMFilters.h"
22 #include "llvm/Support/raw_ostream.h"
28 namespace X86Disassembler {
30 /// DisassemblerTables - Encapsulates all the decode tables being generated by
31 /// the table emitter. Contains functions to populate the tables as well as
32 /// to emit them as hierarchical C structures suitable for consumption by the
/// X86 disassembler.
34 class DisassemblerTables {
36 /// The decoder tables. There is one for each opcode type:
37 /// [0] one-byte opcodes
38 /// [1] two-byte opcodes of the form 0f __
39 /// [2] three-byte opcodes of the form 0f 38 __
40 /// [3] three-byte opcodes of the form 0f 3a __
41 /// [4] three-byte opcodes of the form 0f a6 __
42 /// [5] three-byte opcodes of the form 0f a7 __
43 ContextDecision* Tables[6];
45 // Table of ModRM encodings.
46 typedef std::map<std::vector<unsigned>, unsigned> ModRMMapTy;
47 mutable ModRMMapTy ModRMTable;
49 /// The instruction information table
50 std::vector<InstructionSpecifier> InstructionSpecifiers;
52 /// True if there are primary decode conflicts in the instruction set
55 /// emitModRMDecision - Emits a table of entries corresponding to a single
56 /// ModR/M decision. Compacts the ModR/M decision if possible. ModR/M
57 /// decisions are printed as:
59 /// { /* struct ModRMDecision */
64 /// where nnnn is a unique ID for the corresponding table of IDs.
65 /// TYPE indicates whether the table has one entry that is the same
66 /// regardless of ModR/M byte, two entries - one for bytes 0x00-0xbf and one
67 /// for bytes 0xc0-0xff -, or 256 entries, one for each possible byte.
68 /// nnnn is the number of a table for looking up these values. The tables
69 /// are written separately so that tables consisting entirely of zeros will
70 /// not be duplicated. (These all have the name modRMEmptyTable.) A table
/// of IDs is printed as:
73 /// InstrUID modRMTablennnn[k] = {
74 /// nnnn, /* MNEMONIC */
76 /// nnnn /* MNEMONIC */
79 /// @param o1 - The output stream to print the ID table to.
80 /// @param o2 - The output stream to print the decision structure to.
81 /// @param i1 - The indentation level to use with stream o1.
82 /// @param i2 - The indentation level to use with stream o2.
83 /// @param ModRMTableNum - next table number for adding to ModRMTable.
84 /// @param decision - The ModR/M decision to emit. This decision has 256
85 /// entries - emitModRMDecision decides how to compact it.
///
/// @note i1, i2 and ModRMTableNum are taken by non-const reference, so the
/// callee is able to update the caller's values. The function itself is
/// const; ModRMTable, which the ModRMTableNum description refers to, is
/// declared mutable in this class.
86 void emitModRMDecision(raw_ostream &o1, raw_ostream &o2,
87 unsigned &i1, unsigned &i2, unsigned &ModRMTableNum,
88 ModRMDecision &decision) const;
90 /// emitOpcodeDecision - Emits an OpcodeDecision and all its subsidiary ModR/M
91 /// decisions. An OpcodeDecision is printed as:
93 /// { /* struct OpcodeDecision */
95 /// { /* struct ModRMDecision */
101 /// where the ModRMDecision structure is printed as described in the
102 /// documentation for emitModRMDecision(). emitOpcodeDecision() passes on a
103 /// stream and indent level for the UID tables generated by
104 /// emitModRMDecision(), but does not use them itself.
106 /// @param o1 - The output stream to print the ID tables generated by
107 /// emitModRMDecision() to.
108 /// @param o2 - The output stream for the decision structure itself.
109 /// @param i1 - The indent level to use with stream o1.
110 /// @param i2 - The indent level to use with stream o2.
111 /// @param ModRMTableNum - next table number for adding to ModRMTable.
112 /// @param decision - The OpcodeDecision to emit along with its subsidiary
/// ModR/M decisions.
///
/// @note The parameter list mirrors emitModRMDecision(); only the type of
/// decision differs. NOTE(review): ModRMTableNum is presumably forwarded
/// unchanged to emitModRMDecision() - confirm in the implementation.
114 void emitOpcodeDecision(raw_ostream &o1, raw_ostream &o2,
115 unsigned &i1, unsigned &i2, unsigned &ModRMTableNum,
116 OpcodeDecision &decision) const;
118 /// emitContextDecision - Emits a ContextDecision and all its subsidiary
119 /// Opcode and ModRMDecisions. A ContextDecision is printed as:
121 /// struct ContextDecision NAME = {
122 /// { /* OpcodeDecisions */
124 /// { /* struct OpcodeDecision */
131 /// NAME is the name of the ContextDecision (typically one of the six names
132 /// ONEBYTE_SYM, TWOBYTE_SYM, THREEBYTE38_SYM, THREEBYTE3A_SYM,
133 /// THREEBYTEA6_SYM, and THREEBYTEA7_SYM from
134 /// X86DisassemblerDecoderCommon.h).
135 /// IC is one of the contexts in InstructionContext. There is an opcode
136 /// decision for each possible context.
137 /// The OpcodeDecision structures are printed as described in the
138 /// documentation for emitOpcodeDecision.
140 /// @param o1 - The output stream to print the ID tables generated by
141 /// emitModRMDecision() to.
142 /// @param o2 - The output stream to print the decision structure to.
143 /// @param i1 - The indent level to use with stream o1.
144 /// @param i2 - The indent level to use with stream o2.
145 /// @param ModRMTableNum - next table number for adding to ModRMTable.
146 /// @param decision - The ContextDecision to emit along with its subsidiary
/// Opcode and ModRM decisions.
148 /// @param name - The name for the ContextDecision.
149 void emitContextDecision(raw_ostream &o1, raw_ostream &o2,
150 unsigned &i1, unsigned &i2, unsigned &ModRMTableNum,
151 ContextDecision &decision, const char* name) const;
153 /// emitInstructionInfo - Prints the instruction specifier table, which has
154 /// one entry for each instruction, and contains name and operand
155 /// information. This table is printed as:
157 /// struct InstructionSpecifier CONTEXTS_SYM[k] = {
172 /// k is the total number of instructions.
173 /// nnnn is the ID of the current instruction (0-based). This table
174 /// includes entries for non-instructions like PHINODE.
175 /// 0xnn is the lowest possible opcode for the current instruction, used for
176 /// AddRegFrm instructions to compute the operand's value.
177 /// ENCODING and TYPE describe the encoding and type for a single operand.
///
/// NOTE(review): the sample above names the instruction table CONTEXTS_SYM,
/// while the context table documented for emitContextTable is CONTEXTS_STR.
/// A context-flavoured name on the instruction table looks like a slip -
/// confirm the real symbol against X86DisassemblerDecoderCommon.h.
///
179 /// @param o - The output stream to which the instruction table should be
/// written.
181 /// @param i - The indent level for use with the stream.
182 void emitInstructionInfo(raw_ostream &o, unsigned &i) const;
184 /// emitContextTable - Prints the table that is used to translate from an
185 /// instruction attribute mask to an instruction context. This table is
/// printed as:
188 /// InstructionContext CONTEXTS_STR[256] = {
193 /// IC is the context corresponding to the mask 0x00, and there are 256
/// entries in total, matching the array bound shown above.
196 /// @param o - The output stream to which the context table should be written.
197 /// @param i - The indent level for use with the stream.
///
/// @note The indent level is declared as uint32_t here, whereas the other
/// emitters in this class take unsigned. NOTE(review): confirm that the
/// difference is intentional and matches the definition.
198 void emitContextTable(raw_ostream &o, uint32_t &i) const;
200 /// emitContextDecisions - Prints the ContextDecision structures held by this
201 /// class (six, one per entry of Tables) using emitContextDecision().
/// NOTE(review): presumably one emitContextDecision() call per entry of
/// Tables - confirm in the implementation.
203 /// @param o1 - The output stream to print the ID tables generated by
204 /// emitModRMDecision() to.
205 /// @param o2 - The output stream to print the decision structures to.
206 /// @param i1 - The indent level to use with stream o1.
207 /// @param i2 - The indent level to use with stream o2.
208 /// @param ModRMTableNum - next table number for adding to ModRMTable.
209 void emitContextDecisions(raw_ostream &o1, raw_ostream &o2,
210 unsigned &i1, unsigned &i2,
211 unsigned &ModRMTableNum) const;
213 /// setTableFields - Uses a ModRMFilter to set the appropriate entries in a
214 /// ModRMDecision to refer to a particular instruction ID.
216 /// @param decision - The ModRMDecision to populate.
217 /// @param filter - The filter to use in deciding which entries to populate.
218 /// @param uid - The unique ID to set matching entries to.
219 /// @param opcode - The opcode of the instruction, for error reporting.
220 void setTableFields(ModRMDecision &decision,
221 const ModRMFilter &filter,
225 /// Constructor - Allocates space for the class decisions and clears them.
226 DisassemblerTables();
/// Destructor.
/// NOTE(review): Tables stores raw ContextDecision pointers and the
/// constructor is documented as allocating the decisions, so this presumably
/// releases them - confirm in the implementation. No copy constructor or
/// copy assignment is declared in the visible part of this class; verify
/// that instances are never copied.
228 ~DisassemblerTables();
230 /// emit - Emits the instruction table, context table, and class decisions.
///
232 /// @param o - The output stream to print the tables to.
///
/// @note Const member that takes only the destination stream, unlike the
/// emit* helpers declared earlier in this class, which also take indent
/// levels by reference.
233 void emit(raw_ostream &o) const;
235 /// setTableFields - Uses the opcode type, instruction context, opcode, and a
236 /// ModRMFilter as criteria to set a particular set of entries in the
237 /// decode tables to point to a specific uid.
239 /// @param type - The opcode type (ONEBYTE, TWOBYTE, etc.)
240 /// @param insnContext - The context to use (IC, IC_64BIT, etc.)
241 /// @param opcode - The last byte of the opcode (not counting any escape
242 /// or extended opcodes).
243 /// @param filter - The ModRMFilter that decides which ModR/M byte values
244 /// correspond to the desired instruction.
245 /// @param uid - The unique ID of the instruction.
246 /// @param is32bit - Instruction is only 32-bit
247 /// @param ignoresVEX_L - Instruction ignores VEX.L
248 void setTableFields(OpcodeType type,
249 InstructionContext insnContext,
251 const ModRMFilter &filter,
256 /// specForUID - Returns the instruction specifier for a given unique
257 /// instruction ID. Used when resolving collisions.
///
/// The specifier table grows on demand: when uid is not yet a valid index,
/// InstructionSpecifiers is resized to uid + 1 elements before the lookup,
/// so the returned reference always refers to an existing element.
/// Because std::vector::resize may reallocate its storage, a reference
/// obtained from an earlier call can be invalidated by a later call that
/// triggers growth.
///
259 /// @param uid - The unique ID of the instruction.
260 /// @return - A reference to the instruction specifier.
261 InstructionSpecifier& specForUID(InstrUID uid) {
// Extend the table so that uid becomes a valid index.
262 if (uid >= InstructionSpecifiers.size())
263 InstructionSpecifiers.resize(uid + 1);
265 return InstructionSpecifiers[uid];
268 // hasConflicts - Reports whether there were primary decode conflicts
269 // from any instructions added to the tables.
270 // @return - true if there were; false otherwise.
272 bool hasConflicts() {
277 } // namespace X86Disassembler