1 | //===- X86DisassemblerTables.h - Disassembler tables ------------*- C++ -*-===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | // |
9 | // This file is part of the X86 Disassembler Emitter. |
10 | // It contains the interface of the disassembler tables. |
11 | // Documentation for the disassembler emitter in general can be found in |
12 | // X86DisassemblerEmitter.h. |
13 | // |
14 | //===----------------------------------------------------------------------===// |
15 | |
16 | #ifndef LLVM_UTILS_TABLEGEN_X86DISASSEMBLERTABLES_H |
17 | #define LLVM_UTILS_TABLEGEN_X86DISASSEMBLERTABLES_H |
18 | |
19 | #include "X86DisassemblerShared.h" |
20 | #include "llvm/Support/X86DisassemblerDecoderCommon.h" |
21 | #include <map> |
22 | #include <memory> |
23 | #include <vector> |
24 | |
25 | namespace llvm { |
26 | class raw_ostream; |
27 | |
28 | namespace X86Disassembler { |
29 | |
30 | class ModRMFilter; |
31 | |
32 | /// DisassemblerTables - Encapsulates all the decode tables being generated by |
33 | /// the table emitter. Contains functions to populate the tables as well as |
34 | /// to emit them as hierarchical C structures suitable for consumption by the |
35 | /// runtime. |
36 | class DisassemblerTables { |
37 | private: |
38 | /// The decoder tables. There is one for each opcode type: |
39 | /// [0] one-byte opcodes |
40 | /// [1] two-byte opcodes of the form 0f __ |
41 | /// [2] three-byte opcodes of the form 0f 38 __ |
42 | /// [3] three-byte opcodes of the form 0f 3a __ |
43 | /// [4] XOP8 map opcode |
44 | /// [5] XOP9 map opcode |
45 | /// [6] XOPA map opcode |
46 | /// [7] 3dnow map opcode |
47 | /// [8] fixed length MAP4 opcode |
48 | /// [9] fixed length MAP5 opcode |
49 | /// [10] fixed length MAP6 opcode |
50 | /// [11] fixed length MAP7 opcode |
51 | std::unique_ptr<ContextDecision> Tables[12]; |
52 | |
53 | // Table of ModRM encodings. |
54 | typedef std::map<std::vector<unsigned>, unsigned> ModRMMapTy; |
55 | mutable ModRMMapTy ModRMTable; |
56 | |
57 | /// The instruction information table |
58 | std::vector<InstructionSpecifier> InstructionSpecifiers; |
59 | |
60 | /// True if there are primary decode conflicts in the instruction set |
61 | bool HasConflicts; |
62 | |
63 | /// emitModRMDecision - Emits a table of entries corresponding to a single |
64 | /// ModR/M decision. Compacts the ModR/M decision if possible. ModR/M |
65 | /// decisions are printed as: |
66 | /// |
67 | /// { /* struct ModRMDecision */ |
68 | /// TYPE, |
69 | /// modRMTablennnn |
70 | /// } |
71 | /// |
72 | /// where nnnn is a unique ID for the corresponding table of IDs. |
73 | /// TYPE indicates whether the table has one entry that is the same |
74 | /// regardless of ModR/M byte, two entries - one for bytes 0x00-0xbf and one |
75 | /// for bytes 0xc0-0xff -, or 256 entries, one for each possible byte. |
76 | /// nnnn is the number of a table for looking up these values. The tables |
77 | /// are written separately so that tables consisting entirely of zeros will |
78 | /// not be duplicated. (These all have the name modRMEmptyTable.) A table |
79 | /// is printed as: |
80 | /// |
81 | /// InstrUID modRMTablennnn[k] = { |
82 | /// nnnn, /* MNEMONIC */ |
83 | /// ... |
84 | /// nnnn /* MNEMONIC */ |
85 | /// }; |
86 | /// |
87 | /// @param o1 - The output stream to print the ID table to. |
88 | /// @param o2 - The output stream to print the decision structure to. |
89 | /// @param i1 - The indentation level to use with stream o1. |
90 | /// @param i2 - The indentation level to use with stream o2. |
91 | /// @param ModRMTableNum - next table number for adding to ModRMTable. |
92 | /// @param decision - The ModR/M decision to emit. This decision has 256 |
93 | /// entries - emitModRMDecision decides how to compact it. |
94 | void emitModRMDecision(raw_ostream &o1, raw_ostream &o2, unsigned &i1, |
95 | unsigned &i2, unsigned &ModRMTableNum, |
96 | ModRMDecision &decision) const; |
97 | |
98 | /// emitOpcodeDecision - Emits an OpcodeDecision and all its subsidiary ModR/M |
99 | /// decisions. An OpcodeDecision is printed as: |
100 | /// |
101 | /// { /* struct OpcodeDecision */ |
102 | /// /* 0x00 */ |
103 | /// { /* struct ModRMDecision */ |
104 | /// ... |
105 | /// } |
106 | /// ... |
107 | /// } |
108 | /// |
109 | /// where the ModRMDecision structure is printed as described in the |
110 | /// documentation for emitModRMDecision(). emitOpcodeDecision() passes on a |
111 | /// stream and indent level for the UID tables generated by |
112 | /// emitModRMDecision(), but does not use them itself. |
113 | /// |
114 | /// @param o1 - The output stream to print the ID tables generated by |
115 | /// emitModRMDecision() to. |
116 | /// @param o2 - The output stream for the decision structure itself. |
117 | /// @param i1 - The indent level to use with stream o1. |
118 | /// @param i2 - The indent level to use with stream o2. |
119 | /// @param ModRMTableNum - next table number for adding to ModRMTable. |
120 | /// @param decision - The OpcodeDecision to emit along with its subsidiary |
121 | /// structures. |
122 | void emitOpcodeDecision(raw_ostream &o1, raw_ostream &o2, unsigned &i1, |
123 | unsigned &i2, unsigned &ModRMTableNum, |
124 | OpcodeDecision &decision) const; |
125 | |
126 | /// emitContextDecision - Emits a ContextDecision and all its subsidiary |
127 | /// Opcode and ModRMDecisions. A ContextDecision is printed as: |
128 | /// |
129 | /// struct ContextDecision NAME = { |
130 | /// { /* OpcodeDecisions */ |
131 | /// /* IC */ |
132 | /// { /* struct OpcodeDecision */ |
133 | /// ... |
134 | /// }, |
135 | /// ... |
136 | /// } |
137 | /// } |
138 | /// |
139 | /// NAME is the name of the ContextDecision (typically one of the four names |
140 | /// ONEBYTE_SYM, TWOBYTE_SYM, THREEBYTE38_SYM, THREEBYTE3A_SYM from |
141 | /// X86DisassemblerDecoderCommon.h). |
142 | /// IC is one of the contexts in InstructionContext. There is an opcode |
143 | /// decision for each possible context. |
144 | /// The OpcodeDecision structures are printed as described in the |
145 | /// documentation for emitOpcodeDecision. |
146 | /// |
147 | /// @param o1 - The output stream to print the ID tables generated by |
148 | /// emitModRMDecision() to. |
149 | /// @param o2 - The output stream to print the decision structure to. |
150 | /// @param i1 - The indent level to use with stream o1. |
151 | /// @param i2 - The indent level to use with stream o2. |
152 | /// @param ModRMTableNum - next table number for adding to ModRMTable. |
153 | /// @param decision - The ContextDecision to emit along with its subsidiary |
154 | /// structures. |
155 | /// @param name - The name for the ContextDecision. |
156 | void emitContextDecision(raw_ostream &o1, raw_ostream &o2, unsigned &i1, |
157 | unsigned &i2, unsigned &ModRMTableNum, |
158 | ContextDecision &decision, const char *name) const; |
159 | |
160 | /// emitInstructionInfo - Prints the instruction specifier table, which has |
161 | /// one entry for each instruction, and contains name and operand |
162 | /// information. This table is printed as: |
163 | /// |
164 | /// struct InstructionSpecifier CONTEXTS_SYM[k] = { |
165 | /// { |
166 | /// /* nnnn */ |
167 | /// "MNEMONIC", |
168 | /// 0xnn, |
169 | /// { |
170 | /// { |
171 | /// ENCODING, |
172 | /// TYPE |
173 | /// }, |
174 | /// ... |
175 | /// } |
176 | /// }, |
177 | /// }; |
178 | /// |
179 | /// k is the total number of instructions. |
180 | /// nnnn is the ID of the current instruction (0-based). This table |
181 | /// includes entries for non-instructions like PHINODE. |
182 | /// 0xnn is the lowest possible opcode for the current instruction, used for |
183 | /// AddRegFrm instructions to compute the operand's value. |
184 | /// ENCODING and TYPE describe the encoding and type for a single operand. |
185 | /// |
186 | /// @param o - The output stream to which the instruction table should be |
187 | /// written. |
188 | /// @param i - The indent level for use with the stream. |
189 | void emitInstructionInfo(raw_ostream &o, unsigned &i) const; |
190 | |
191 | /// emitContextTable - Prints the table that is used to translate from an |
192 | /// instruction attribute mask to an instruction context. This table is |
193 | /// printed as: |
194 | /// |
195 | /// InstructionContext CONTEXTS_STR[256] = { |
196 | /// IC, /* 0x00 */ |
197 | /// ... |
198 | /// }; |
199 | /// |
200 | /// IC is the context corresponding to the mask 0x00, and there are 256 |
201 | /// possible masks. |
202 | /// |
203 | /// @param o - The output stream to which the context table should be |
204 | /// written. |
205 | /// @param i - The indent level for use with the stream. |
206 | void emitContextTable(raw_ostream &o, uint32_t &i) const; |
207 | |
208 | /// emitContextDecisions - Prints all four ContextDecision structures using |
209 | /// emitContextDecision(). |
210 | /// |
211 | /// @param o1 - The output stream to print the ID tables generated by |
212 | /// emitModRMDecision() to. |
213 | /// @param o2 - The output stream to print the decision structures to. |
214 | /// @param i1 - The indent level to use with stream o1. |
215 | /// @param i2 - The indent level to use with stream o2. |
216 | /// @param ModRMTableNum - next table number for adding to ModRMTable. |
217 | void emitContextDecisions(raw_ostream &o1, raw_ostream &o2, unsigned &i1, |
218 | unsigned &i2, unsigned &ModRMTableNum) const; |
219 | |
220 | /// setTableFields - Uses a ModRMFilter to set the appropriate entries in a |
221 | /// ModRMDecision to refer to a particular instruction ID. |
222 | /// |
223 | /// @param decision - The ModRMDecision to populate. |
224 | /// @param filter - The filter to use in deciding which entries to populate. |
225 | /// @param uid - The unique ID to set matching entries to. |
226 | /// @param opcode - The opcode of the instruction, for error reporting. |
227 | void setTableFields(ModRMDecision &decision, const ModRMFilter &filter, |
228 | InstrUID uid, uint8_t opcode); |
229 | |
230 | public: |
231 | /// Constructor - Allocates space for the class decisions and clears them. |
232 | DisassemblerTables(); |
233 | |
234 | ~DisassemblerTables(); |
235 | |
236 | /// emit - Emits the instruction table, context table, and class decisions. |
237 | /// |
238 | /// @param o - The output stream to print the tables to. |
239 | void emit(raw_ostream &o) const; |
240 | |
241 | /// setTableFields - Uses the opcode type, instruction context, opcode, and a |
242 | /// ModRMFilter as criteria to set a particular set of entries in the |
243 | /// decode tables to point to a specific uid. |
244 | /// |
245 | /// @param type - The opcode type (ONEBYTE, TWOBYTE, etc.) |
246 | /// @param insnContext - The context to use (IC, IC_64BIT, etc.) |
247 | /// @param opcode - The last byte of the opcode (not counting any escape |
248 | /// or extended opcodes). |
249 | /// @param filter - The ModRMFilter that decides which ModR/M byte |
250 | /// values |
251 | /// correspond to the desired instruction. |
252 | /// @param uid - The unique ID of the instruction. |
253 | /// @param is32bit - Instructon is only 32-bit |
254 | /// @param noPrefix - Instruction record has no prefix. |
255 | /// @param ignoresVEX_L - Instruction ignores VEX.L |
256 | /// @param ignoresVEX_W - Instruction ignores VEX.W |
257 | /// @param AddrSize - Instructions address size 16/32/64. 0 is unspecified |
258 | void setTableFields(OpcodeType type, InstructionContext insnContext, |
259 | uint8_t opcode, const ModRMFilter &filter, InstrUID uid, |
260 | bool is32bit, bool noPrefix, bool ignoresVEX_L, |
261 | bool ignoresVEX_W, unsigned AddrSize); |
262 | |
263 | /// specForUID - Returns the instruction specifier for a given unique |
264 | /// instruction ID. Used when resolving collisions. |
265 | /// |
266 | /// @param uid - The unique ID of the instruction. |
267 | /// @return - A reference to the instruction specifier. |
268 | InstructionSpecifier &specForUID(InstrUID uid) { |
269 | if (uid >= InstructionSpecifiers.size()) |
270 | InstructionSpecifiers.resize(new_size: uid + 1); |
271 | |
272 | return InstructionSpecifiers[uid]; |
273 | } |
274 | |
275 | // hasConflicts - Reports whether there were primary decode conflicts |
276 | // from any instructions added to the tables. |
277 | // @return - true if there were; false otherwise. |
278 | |
279 | bool hasConflicts() { return HasConflicts; } |
280 | }; |
281 | |
282 | } // namespace X86Disassembler |
283 | |
284 | } // namespace llvm |
285 | |
286 | #endif |
287 | |