1 //===- X86DisassemblerTables.h - Disassembler tables ------------*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file is part of the X86 Disassembler Emitter.
10 // It contains the interface of the disassembler tables.
11 // Documentation for the disassembler emitter in general can be found in
12 //  X86DisassemblerEmitter.h.
13 //
14 //===----------------------------------------------------------------------===//
15 
16 #ifndef LLVM_UTILS_TABLEGEN_X86DISASSEMBLERTABLES_H
17 #define LLVM_UTILS_TABLEGEN_X86DISASSEMBLERTABLES_H
18 
19 #include "X86DisassemblerShared.h"
20 #include "llvm/Support/X86DisassemblerDecoderCommon.h"
21 #include <map>
22 #include <memory>
23 #include <vector>
24 
25 namespace llvm {
26 class raw_ostream;
27 
28 namespace X86Disassembler {
29 
30 class ModRMFilter;
31 
32 /// DisassemblerTables - Encapsulates all the decode tables being generated by
33 ///   the table emitter.  Contains functions to populate the tables as well as
34 ///   to emit them as hierarchical C structures suitable for consumption by the
35 ///   runtime.
36 class DisassemblerTables {
37 private:
38   /// The decoder tables.  There is one for each opcode type:
39   /// [0] one-byte opcodes
40   /// [1] two-byte opcodes of the form 0f __
41   /// [2] three-byte opcodes of the form 0f 38 __
42   /// [3] three-byte opcodes of the form 0f 3a __
43   /// [4] XOP8 map opcode
44   /// [5] XOP9 map opcode
45   /// [6] XOPA map opcode
46   /// [7] 3dnow map opcode
47   /// [8] fixed length MAP4 opcode
48   /// [9] fixed length MAP5 opcode
49   /// [10] fixed length MAP6 opcode
50   /// [11] fixed length MAP7 opcode
51   std::unique_ptr<ContextDecision> Tables[12];
52 
53   // Table of ModRM encodings.
54   typedef std::map<std::vector<unsigned>, unsigned> ModRMMapTy;
55   mutable ModRMMapTy ModRMTable;
56 
57   /// The instruction information table
58   std::vector<InstructionSpecifier> InstructionSpecifiers;
59 
60   /// True if there are primary decode conflicts in the instruction set
61   bool HasConflicts;
62 
63   /// emitModRMDecision - Emits a table of entries corresponding to a single
64   ///   ModR/M decision.  Compacts the ModR/M decision if possible.  ModR/M
65   ///   decisions are printed as:
66   ///
67   ///   { /* struct ModRMDecision */
68   ///     TYPE,
69   ///     modRMTablennnn
70   ///   }
71   ///
72   ///   where nnnn is a unique ID for the corresponding table of IDs.
73   ///   TYPE indicates whether the table has one entry that is the same
74   ///   regardless of ModR/M byte, two entries - one for bytes 0x00-0xbf and one
75   ///   for bytes 0xc0-0xff -, or 256 entries, one for each possible byte.
76   ///   nnnn is the number of a table for looking up these values.  The tables
77   ///   are written separately so that tables consisting entirely of zeros will
78   ///   not be duplicated.  (These all have the name modRMEmptyTable.)  A table
79   ///   is printed as:
80   ///
81   ///   InstrUID modRMTablennnn[k] = {
82   ///     nnnn, /* MNEMONIC */
83   ///     ...
84   ///     nnnn /* MNEMONIC */
85   ///   };
86   ///
87   /// @param o1       - The output stream to print the ID table to.
88   /// @param o2       - The output stream to print the decision structure to.
89   /// @param i1       - The indentation level to use with stream o1.
90   /// @param i2       - The indentation level to use with stream o2.
91   /// @param ModRMTableNum - next table number for adding to ModRMTable.
92   /// @param decision - The ModR/M decision to emit.  This decision has 256
93   ///                   entries - emitModRMDecision decides how to compact it.
94   void emitModRMDecision(raw_ostream &o1, raw_ostream &o2,
95                          unsigned &i1, unsigned &i2, unsigned &ModRMTableNum,
96                          ModRMDecision &decision) const;
97 
98   /// emitOpcodeDecision - Emits an OpcodeDecision and all its subsidiary ModR/M
99   ///   decisions.  An OpcodeDecision is printed as:
100   ///
101   ///   { /* struct OpcodeDecision */
102   ///     /* 0x00 */
103   ///     { /* struct ModRMDecision */
104   ///       ...
105   ///     }
106   ///     ...
107   ///   }
108   ///
109   ///   where the ModRMDecision structure is printed as described in the
110   ///   documentation for emitModRMDecision().  emitOpcodeDecision() passes on a
111   ///   stream and indent level for the UID tables generated by
112   ///   emitModRMDecision(), but does not use them itself.
113   ///
114   /// @param o1       - The output stream to print the ID tables generated by
115   ///                   emitModRMDecision() to.
116   /// @param o2       - The output stream for the decision structure itself.
117   /// @param i1       - The indent level to use with stream o1.
118   /// @param i2       - The indent level to use with stream o2.
119   /// @param ModRMTableNum - next table number for adding to ModRMTable.
120   /// @param decision - The OpcodeDecision to emit along with its subsidiary
121   ///                    structures.
122   void emitOpcodeDecision(raw_ostream &o1, raw_ostream &o2,
123                           unsigned &i1, unsigned &i2, unsigned &ModRMTableNum,
124                           OpcodeDecision &decision) const;
125 
126   /// emitContextDecision - Emits a ContextDecision and all its subsidiary
127   ///   Opcode and ModRMDecisions.  A ContextDecision is printed as:
128   ///
129   ///   struct ContextDecision NAME = {
130   ///     { /* OpcodeDecisions */
131   ///       /* IC */
132   ///       { /* struct OpcodeDecision */
133   ///         ...
134   ///       },
135   ///       ...
136   ///     }
137   ///   }
138   ///
139   ///   NAME is the name of the ContextDecision (typically one of the four names
140   ///   ONEBYTE_SYM, TWOBYTE_SYM, THREEBYTE38_SYM, THREEBYTE3A_SYM from
141   ///   X86DisassemblerDecoderCommon.h).
142   ///   IC is one of the contexts in InstructionContext.  There is an opcode
143   ///   decision for each possible context.
144   ///   The OpcodeDecision structures are printed as described in the
145   ///   documentation for emitOpcodeDecision.
146   ///
147   /// @param o1       - The output stream to print the ID tables generated by
148   ///                   emitModRMDecision() to.
149   /// @param o2       - The output stream to print the decision structure to.
150   /// @param i1       - The indent level to use with stream o1.
151   /// @param i2       - The indent level to use with stream o2.
152   /// @param ModRMTableNum - next table number for adding to ModRMTable.
153   /// @param decision - The ContextDecision to emit along with its subsidiary
154   ///                   structures.
155   /// @param name     - The name for the ContextDecision.
156   void emitContextDecision(raw_ostream &o1, raw_ostream &o2,
157                            unsigned &i1, unsigned &i2, unsigned &ModRMTableNum,
158                            ContextDecision &decision, const char* name) const;
159 
160   /// emitInstructionInfo - Prints the instruction specifier table, which has
161   ///   one entry for each instruction, and contains name and operand
162   ///   information.  This table is printed as:
163   ///
164   ///   struct InstructionSpecifier CONTEXTS_SYM[k] = {
165   ///     {
166   ///       /* nnnn */
167   ///       "MNEMONIC",
168   ///       0xnn,
169   ///       {
170   ///         {
171   ///           ENCODING,
172   ///           TYPE
173   ///         },
174   ///         ...
175   ///       }
176   ///     },
177   ///   };
178   ///
179   ///   k is the total number of instructions.
180   ///   nnnn is the ID of the current instruction (0-based).  This table
181   ///   includes entries for non-instructions like PHINODE.
182   ///   0xnn is the lowest possible opcode for the current instruction, used for
183   ///   AddRegFrm instructions to compute the operand's value.
184   ///   ENCODING and TYPE describe the encoding and type for a single operand.
185   ///
186   /// @param o  - The output stream to which the instruction table should be
187   ///             written.
188   /// @param i  - The indent level for use with the stream.
189   void emitInstructionInfo(raw_ostream &o, unsigned &i) const;
190 
191   /// emitContextTable - Prints the table that is used to translate from an
192   ///   instruction attribute mask to an instruction context.  This table is
193   ///   printed as:
194   ///
195   ///   InstructionContext CONTEXTS_STR[256] = {
196   ///     IC, /* 0x00 */
197   ///     ...
198   ///   };
199   ///
200   ///   IC is the context corresponding to the mask 0x00, and there are 256
201   ///   possible masks.
202   ///
203   /// @param o  - The output stream to which the context table should be written.
204   /// @param i  - The indent level for use with the stream.
205   void emitContextTable(raw_ostream &o, uint32_t &i) const;
206 
207   /// emitContextDecisions - Prints all four ContextDecision structures using
208   ///   emitContextDecision().
209   ///
210   /// @param o1 - The output stream to print the ID tables generated by
211   ///             emitModRMDecision() to.
212   /// @param o2 - The output stream to print the decision structures to.
213   /// @param i1 - The indent level to use with stream o1.
214   /// @param i2 - The indent level to use with stream o2.
215   /// @param ModRMTableNum - next table number for adding to ModRMTable.
216   void emitContextDecisions(raw_ostream &o1, raw_ostream &o2,
217                             unsigned &i1, unsigned &i2,
218                             unsigned &ModRMTableNum) const;
219 
220   /// setTableFields - Uses a ModRMFilter to set the appropriate entries in a
221   ///   ModRMDecision to refer to a particular instruction ID.
222   ///
223   /// @param decision - The ModRMDecision to populate.
224   /// @param filter   - The filter to use in deciding which entries to populate.
225   /// @param uid      - The unique ID to set matching entries to.
226   /// @param opcode   - The opcode of the instruction, for error reporting.
227   void setTableFields(ModRMDecision &decision,
228                       const ModRMFilter &filter,
229                       InstrUID uid,
230                       uint8_t opcode);
231 public:
232   /// Constructor - Allocates space for the class decisions and clears them.
233   DisassemblerTables();
234 
235   ~DisassemblerTables();
236 
237   /// emit - Emits the instruction table, context table, and class decisions.
238   ///
239   /// @param o  - The output stream to print the tables to.
240   void emit(raw_ostream &o) const;
241 
242   /// setTableFields - Uses the opcode type, instruction context, opcode, and a
243   ///   ModRMFilter as criteria to set a particular set of entries in the
244   ///   decode tables to point to a specific uid.
245   ///
246   /// @param type         - The opcode type (ONEBYTE, TWOBYTE, etc.)
247   /// @param insnContext  - The context to use (IC, IC_64BIT, etc.)
248   /// @param opcode       - The last byte of the opcode (not counting any escape
249   ///                       or extended opcodes).
250   /// @param filter       - The ModRMFilter that decides which ModR/M byte values
251   ///                       correspond to the desired instruction.
252   /// @param uid          - The unique ID of the instruction.
253   /// @param is32bit      - Instructon is only 32-bit
254   /// @param noPrefix     - Instruction record has no prefix.
255   /// @param ignoresVEX_L - Instruction ignores VEX.L
256   /// @param ignoresVEX_W - Instruction ignores VEX.W
257   /// @param AddrSize     - Instructions address size 16/32/64. 0 is unspecified
258   void setTableFields(OpcodeType type,
259                       InstructionContext insnContext,
260                       uint8_t opcode,
261                       const ModRMFilter &filter,
262                       InstrUID uid,
263                       bool is32bit,
264                       bool noPrefix,
265                       bool ignoresVEX_L,
266                       bool ignoresVEX_W,
267                       unsigned AddrSize);
268 
269   /// specForUID - Returns the instruction specifier for a given unique
270   ///   instruction ID.  Used when resolving collisions.
271   ///
272   /// @param uid  - The unique ID of the instruction.
273   /// @return     - A reference to the instruction specifier.
274   InstructionSpecifier& specForUID(InstrUID uid) {
275     if (uid >= InstructionSpecifiers.size())
276       InstructionSpecifiers.resize(uid + 1);
277 
278     return InstructionSpecifiers[uid];
279   }
280 
281   // hasConflicts - Reports whether there were primary decode conflicts
282   //   from any instructions added to the tables.
283   // @return  - true if there were; false otherwise.
284 
285   bool hasConflicts() {
286     return HasConflicts;
287   }
288 };
289 
290 } // namespace X86Disassembler
291 
292 } // namespace llvm
293 
294 #endif
295