• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 //===- X86DisassemblerTables.h - Disassembler tables ------------*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file is part of the X86 Disassembler Emitter.
11 // It contains the interface of the disassembler tables.
12 // Documentation for the disassembler emitter in general can be found in
13 //  X86DisasemblerEmitter.h.
14 //
15 //===----------------------------------------------------------------------===//
16 
17 #ifndef X86DISASSEMBLERTABLES_H
18 #define X86DISASSEMBLERTABLES_H
19 
20 #include "X86DisassemblerShared.h"
21 #include "X86ModRMFilters.h"
22 #include "llvm/Support/raw_ostream.h"
23 #include <vector>
24 
25 namespace llvm {
26 
27 namespace X86Disassembler {
28 
29 /// DisassemblerTables - Encapsulates all the decode tables being generated by
30 ///   the table emitter.  Contains functions to populate the tables as well as
31 ///   to emit them as hierarchical C structures suitable for consumption by the
32 ///   runtime.
33 class DisassemblerTables {
34 private:
35   /// The decoder tables.  There is one for each opcode type:
36   /// [0] one-byte opcodes
37   /// [1] two-byte opcodes of the form 0f __
38   /// [2] three-byte opcodes of the form 0f 38 __
39   /// [3] three-byte opcodes of the form 0f 3a __
40   /// [4] three-byte opcodes of the form 0f a6 __
41   /// [5] three-byte opcodes of the form 0f a7 __
42   ContextDecision* Tables[6];
43 
44   /// The instruction information table
45   std::vector<InstructionSpecifier> InstructionSpecifiers;
46 
47   /// True if there are primary decode conflicts in the instruction set
48   bool HasConflicts;
49 
50   /// emitOneID - Emits a table entry for a single instruction entry, at the
51   ///   innermost level of the structure hierarchy.  The entry is printed out
52   ///   in the format "nnnn, /* MNEMONIC */" where nnnn is the ID in decimal,
53   ///   the comma is printed if addComma is true, and the menonic is the name
54   ///   of the instruction as listed in the LLVM tables.
55   ///
56   /// @param o        - The output stream to print the entry on.
57   /// @param i        - The indentation level for o.
58   /// @param id       - The unique ID of the instruction to print.
59   /// @param addComma - Whether or not to print a comma after the ID.  True if
60   ///                    additional items will follow.
61   void emitOneID(raw_ostream &o,
62                  uint32_t &i,
63                  InstrUID id,
64                  bool addComma) const;
65 
66   /// emitModRMDecision - Emits a table of entries corresponding to a single
67   ///   ModR/M decision.  Compacts the ModR/M decision if possible.  ModR/M
68   ///   decisions are printed as:
69   ///
70   ///   { /* struct ModRMDecision */
71   ///     TYPE,
72   ///     modRMTablennnn
73   ///   }
74   ///
75   ///   where nnnn is a unique ID for the corresponding table of IDs.
76   ///   TYPE indicates whether the table has one entry that is the same
77   ///   regardless of ModR/M byte, two entries - one for bytes 0x00-0xbf and one
78   ///   for bytes 0xc0-0xff -, or 256 entries, one for each possible byte.
79   ///   nnnn is the number of a table for looking up these values.  The tables
80   ///   are written separately so that tables consisting entirely of zeros will
81   ///   not be duplicated.  (These all have the name modRMEmptyTable.)  A table
82   ///   is printed as:
83   ///
84   ///   InstrUID modRMTablennnn[k] = {
85   ///     nnnn, /* MNEMONIC */
86   ///     ...
87   ///     nnnn /* MNEMONIC */
88   ///   };
89   ///
90   /// @param o1       - The output stream to print the ID table to.
91   /// @param o2       - The output stream to print the decision structure to.
92   /// @param i1       - The indentation level to use with stream o1.
93   /// @param i2       - The indentation level to use with stream o2.
94   /// @param decision - The ModR/M decision to emit.  This decision has 256
95   ///                   entries - emitModRMDecision decides how to compact it.
96   void emitModRMDecision(raw_ostream &o1,
97                          raw_ostream &o2,
98                          uint32_t &i1,
99                          uint32_t &i2,
100                          ModRMDecision &decision) const;
101 
102   /// emitOpcodeDecision - Emits an OpcodeDecision and all its subsidiary ModR/M
103   ///   decisions.  An OpcodeDecision is printed as:
104   ///
105   ///   { /* struct OpcodeDecision */
106   ///     /* 0x00 */
107   ///     { /* struct ModRMDecision */
108   ///       ...
109   ///     }
110   ///     ...
111   ///   }
112   ///
113   ///   where the ModRMDecision structure is printed as described in the
114   ///   documentation for emitModRMDecision().  emitOpcodeDecision() passes on a
115   ///   stream and indent level for the UID tables generated by
116   ///   emitModRMDecision(), but does not use them itself.
117   ///
118   /// @param o1       - The output stream to print the ID tables generated by
119   ///                   emitModRMDecision() to.
120   /// @param o2       - The output stream for the decision structure itself.
121   /// @param i1       - The indent level to use with stream o1.
122   /// @param i2       - The indent level to use with stream o2.
123   /// @param decision - The OpcodeDecision to emit along with its subsidiary
124   ///                    structures.
125   void emitOpcodeDecision(raw_ostream &o1,
126                           raw_ostream &o2,
127                           uint32_t &i1,
128                           uint32_t &i2,
129                           OpcodeDecision &decision) const;
130 
131   /// emitContextDecision - Emits a ContextDecision and all its subsidiary
132   ///   Opcode and ModRMDecisions.  A ContextDecision is printed as:
133   ///
134   ///   struct ContextDecision NAME = {
135   ///     { /* OpcodeDecisions */
136   ///       /* IC */
137   ///       { /* struct OpcodeDecision */
138   ///         ...
139   ///       },
140   ///       ...
141   ///     }
142   ///   }
143   ///
144   ///   NAME is the name of the ContextDecision (typically one of the four names
145   ///   ONEBYTE_SYM, TWOBYTE_SYM, THREEBYTE38_SYM, THREEBYTE3A_SYM,
146   ///   THREEBYTEA6_SYM, and THREEBYTEA7_SYM from
147   ///   X86DisassemblerDecoderCommon.h).
148   ///   IC is one of the contexts in InstructionContext.  There is an opcode
149   ///   decision for each possible context.
150   ///   The OpcodeDecision structures are printed as described in the
151   ///   documentation for emitOpcodeDecision.
152   ///
153   /// @param o1       - The output stream to print the ID tables generated by
154   ///                   emitModRMDecision() to.
155   /// @param o2       - The output stream to print the decision structure to.
156   /// @param i1       - The indent level to use with stream o1.
157   /// @param i2       - The indent level to use with stream o2.
158   /// @param decision - The ContextDecision to emit along with its subsidiary
159   ///                   structures.
160   /// @param name     - The name for the ContextDecision.
161   void emitContextDecision(raw_ostream &o1,
162                            raw_ostream &o2,
163                            uint32_t &i1,
164                            uint32_t &i2,
165                            ContextDecision &decision,
166                            const char* name) const;
167 
168   /// emitInstructionInfo - Prints the instruction specifier table, which has
169   ///   one entry for each instruction, and contains name and operand
170   ///   information.  This table is printed as:
171   ///
172   ///   struct InstructionSpecifier CONTEXTS_SYM[k] = {
173   ///     {
174   ///       /* nnnn */
175   ///       "MNEMONIC",
176   ///       0xnn,
177   ///       {
178   ///         {
179   ///           ENCODING,
180   ///           TYPE
181   ///         },
182   ///         ...
183   ///       }
184   ///     },
185   ///   };
186   ///
187   ///   k is the total number of instructions.
188   ///   nnnn is the ID of the current instruction (0-based).  This table
189   ///   includes entries for non-instructions like PHINODE.
190   ///   0xnn is the lowest possible opcode for the current instruction, used for
191   ///   AddRegFrm instructions to compute the operand's value.
192   ///   ENCODING and TYPE describe the encoding and type for a single operand.
193   ///
194   /// @param o  - The output stream to which the instruction table should be
195   ///             written.
196   /// @param i  - The indent level for use with the stream.
197   void emitInstructionInfo(raw_ostream &o, uint32_t &i) const;
198 
199   /// emitContextTable - Prints the table that is used to translate from an
200   ///   instruction attribute mask to an instruction context.  This table is
201   ///   printed as:
202   ///
203   ///   InstructionContext CONTEXTS_STR[256] = {
204   ///     IC, /* 0x00 */
205   ///     ...
206   ///   };
207   ///
208   ///   IC is the context corresponding to the mask 0x00, and there are 256
209   ///   possible masks.
210   ///
211   /// @param o  - The output stream to which the context table should be written.
212   /// @param i  - The indent level for use with the stream.
213   void emitContextTable(raw_ostream &o, uint32_t &i) const;
214 
215   /// emitContextDecisions - Prints all four ContextDecision structures using
216   ///   emitContextDecision().
217   ///
218   /// @param o1 - The output stream to print the ID tables generated by
219   ///             emitModRMDecision() to.
220   /// @param o2 - The output stream to print the decision structures to.
221   /// @param i1 - The indent level to use with stream o1.
222   /// @param i2 - The indent level to use with stream o2.
223   void emitContextDecisions(raw_ostream &o1,
224                             raw_ostream &o2,
225                             uint32_t &i1,
226                             uint32_t &i2) const;
227 
228   /// setTableFields - Uses a ModRMFilter to set the appropriate entries in a
229   ///   ModRMDecision to refer to a particular instruction ID.
230   ///
231   /// @param decision - The ModRMDecision to populate.
232   /// @param filter   - The filter to use in deciding which entries to populate.
233   /// @param uid      - The unique ID to set matching entries to.
234   /// @param opcode   - The opcode of the instruction, for error reporting.
235   void setTableFields(ModRMDecision &decision,
236                       const ModRMFilter &filter,
237                       InstrUID uid,
238                       uint8_t opcode);
239 public:
240   /// Constructor - Allocates space for the class decisions and clears them.
241   DisassemblerTables();
242 
243   ~DisassemblerTables();
244 
245   /// emit - Emits the instruction table, context table, and class decisions.
246   ///
247   /// @param o  - The output stream to print the tables to.
248   void emit(raw_ostream &o) const;
249 
250   /// setTableFields - Uses the opcode type, instruction context, opcode, and a
251   ///   ModRMFilter as criteria to set a particular set of entries in the
252   ///   decode tables to point to a specific uid.
253   ///
254   /// @param type         - The opcode type (ONEBYTE, TWOBYTE, etc.)
255   /// @param insnContext  - The context to use (IC, IC_64BIT, etc.)
256   /// @param opcode       - The last byte of the opcode (not counting any escape
257   ///                       or extended opcodes).
258   /// @param filter       - The ModRMFilter that decides which ModR/M byte values
259   ///                       correspond to the desired instruction.
260   /// @param uid          - The unique ID of the instruction.
261   /// @param is32bit      - Instructon is only 32-bit
262   /// @param ignoresVEX_L - Instruction ignores VEX.L
263   void setTableFields(OpcodeType type,
264                       InstructionContext insnContext,
265                       uint8_t opcode,
266                       const ModRMFilter &filter,
267                       InstrUID uid,
268                       bool is32bit,
269                       bool ignoresVEX_L);
270 
271   /// specForUID - Returns the instruction specifier for a given unique
272   ///   instruction ID.  Used when resolving collisions.
273   ///
274   /// @param uid  - The unique ID of the instruction.
275   /// @return     - A reference to the instruction specifier.
specForUID(InstrUID uid)276   InstructionSpecifier& specForUID(InstrUID uid) {
277     if (uid >= InstructionSpecifiers.size())
278       InstructionSpecifiers.resize(uid + 1);
279 
280     return InstructionSpecifiers[uid];
281   }
282 
283   // hasConflicts - Reports whether there were primary decode conflicts
284   //   from any instructions added to the tables.
285   // @return  - true if there were; false otherwise.
286 
hasConflicts()287   bool hasConflicts() {
288     return HasConflicts;
289   }
290 };
291 
292 } // namespace X86Disassembler
293 
294 } // namespace llvm
295 
296 #endif
297