/src/capstonenext/MCInstPrinter.c
Line | Count | Source (jump to first uncovered line) |
1 | | /* Capstone Disassembly Engine */ |
2 | | /* By Rot127 <unisono@quyllur.org>, 2023 */ |
3 | | |
4 | | #include "MCInstPrinter.h" |
5 | | #include "cs_priv.h" |
6 | | #include <capstone/platform.h> |
7 | | |
8 | | extern bool ARM_getFeatureBits(unsigned int mode, unsigned int feature); |
9 | | extern bool PPC_getFeatureBits(unsigned int mode, unsigned int feature); |
10 | | extern bool Mips_getFeatureBits(unsigned int mode, unsigned int feature); |
11 | | extern bool AArch64_getFeatureBits(unsigned int mode, unsigned int feature); |
12 | | extern bool TriCore_getFeatureBits(unsigned int mode, unsigned int feature); |
13 | | extern bool Sparc_getFeatureBits(unsigned int mode, unsigned int feature); |
14 | | |
15 | | static bool testFeatureBits(const MCInst *MI, uint32_t Value) |
16 | 97.6k | { |
17 | 97.6k | assert(MI && MI->csh); |
18 | 97.6k | switch (MI->csh->arch) { |
19 | 0 | default: |
20 | 0 | assert(0 && "Not implemented for current arch."); |
21 | 0 | return false; |
22 | 0 | #ifdef CAPSTONE_HAS_ARM |
23 | 6.06k | case CS_ARCH_ARM: |
24 | 6.06k | return ARM_getFeatureBits(MI->csh->mode, Value); |
25 | 0 | #endif |
26 | 0 | #ifdef CAPSTONE_HAS_POWERPC |
27 | 668 | case CS_ARCH_PPC: |
28 | 668 | return PPC_getFeatureBits(MI->csh->mode, Value); |
29 | 0 | #endif |
30 | 0 | #ifdef CAPSTONE_HAS_MIPS |
31 | 12.1k | case CS_ARCH_MIPS: |
32 | 12.1k | return Mips_getFeatureBits(MI->csh->mode, Value); |
33 | 0 | #endif |
34 | 0 | #ifdef CAPSTONE_HAS_AARCH64 |
35 | 75.7k | case CS_ARCH_AARCH64: |
36 | 75.7k | return AArch64_getFeatureBits(MI->csh->mode, Value); |
37 | 0 | #endif |
38 | 0 | #ifdef CAPSTONE_HAS_TRICORE |
39 | 0 | case CS_ARCH_TRICORE: |
40 | 0 | return TriCore_getFeatureBits(MI->csh->mode, Value); |
41 | 0 | #endif |
42 | 0 | #ifdef CAPSTONE_HAS_SPARC |
43 | 3.01k | case CS_ARCH_SPARC: |
44 | 3.01k | return Sparc_getFeatureBits(MI->csh->mode, Value); |
45 | 97.6k | #endif |
46 | 97.6k | } |
47 | 97.6k | } |
48 | | |
49 | | static bool matchAliasCondition(MCInst *MI, const MCRegisterInfo *MRI, |
50 | | unsigned *OpIdx, const AliasMatchingData *M, |
51 | | const AliasPatternCond *C, |
52 | | bool *OrPredicateResult) |
53 | 873k | { |
54 | | // Feature tests are special, they don't consume operands. |
55 | 873k | if (C->Kind == AliasPatternCond_K_Feature) |
56 | 12.4k | return testFeatureBits(MI, C->Value); |
57 | 860k | if (C->Kind == AliasPatternCond_K_NegFeature) |
58 | 9.04k | return !testFeatureBits(MI, C->Value); |
59 | | // For feature tests where just one feature is required in a list, set the |
60 | | // predicate result bit to whether the expression will return true, and only |
61 | | // return the real result at the end of list marker. |
62 | 851k | if (C->Kind == AliasPatternCond_K_OrFeature) { |
63 | 75.9k | *OrPredicateResult |= testFeatureBits(MI, C->Value); |
64 | 75.9k | return true; |
65 | 75.9k | } |
66 | 775k | if (C->Kind == AliasPatternCond_K_OrNegFeature) { |
67 | 196 | *OrPredicateResult |= !(testFeatureBits(MI, C->Value)); |
68 | 196 | return true; |
69 | 196 | } |
70 | 775k | if (C->Kind == AliasPatternCond_K_EndOrFeatures) { |
71 | 29.8k | bool Res = *OrPredicateResult; |
72 | 29.8k | *OrPredicateResult = false; |
73 | 29.8k | return Res; |
74 | 29.8k | } |
75 | | |
76 | | // Get and consume an operand. |
77 | 745k | MCOperand *Opnd = MCInst_getOperand(MI, *OpIdx); |
78 | 745k | ++(*OpIdx); |
79 | | |
80 | | // Check the specific condition for the operand. |
81 | 745k | switch (C->Kind) { |
82 | 0 | default: |
83 | 0 | assert(0 && "invalid kind"); |
84 | 260k | case AliasPatternCond_K_Imm: |
85 | | // Operand must be a specific immediate. |
86 | 260k | return MCOperand_isImm(Opnd) && |
87 | 260k | MCOperand_getImm(Opnd) == (int32_t)C->Value; |
88 | 47.4k | case AliasPatternCond_K_Reg: |
89 | | // Operand must be a specific register. |
90 | 47.4k | return MCOperand_isReg(Opnd) && |
91 | 47.4k | MCOperand_getReg(Opnd) == C->Value; |
92 | 2.26k | case AliasPatternCond_K_TiedReg: |
93 | | // Operand must match the register of another operand. |
94 | 2.26k | return MCOperand_isReg(Opnd) && |
95 | 2.26k | MCOperand_getReg(Opnd) == |
96 | 2.26k | MCOperand_getReg( |
97 | 2.26k | MCInst_getOperand(MI, C->Value)); |
98 | 308k | case AliasPatternCond_K_RegClass: |
99 | | // Operand must be a register in this class. Value is a register class |
100 | | // id. |
101 | 308k | return MCOperand_isReg(Opnd) && |
102 | 308k | MCRegisterClass_contains( |
103 | 308k | MCRegisterInfo_getRegClass(MRI, C->Value), |
104 | 308k | MCOperand_getReg(Opnd)); |
105 | 32.0k | case AliasPatternCond_K_Custom: |
106 | | // Operand must match some custom criteria. |
107 | 32.0k | assert(M->ValidateMCOperand && |
108 | 32.0k | "A custom validator should be set but isn't."); |
109 | 32.0k | return M->ValidateMCOperand(Opnd, C->Value); |
110 | 95.2k | case AliasPatternCond_K_Ignore: |
111 | | // Operand can be anything. |
112 | 95.2k | return true; |
113 | 0 | case AliasPatternCond_K_Feature: |
114 | 0 | case AliasPatternCond_K_NegFeature: |
115 | 0 | case AliasPatternCond_K_OrFeature: |
116 | 0 | case AliasPatternCond_K_OrNegFeature: |
117 | 0 | case AliasPatternCond_K_EndOrFeatures: |
118 | 0 | assert(0 && "handled earlier"); |
119 | 745k | } |
120 | 0 | return false; |
121 | 745k | } |
122 | | |
123 | | /// Check if PatternsForOpcode is all zero. |
124 | | static inline bool validOpToPatter(const PatternsForOpcode *P) |
125 | 183M | { |
126 | 183M | return !(P->Opcode == 0 && P->PatternStart == 0 && P->NumPatterns == 0); |
127 | 183M | } |
128 | | |
129 | | const char *matchAliasPatterns(MCInst *MI, const AliasMatchingData *M) |
130 | 1.55M | { |
131 | | // TODO Rewrite to C |
132 | | |
133 | | // auto It = lower_bound(M.OpToPatterns, MI->getOpcode(), |
134 | | // [](const PatternsForOpcode &L, unsigned Opcode) { |
135 | | // return L.Opcode < Opcode; |
136 | | // }); |
137 | | // if (It == M.OpToPatterns.end() || It->Opcode != MI->getOpcode()) |
138 | | // return nullptr; |
139 | | |
140 | | // Binary search by opcode. Return false if there are no aliases for this |
141 | | // opcode. |
142 | 1.55M | unsigned MIOpcode = MI->Opcode; |
143 | 1.55M | size_t i = 0; |
144 | 1.55M | uint32_t PatternOpcode = M->OpToPatterns[i].Opcode; |
145 | 184M | while (PatternOpcode < MIOpcode && validOpToPatter(&M->OpToPatterns[i])) |
146 | 182M | PatternOpcode = M->OpToPatterns[++i].Opcode; |
147 | 1.55M | if (PatternOpcode != MI->Opcode || |
148 | 1.55M | !validOpToPatter(&M->OpToPatterns[i])) |
149 | 1.41M | return NULL; |
150 | | |
151 | | // // Try all patterns for this opcode. |
152 | 139k | uint32_t AsmStrOffset = ~0U; |
153 | 139k | const AliasPattern *Patterns = |
154 | 139k | M->Patterns + M->OpToPatterns[i].PatternStart; |
155 | 139k | for (const AliasPattern *P = Patterns; |
156 | 435k | P != Patterns + M->OpToPatterns[i].NumPatterns; ++P) { |
157 | | // Check operand count first. |
158 | 349k | if (MCInst_getNumOperands(MI) != P->NumOperands) |
159 | 0 | return NULL; |
160 | | |
161 | | // Test all conditions for this pattern. |
162 | 349k | const AliasPatternCond *Conds = |
163 | 349k | M->PatternConds + P->AliasCondStart; |
164 | 349k | unsigned OpIdx = 0; |
165 | 349k | bool OrPredicateResult = false; |
166 | 349k | bool allMatch = true; |
167 | 349k | for (const AliasPatternCond *C = Conds; |
168 | 925k | C != Conds + P->NumConds; ++C) { |
169 | 873k | if (!matchAliasCondition(MI, MI->MRI, &OpIdx, M, C, |
170 | 873k | &OrPredicateResult)) { |
171 | 296k | allMatch = false; |
172 | 296k | break; |
173 | 296k | } |
174 | 873k | } |
175 | 349k | if (allMatch) { |
176 | 52.6k | AsmStrOffset = P->AsmStrOffset; |
177 | 52.6k | break; |
178 | 52.6k | } |
179 | 349k | } |
180 | | // If no alias matched, don't print an alias. |
181 | 139k | if (AsmStrOffset == ~0U) |
182 | 86.5k | return NULL; |
183 | | |
184 | | // Go to offset AsmStrOffset and use the null terminated string there. The |
185 | | // offset should point to the beginning of an alias string, so it should |
186 | | // either be zero or be preceded by a null byte. |
187 | 52.6k | return M->AsmStrings + AsmStrOffset; |
188 | 139k | } |
189 | | |
/// Tells the printers whether markup should be emitted.
/// The answer is currently fixed to false.
// TODO Add functionality to toggle the flag.
bool getUseMarkup(void)
{
	enum { USE_MARKUP = 0 };
	return USE_MARKUP != 0;
}
195 | | |
/// Helper that makes adding markup simpler: hands back s unchanged when
/// getUseMarkup() reports that markup is enabled, and the empty string
/// otherwise.
const char *markup(const char *s)
{
	return getUseMarkup() ? s : "";
}
205 | | |
206 | | // binary search for encoding in IndexType array |
207 | | // return -1 if not found, or index if found |
208 | | unsigned int binsearch_IndexTypeEncoding(const struct IndexType *index, |
209 | | size_t size, uint16_t encoding) |
210 | 111k | { |
211 | | // binary searching since the index is sorted in encoding order |
212 | 111k | size_t left, right, m; |
213 | | |
214 | 111k | right = size - 1; |
215 | | |
216 | 111k | if (encoding < index[0].encoding || encoding > index[right].encoding) |
217 | | // not found |
218 | 20.2k | return -1; |
219 | | |
220 | 91.2k | left = 0; |
221 | | |
222 | 431k | while (left <= right) { |
223 | 400k | m = (left + right) / 2; |
224 | 400k | if (encoding == index[m].encoding) { |
225 | | // LLVM actually uses lower_bound for the index table search |
226 | | // Here we need to check if a previous entry is of the same encoding |
227 | | // and return the first one. |
228 | 60.2k | while (m > 0 && encoding == index[m - 1].encoding) |
229 | 0 | --m; |
230 | 60.2k | return m; |
231 | 60.2k | } |
232 | | |
233 | 340k | if (encoding < index[m].encoding) |
234 | 128k | right = m - 1; |
235 | 211k | else |
236 | 211k | left = m + 1; |
237 | 340k | } |
238 | | |
239 | | // not found |
240 | 30.9k | return -1; |
241 | 91.2k | } |
242 | | |
243 | | // binary search for encoding in IndexTypeStr array |
244 | | // return -1 if not found, or index if found |
245 | | unsigned int binsearch_IndexTypeStrEncoding(const struct IndexTypeStr *index, |
246 | | size_t size, const char *name) |
247 | 1.10k | { |
248 | | // binary searching since the index is sorted in encoding order |
249 | 1.10k | size_t left, right, m; |
250 | | |
251 | 1.10k | right = size - 1; |
252 | | |
253 | 1.10k | int str_left_cmp = strcmp(name, index[0].name); |
254 | 1.10k | int str_right_cmp = strcmp(name, index[right].name); |
255 | 1.10k | if (str_left_cmp < 0 || str_right_cmp > 0) |
256 | | // not found |
257 | 0 | return -1; |
258 | | |
259 | 1.10k | left = 0; |
260 | | |
261 | 11.4k | while (left <= right) { |
262 | 11.4k | m = (left + right) / 2; |
263 | 11.4k | if (strcmp(name, index[m].name) == 0) { |
264 | | // LLVM actually uses lower_bound for the index table search |
265 | | // Here we need to check if a previous entry is of the same encoding |
266 | | // and return the first one. |
267 | 1.08k | while (m > 0 && (strcmp(name, index[m - 1].name) == 0)) |
268 | 0 | --m; |
269 | 1.08k | return m; |
270 | 1.08k | } |
271 | | |
272 | 10.3k | if (strcmp(name, index[m].name) < 0) |
273 | 4.73k | right = m - 1; |
274 | 5.62k | else |
275 | 5.62k | left = m + 1; |
276 | 10.3k | } |
277 | | |
278 | | // not found |
279 | 18 | return -1; |
280 | 1.10k | } |