/src/capstonenext/MCInstPrinter.c
Line | Count | Source (jump to first uncovered line) |
1 | | /* Capstone Disassembly Engine */ |
2 | | /* By Rot127 <unisono@quyllur.org>, 2023 */ |
3 | | |
4 | | #include "MCInstPrinter.h" |
5 | | #include "cs_priv.h" |
6 | | #include <capstone/platform.h> |
7 | | |
8 | | extern bool ARM_getFeatureBits(unsigned int mode, unsigned int feature); |
9 | | extern bool PPC_getFeatureBits(unsigned int mode, unsigned int feature); |
10 | | extern bool Mips_getFeatureBits(unsigned int mode, unsigned int feature); |
11 | | extern bool AArch64_getFeatureBits(unsigned int mode, unsigned int feature); |
12 | | extern bool TriCore_getFeatureBits(unsigned int mode, unsigned int feature); |
13 | | extern bool Sparc_getFeatureBits(unsigned int mode, unsigned int feature); |
14 | | |
15 | | static bool testFeatureBits(const MCInst *MI, uint32_t Value) |
16 | 58.8k | { |
17 | 58.8k | assert(MI && MI->csh); |
18 | 58.8k | switch (MI->csh->arch) { |
19 | 0 | default: |
20 | 0 | assert(0 && "Not implemented for current arch."); |
21 | 0 | return false; |
22 | 0 | #ifdef CAPSTONE_HAS_ARM |
23 | 3.38k | case CS_ARCH_ARM: |
24 | 3.38k | return ARM_getFeatureBits(MI->csh->mode, Value); |
25 | 0 | #endif |
26 | 0 | #ifdef CAPSTONE_HAS_POWERPC |
27 | 615 | case CS_ARCH_PPC: |
28 | 615 | return PPC_getFeatureBits(MI->csh->mode, Value); |
29 | 0 | #endif |
30 | 0 | #ifdef CAPSTONE_HAS_MIPS |
31 | 7.26k | case CS_ARCH_MIPS: |
32 | 7.26k | return Mips_getFeatureBits(MI->csh->mode, Value); |
33 | 0 | #endif |
34 | 0 | #ifdef CAPSTONE_HAS_AARCH64 |
35 | 45.6k | case CS_ARCH_AARCH64: |
36 | 45.6k | return AArch64_getFeatureBits(MI->csh->mode, Value); |
37 | 0 | #endif |
38 | 0 | #ifdef CAPSTONE_HAS_TRICORE |
39 | 0 | case CS_ARCH_TRICORE: |
40 | 0 | return TriCore_getFeatureBits(MI->csh->mode, Value); |
41 | 0 | #endif |
42 | 0 | #ifdef CAPSTONE_HAS_SPARC |
43 | 1.89k | case CS_ARCH_SPARC: |
44 | 1.89k | return Sparc_getFeatureBits(MI->csh->mode, Value); |
45 | 58.8k | #endif |
46 | 58.8k | } |
47 | 58.8k | } |
48 | | |
49 | | static bool matchAliasCondition(MCInst *MI, const MCRegisterInfo *MRI, |
50 | | unsigned *OpIdx, const AliasMatchingData *M, |
51 | | const AliasPatternCond *C, |
52 | | bool *OrPredicateResult) |
53 | 540k | { |
54 | | // Feature tests are special, they don't consume operands. |
55 | 540k | if (C->Kind == AliasPatternCond_K_Feature) |
56 | 7.77k | return testFeatureBits(MI, C->Value); |
57 | 532k | if (C->Kind == AliasPatternCond_K_NegFeature) |
58 | 4.91k | return !testFeatureBits(MI, C->Value); |
59 | | // For feature tests where just one feature is required in a list, set the |
60 | | // predicate result bit to whether the expression will return true, and only |
61 | | // return the real result at the end of list marker. |
62 | 527k | if (C->Kind == AliasPatternCond_K_OrFeature) { |
63 | 45.8k | *OrPredicateResult |= testFeatureBits(MI, C->Value); |
64 | 45.8k | return true; |
65 | 45.8k | } |
66 | 482k | if (C->Kind == AliasPatternCond_K_OrNegFeature) { |
67 | 231 | *OrPredicateResult |= !(testFeatureBits(MI, C->Value)); |
68 | 231 | return true; |
69 | 231 | } |
70 | 481k | if (C->Kind == AliasPatternCond_K_EndOrFeatures) { |
71 | 18.7k | bool Res = *OrPredicateResult; |
72 | 18.7k | *OrPredicateResult = false; |
73 | 18.7k | return Res; |
74 | 18.7k | } |
75 | | |
76 | | // Get and consume an operand. |
77 | 463k | MCOperand *Opnd = MCInst_getOperand(MI, *OpIdx); |
78 | 463k | ++(*OpIdx); |
79 | | |
80 | | // Check the specific condition for the operand. |
81 | 463k | switch (C->Kind) { |
82 | 0 | default: |
83 | 0 | assert(0 && "invalid kind"); |
84 | 175k | case AliasPatternCond_K_Imm: |
85 | | // Operand must be a specific immediate. |
86 | 175k | return MCOperand_isImm(Opnd) && |
87 | 175k | MCOperand_getImm(Opnd) == (int32_t)C->Value; |
88 | 28.7k | case AliasPatternCond_K_Reg: |
89 | | // Operand must be a specific register. |
90 | 28.7k | return MCOperand_isReg(Opnd) && |
91 | 28.7k | MCOperand_getReg(Opnd) == C->Value; |
92 | 1.66k | case AliasPatternCond_K_TiedReg: |
93 | | // Operand must match the register of another operand. |
94 | 1.66k | return MCOperand_isReg(Opnd) && |
95 | 1.66k | MCOperand_getReg(Opnd) == |
96 | 1.66k | MCOperand_getReg( |
97 | 1.66k | MCInst_getOperand(MI, C->Value)); |
98 | 187k | case AliasPatternCond_K_RegClass: |
99 | | // Operand must be a register in this class. Value is a register class |
100 | | // id. |
101 | 187k | return MCOperand_isReg(Opnd) && |
102 | 187k | MCRegisterClass_contains( |
103 | 187k | MCRegisterInfo_getRegClass(MRI, C->Value), |
104 | 187k | MCOperand_getReg(Opnd)); |
105 | 11.4k | case AliasPatternCond_K_Custom: |
106 | | // Operand must match some custom criteria. |
107 | 11.4k | assert(M->ValidateMCOperand && |
108 | 11.4k | "A custom validator should be set but isn't."); |
109 | 11.4k | return M->ValidateMCOperand(Opnd, C->Value); |
110 | 58.0k | case AliasPatternCond_K_Ignore: |
111 | | // Operand can be anything. |
112 | 58.0k | return true; |
113 | 0 | case AliasPatternCond_K_Feature: |
114 | 0 | case AliasPatternCond_K_NegFeature: |
115 | 0 | case AliasPatternCond_K_OrFeature: |
116 | 0 | case AliasPatternCond_K_OrNegFeature: |
117 | 0 | case AliasPatternCond_K_EndOrFeatures: |
118 | 0 | assert(0 && "handled earlier"); |
119 | 463k | } |
120 | 0 | return false; |
121 | 463k | } |
122 | | |
123 | | /// Check if PatternsForOpcode is all zero. |
124 | | static inline bool validOpToPatter(const PatternsForOpcode *P) |
125 | 115M | { |
126 | 115M | return !(P->Opcode == 0 && P->PatternStart == 0 && P->NumPatterns == 0); |
127 | 115M | } |
128 | | |
129 | | const char *matchAliasPatterns(MCInst *MI, const AliasMatchingData *M) |
130 | 967k | { |
131 | | // TODO Rewrite to C |
132 | | |
133 | | // auto It = lower_bound(M.OpToPatterns, MI->getOpcode(), |
134 | | // [](const PatternsForOpcode &L, unsigned Opcode) { |
135 | | // return L.Opcode < Opcode; |
136 | | // }); |
137 | | // if (It == M.OpToPatterns.end() || It->Opcode != MI->getOpcode()) |
138 | | // return nullptr; |
139 | | |
140 | | // Binary search by opcode. Return false if there are no aliases for this |
141 | | // opcode. |
142 | 967k | unsigned MIOpcode = MI->Opcode; |
143 | 967k | size_t i = 0; |
144 | 967k | uint32_t PatternOpcode = M->OpToPatterns[i].Opcode; |
145 | 115M | while (PatternOpcode < MIOpcode && validOpToPatter(&M->OpToPatterns[i])) |
146 | 114M | PatternOpcode = M->OpToPatterns[++i].Opcode; |
147 | 967k | if (PatternOpcode != MI->Opcode || |
148 | 967k | !validOpToPatter(&M->OpToPatterns[i])) |
149 | 881k | return NULL; |
150 | | |
151 | | // // Try all patterns for this opcode. |
152 | 86.0k | uint32_t AsmStrOffset = ~0U; |
153 | 86.0k | const AliasPattern *Patterns = |
154 | 86.0k | M->Patterns + M->OpToPatterns[i].PatternStart; |
155 | 86.0k | for (const AliasPattern *P = Patterns; |
156 | 273k | P != Patterns + M->OpToPatterns[i].NumPatterns; ++P) { |
157 | | // Check operand count first. |
158 | 221k | if (MCInst_getNumOperands(MI) != P->NumOperands) |
159 | 0 | return NULL; |
160 | | |
161 | | // Test all conditions for this pattern. |
162 | 221k | const AliasPatternCond *Conds = |
163 | 221k | M->PatternConds + P->AliasCondStart; |
164 | 221k | unsigned OpIdx = 0; |
165 | 221k | bool OrPredicateResult = false; |
166 | 221k | bool allMatch = true; |
167 | 221k | for (const AliasPatternCond *C = Conds; |
168 | 574k | C != Conds + P->NumConds; ++C) { |
169 | 540k | if (!matchAliasCondition(MI, MI->MRI, &OpIdx, M, C, |
170 | 540k | &OrPredicateResult)) { |
171 | 187k | allMatch = false; |
172 | 187k | break; |
173 | 187k | } |
174 | 540k | } |
175 | 221k | if (allMatch) { |
176 | 33.9k | AsmStrOffset = P->AsmStrOffset; |
177 | 33.9k | break; |
178 | 33.9k | } |
179 | 221k | } |
180 | | // If no alias matched, don't print an alias. |
181 | 86.0k | if (AsmStrOffset == ~0U) |
182 | 52.1k | return NULL; |
183 | | |
184 | | // Go to offset AsmStrOffset and use the null terminated string there. The |
185 | | // offset should point to the beginning of an alias string, so it should |
186 | | // either be zero or be preceded by a null byte. |
187 | 33.9k | return M->AsmStrings + AsmStrOffset; |
188 | 86.0k | } |
189 | | |
/// Reports whether markup should be emitted. Always false for now.
// TODO Add functionality to toggle the flag.
bool getUseMarkup(void)
{
	static const bool UseMarkup = false;
	return UseMarkup;
}
195 | | |
/// Utility function to make adding mark ups simpler.
/// Returns s unchanged when getUseMarkup() is true, otherwise an empty string.
const char *markup(const char *s)
{
	return getUseMarkup() ? s : "";
}
205 | | |
206 | | // binary search for encoding in IndexType array |
207 | | // return -1 if not found, or index if found |
208 | | unsigned int binsearch_IndexTypeEncoding(const struct IndexType *index, |
209 | | size_t size, uint16_t encoding) |
210 | 68.7k | { |
211 | | // binary searching since the index is sorted in encoding order |
212 | 68.7k | size_t left, right, m; |
213 | | |
214 | 68.7k | right = size - 1; |
215 | | |
216 | 68.7k | if (encoding < index[0].encoding || encoding > index[right].encoding) |
217 | | // not found |
218 | 14.8k | return -1; |
219 | | |
220 | 53.9k | left = 0; |
221 | | |
222 | 234k | while (left <= right) { |
223 | 217k | m = (left + right) / 2; |
224 | 217k | if (encoding == index[m].encoding) { |
225 | | // LLVM actually uses lower_bound for the index table search |
226 | | // Here we need to check if a previous entry is of the same encoding |
227 | | // and return the first one. |
228 | 37.6k | while (m > 0 && encoding == index[m - 1].encoding) |
229 | 0 | --m; |
230 | 37.6k | return m; |
231 | 37.6k | } |
232 | | |
233 | 180k | if (encoding < index[m].encoding) |
234 | 67.6k | right = m - 1; |
235 | 112k | else |
236 | 112k | left = m + 1; |
237 | 180k | } |
238 | | |
239 | | // not found |
240 | 16.3k | return -1; |
241 | 53.9k | } |
242 | | |
243 | | // binary search for encoding in IndexTypeStr array |
244 | | // return -1 if not found, or index if found |
245 | | unsigned int binsearch_IndexTypeStrEncoding(const struct IndexTypeStr *index, |
246 | | size_t size, const char *name) |
247 | 968 | { |
248 | | // binary searching since the index is sorted in encoding order |
249 | 968 | size_t left, right, m; |
250 | | |
251 | 968 | right = size - 1; |
252 | | |
253 | 968 | int str_left_cmp = strcmp(name, index[0].name); |
254 | 968 | int str_right_cmp = strcmp(name, index[right].name); |
255 | 968 | if (str_left_cmp < 0 || str_right_cmp > 0) |
256 | | // not found |
257 | 0 | return -1; |
258 | | |
259 | 968 | left = 0; |
260 | | |
261 | 10.1k | while (left <= right) { |
262 | 10.0k | m = (left + right) / 2; |
263 | 10.0k | if (strcmp(name, index[m].name) == 0) { |
264 | | // LLVM actually uses lower_bound for the index table search |
265 | | // Here we need to check if a previous entry is of the same encoding |
266 | | // and return the first one. |
267 | 962 | while (m > 0 && (strcmp(name, index[m - 1].name) == 0)) |
268 | 0 | --m; |
269 | 962 | return m; |
270 | 962 | } |
271 | | |
272 | 9.13k | if (strcmp(name, index[m].name) < 0) |
273 | 4.29k | right = m - 1; |
274 | 4.83k | else |
275 | 4.83k | left = m + 1; |
276 | 9.13k | } |
277 | | |
278 | | // not found |
279 | 6 | return -1; |
280 | 968 | } |