Coverage Report

Created: 2026-05-30 06:22

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/capstonenext/MCInstPrinter.c
Line
Count
Source
1
/* Capstone Disassembly Engine */
2
/* By Rot127 <unisono@quyllur.org>, 2023 */
3
4
#include "MCInstPrinter.h"
5
#include "cs_priv.h"
6
#include <capstone/platform.h>
7
8
extern bool ARM_getFeatureBits(unsigned int mode, unsigned int feature);
9
extern bool PPC_getFeatureBits(unsigned int mode, unsigned int feature);
10
extern bool Mips_getFeatureBits(unsigned int mode, unsigned int feature);
11
extern bool AArch64_getFeatureBits(unsigned int mode, unsigned int feature);
12
extern bool TriCore_getFeatureBits(unsigned int mode, unsigned int feature);
13
extern bool Sparc_getFeatureBits(unsigned int mode, unsigned int feature);
14
extern bool RISCV_getFeatureBits(unsigned int mode, unsigned int feature);
15
16
static bool testFeatureBits(const MCInst *MI, uint32_t Value)
17
64.0k
{
18
64.0k
  assert(MI && MI->csh);
19
64.0k
  switch (MI->csh->arch) {
20
0
  default:
21
0
    assert(0 && "Not implemented for current arch.");
22
0
    return false;
23
0
#ifdef CAPSTONE_HAS_ARM
24
4.57k
  case CS_ARCH_ARM:
25
4.57k
    return ARM_getFeatureBits(MI->csh->mode, Value);
26
0
#endif
27
0
#ifdef CAPSTONE_HAS_POWERPC
28
569
  case CS_ARCH_PPC:
29
569
    return PPC_getFeatureBits(MI->csh->mode, Value);
30
0
#endif
31
0
#ifdef CAPSTONE_HAS_MIPS
32
9.61k
  case CS_ARCH_MIPS:
33
9.61k
    return Mips_getFeatureBits(MI->csh->mode, Value);
34
0
#endif
35
0
#ifdef CAPSTONE_HAS_AARCH64
36
47.7k
  case CS_ARCH_AARCH64:
37
47.7k
    return AArch64_getFeatureBits(MI->csh->mode, Value);
38
0
#endif
39
0
#ifdef CAPSTONE_HAS_TRICORE
40
0
  case CS_ARCH_TRICORE:
41
0
    return TriCore_getFeatureBits(MI->csh->mode, Value);
42
0
#endif
43
0
#ifdef CAPSTONE_HAS_SPARC
44
1.31k
  case CS_ARCH_SPARC:
45
1.31k
    return Sparc_getFeatureBits(MI->csh->mode, Value);
46
0
#endif
47
0
#ifdef CAPSTONE_HAS_RISCV
48
297
  case CS_ARCH_RISCV:
49
297
    return RISCV_getFeatureBits(MI->csh->mode, Value);
50
64.0k
#endif
51
64.0k
  }
52
64.0k
}
53
54
static bool matchAliasCondition(MCInst *MI, const MCRegisterInfo *MRI,
55
        unsigned *OpIdx, const AliasMatchingData *M,
56
        const AliasPatternCond *C,
57
        bool *OrPredicateResult)
58
698k
{
59
  // Feature tests are special, they don't consume operands.
60
698k
  if (C->Kind == AliasPatternCond_K_Feature)
61
9.38k
    return testFeatureBits(MI, C->Value);
62
689k
  if (C->Kind == AliasPatternCond_K_NegFeature)
63
6.55k
    return !testFeatureBits(MI, C->Value);
64
  // For feature tests where just one feature is required in a list, set the
65
  // predicate result bit to whether the expression will return true, and only
66
  // return the real result at the end of list marker.
67
682k
  if (C->Kind == AliasPatternCond_K_OrFeature) {
68
47.9k
    *OrPredicateResult |= testFeatureBits(MI, C->Value);
69
47.9k
    return true;
70
47.9k
  }
71
634k
  if (C->Kind == AliasPatternCond_K_OrNegFeature) {
72
143
    *OrPredicateResult |= !(testFeatureBits(MI, C->Value));
73
143
    return true;
74
143
  }
75
634k
  if (C->Kind == AliasPatternCond_K_EndOrFeatures) {
76
20.1k
    bool Res = *OrPredicateResult;
77
20.1k
    *OrPredicateResult = false;
78
20.1k
    return Res;
79
20.1k
  }
80
81
  // Get and consume an operand.
82
614k
  MCOperand *Opnd = MCInst_getOperand(MI, *OpIdx);
83
614k
  ++(*OpIdx);
84
85
  // Check the specific condition for the operand.
86
614k
  switch (C->Kind) {
87
0
  default:
88
0
    assert(0 && "invalid kind");
89
185k
  case AliasPatternCond_K_Imm:
90
    // Operand must be a specific immediate.
91
185k
    return MCOperand_isImm(Opnd) &&
92
185k
           MCOperand_getImm(Opnd) == (int32_t)C->Value;
93
76.2k
  case AliasPatternCond_K_Reg:
94
    // Operand must be a specific register.
95
76.2k
    return MCOperand_isReg(Opnd) &&
96
76.2k
           MCOperand_getReg(Opnd) == C->Value;
97
2.77k
  case AliasPatternCond_K_TiedReg:
98
    // Operand must match the register of another operand.
99
2.77k
    return MCOperand_isReg(Opnd) &&
100
2.77k
           MCOperand_getReg(Opnd) ==
101
2.77k
             MCOperand_getReg(
102
2.77k
               MCInst_getOperand(MI, C->Value));
103
256k
  case AliasPatternCond_K_RegClass:
104
    // Operand must be a register in this class. Value is a register class
105
    // id.
106
256k
    return MCOperand_isReg(Opnd) &&
107
256k
           MCRegisterClass_contains(
108
256k
             MCRegisterInfo_getRegClass(MRI, C->Value),
109
256k
             MCOperand_getReg(Opnd));
110
23.9k
  case AliasPatternCond_K_Custom:
111
    // Operand must match some custom criteria.
112
23.9k
    assert(M->ValidateMCOperand &&
113
23.9k
           "A custom validator should be set but isn't.");
114
23.9k
    return M->ValidateMCOperand(Opnd, C->Value);
115
70.1k
  case AliasPatternCond_K_Ignore:
116
    // Operand can be anything.
117
70.1k
    return true;
118
0
  case AliasPatternCond_K_Feature:
119
0
  case AliasPatternCond_K_NegFeature:
120
0
  case AliasPatternCond_K_OrFeature:
121
0
  case AliasPatternCond_K_OrNegFeature:
122
0
  case AliasPatternCond_K_EndOrFeatures:
123
0
    assert(0 && "handled earlier");
124
614k
  }
125
0
  return false;
126
614k
}
127
128
/// Check if PatternsForOpcode is all zero.
129
static inline bool validOpToPatter(const PatternsForOpcode *P)
130
157M
{
131
157M
  return !(P->Opcode == 0 && P->PatternStart == 0 && P->NumPatterns == 0);
132
157M
}
133
134
const char *matchAliasPatterns(MCInst *MI, const AliasMatchingData *M)
135
1.46M
{
136
  // TODO Rewrite to C
137
138
  // auto It = lower_bound(M.OpToPatterns, MI->getOpcode(),
139
  //                       [](const PatternsForOpcode &L, unsigned Opcode) {
140
  //                         return L.Opcode < Opcode;
141
  //                       });
142
  // if (It == M.OpToPatterns.end() || It->Opcode != MI->getOpcode())
143
  //   return nullptr;
144
145
  // Binary search by opcode. Return false if there are no aliases for this
146
  // opcode.
147
1.46M
  unsigned MIOpcode = MI->Opcode;
148
1.46M
  size_t i = 0;
149
1.46M
  uint32_t PatternOpcode = M->OpToPatterns[i].Opcode;
150
157M
  while (PatternOpcode < MIOpcode && validOpToPatter(&M->OpToPatterns[i]))
151
156M
    PatternOpcode = M->OpToPatterns[++i].Opcode;
152
1.46M
  if (PatternOpcode != MI->Opcode ||
153
127k
      !validOpToPatter(&M->OpToPatterns[i]))
154
1.34M
    return NULL;
155
156
  // // Try all patterns for this opcode.
157
127k
  uint32_t AsmStrOffset = ~0U;
158
127k
  const AliasPattern *Patterns =
159
127k
    M->Patterns + M->OpToPatterns[i].PatternStart;
160
127k
  for (const AliasPattern *P = Patterns;
161
359k
       P != Patterns + M->OpToPatterns[i].NumPatterns; ++P) {
162
    // Check operand count first.
163
280k
    if (MCInst_getNumOperands(MI) != P->NumOperands)
164
0
      return NULL;
165
166
    // Test all conditions for this pattern.
167
280k
    const AliasPatternCond *Conds =
168
280k
      M->PatternConds + P->AliasCondStart;
169
280k
    unsigned OpIdx = 0;
170
280k
    bool OrPredicateResult = false;
171
280k
    bool allMatch = true;
172
280k
    for (const AliasPatternCond *C = Conds;
173
746k
         C != Conds + P->NumConds; ++C) {
174
698k
      if (!matchAliasCondition(MI, MI->MRI, &OpIdx, M, C,
175
698k
             &OrPredicateResult)) {
176
232k
        allMatch = false;
177
232k
        break;
178
232k
      }
179
698k
    }
180
280k
    if (allMatch) {
181
47.6k
      AsmStrOffset = P->AsmStrOffset;
182
47.6k
      break;
183
47.6k
    }
184
280k
  }
185
  // If no alias matched, don't print an alias.
186
127k
  if (AsmStrOffset == ~0U)
187
79.7k
    return NULL;
188
189
  // Go to offset AsmStrOffset and use the null terminated string there. The
190
  // offset should point to the beginning of an alias string, so it should
191
  // either be zero or be preceded by a null byte.
192
47.6k
  return M->AsmStrings + AsmStrOffset;
193
127k
}
194
195
// TODO Add functionality to toggle the flag.
196
bool getUseMarkup(void)
197
7.43M
{
198
7.43M
  return false;
199
7.43M
}
200
201
/// Utility functions to make adding mark ups simpler.
202
const char *markup(const char *s)
203
7.29M
{
204
7.29M
  static const char *no_markup = "";
205
7.29M
  if (getUseMarkup())
206
0
    return s;
207
7.29M
  else
208
7.29M
    return no_markup;
209
7.29M
}
210
211
// binary search for encoding in IndexType array
212
// return -1 if not found, or index if found
213
unsigned int binsearch_IndexTypeEncoding(const struct IndexType *index,
214
           size_t size, uint16_t encoding)
215
78.9k
{
216
  // binary searching since the index is sorted in encoding order
217
78.9k
  size_t left, right, m;
218
219
78.9k
  right = size - 1;
220
221
78.9k
  if (encoding < index[0].encoding || encoding > index[right].encoding)
222
    // not found
223
12.8k
    return -1;
224
225
66.1k
  left = 0;
226
227
335k
  while (left <= right) {
228
312k
    m = (left + right) / 2;
229
312k
    if (encoding == index[m].encoding) {
230
      // LLVM actually uses lower_bound for the index table search
231
      // Here we need to check if a previous entry is of the same encoding
232
      // and return the first one.
233
42.4k
      while (m > 0 && encoding == index[m - 1].encoding)
234
0
        --m;
235
42.4k
      return m;
236
42.4k
    }
237
238
269k
    if (encoding < index[m].encoding)
239
96.0k
      right = m - 1;
240
173k
    else
241
173k
      left = m + 1;
242
269k
  }
243
244
  // not found
245
23.6k
  return -1;
246
66.1k
}
247
248
// binary search for encoding in IndexTypeStr array
249
// return -1 if not found, or index if found
250
unsigned int binsearch_IndexTypeStrEncoding(const struct IndexTypeStr *index,
251
              size_t size, const char *name)
252
1.24k
{
253
  // binary searching since the index is sorted in encoding order
254
1.24k
  size_t left, right, m;
255
256
1.24k
  right = size - 1;
257
258
1.24k
  int str_left_cmp = strcmp(name, index[0].name);
259
1.24k
  int str_right_cmp = strcmp(name, index[right].name);
260
1.24k
  if (str_left_cmp < 0 || str_right_cmp > 0)
261
    // not found
262
0
    return -1;
263
264
1.24k
  left = 0;
265
266
13.1k
  while (left <= right) {
267
13.0k
    m = (left + right) / 2;
268
13.0k
    if (strcmp(name, index[m].name) == 0) {
269
      // LLVM actually uses lower_bound for the index table search
270
      // Here we need to check if a previous entry is of the same encoding
271
      // and return the first one.
272
1.18k
      while (m > 0 && (strcmp(name, index[m - 1].name) == 0))
273
0
        --m;
274
1.18k
      return m;
275
1.18k
    }
276
277
11.8k
    if (strcmp(name, index[m].name) < 0)
278
5.41k
      right = m - 1;
279
6.47k
    else
280
6.47k
      left = m + 1;
281
11.8k
  }
282
283
  // not found
284
68
  return -1;
285
1.24k
}