Coverage Report

Created: 2025-10-14 06:42

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/capstonenext/arch/WASM/WASMDisassembler.c
Line
Count
Source
1
/* Capstone Disassembly Engine */
2
/* By Spike, xwings 2019 */
3
4
#include <string.h>
5
#include <stddef.h>
6
7
#include "WASMDisassembler.h"
8
#include "WASMMapping.h"
9
#include "../../cs_priv.h"
10
11
static const short opcodes[256] = {
12
  WASM_INS_UNREACHABLE,
13
  WASM_INS_NOP,
14
  WASM_INS_BLOCK,
15
  WASM_INS_LOOP,
16
  WASM_INS_IF,
17
  WASM_INS_ELSE,
18
  -1,
19
  -1,
20
  -1,
21
  -1,
22
  -1,
23
  WASM_INS_END,
24
  WASM_INS_BR,
25
  WASM_INS_BR_IF,
26
  WASM_INS_BR_TABLE,
27
  WASM_INS_RETURN,
28
  WASM_INS_CALL,
29
  WASM_INS_CALL_INDIRECT,
30
  -1,
31
  -1,
32
  -1,
33
  -1,
34
  -1,
35
  -1,
36
  -1,
37
  -1,
38
  WASM_INS_DROP,
39
  WASM_INS_SELECT,
40
  -1,
41
  -1,
42
  -1,
43
  -1,
44
  WASM_INS_GET_LOCAL,
45
  WASM_INS_SET_LOCAL,
46
  WASM_INS_TEE_LOCAL,
47
  WASM_INS_GET_GLOBAL,
48
  WASM_INS_SET_GLOBAL,
49
  -1,
50
  -1,
51
  -1,
52
  WASM_INS_I32_LOAD,
53
  WASM_INS_I64_LOAD,
54
  WASM_INS_F32_LOAD,
55
  WASM_INS_F64_LOAD,
56
  WASM_INS_I32_LOAD8_S,
57
  WASM_INS_I32_LOAD8_U,
58
  WASM_INS_I32_LOAD16_S,
59
  WASM_INS_I32_LOAD16_U,
60
  WASM_INS_I64_LOAD8_S,
61
  WASM_INS_I64_LOAD8_U,
62
  WASM_INS_I64_LOAD16_S,
63
  WASM_INS_I64_LOAD16_U,
64
  WASM_INS_I64_LOAD32_S,
65
  WASM_INS_I64_LOAD32_U,
66
  WASM_INS_I32_STORE,
67
  WASM_INS_I64_STORE,
68
  WASM_INS_F32_STORE,
69
  WASM_INS_F64_STORE,
70
  WASM_INS_I32_STORE8,
71
  WASM_INS_I32_STORE16,
72
  WASM_INS_I64_STORE8,
73
  WASM_INS_I64_STORE16,
74
  WASM_INS_I64_STORE32,
75
  WASM_INS_CURRENT_MEMORY,
76
  WASM_INS_GROW_MEMORY,
77
  WASM_INS_I32_CONST,
78
  WASM_INS_I64_CONST,
79
  WASM_INS_F32_CONST,
80
  WASM_INS_F64_CONST,
81
  WASM_INS_I32_EQZ,
82
  WASM_INS_I32_EQ,
83
  WASM_INS_I32_NE,
84
  WASM_INS_I32_LT_S,
85
  WASM_INS_I32_LT_U,
86
  WASM_INS_I32_GT_S,
87
  WASM_INS_I32_GT_U,
88
  WASM_INS_I32_LE_S,
89
  WASM_INS_I32_LE_U,
90
  WASM_INS_I32_GE_S,
91
  WASM_INS_I32_GE_U,
92
  WASM_INS_I64_EQZ,
93
  WASM_INS_I64_EQ,
94
  WASM_INS_I64_NE,
95
  WASM_INS_I64_LT_S,
96
  WASM_INS_I64_LT_U,
97
  WASN_INS_I64_GT_S,
98
  WASM_INS_I64_GT_U,
99
  WASM_INS_I64_LE_S,
100
  WASM_INS_I64_LE_U,
101
  WASM_INS_I64_GE_S,
102
  WASM_INS_I64_GE_U,
103
  WASM_INS_F32_EQ,
104
  WASM_INS_F32_NE,
105
  WASM_INS_F32_LT,
106
  WASM_INS_F32_GT,
107
  WASM_INS_F32_LE,
108
  WASM_INS_F32_GE,
109
  WASM_INS_F64_EQ,
110
  WASM_INS_F64_NE,
111
  WASM_INS_F64_LT,
112
  WASM_INS_F64_GT,
113
  WASM_INS_F64_LE,
114
  WASM_INS_F64_GE,
115
  WASM_INS_I32_CLZ,
116
  WASM_INS_I32_CTZ,
117
  WASM_INS_I32_POPCNT,
118
  WASM_INS_I32_ADD,
119
  WASM_INS_I32_SUB,
120
  WASM_INS_I32_MUL,
121
  WASM_INS_I32_DIV_S,
122
  WASM_INS_I32_DIV_U,
123
  WASM_INS_I32_REM_S,
124
  WASM_INS_I32_REM_U,
125
  WASM_INS_I32_AND,
126
  WASM_INS_I32_OR,
127
  WASM_INS_I32_XOR,
128
  WASM_INS_I32_SHL,
129
  WASM_INS_I32_SHR_S,
130
  WASM_INS_I32_SHR_U,
131
  WASM_INS_I32_ROTL,
132
  WASM_INS_I32_ROTR,
133
  WASM_INS_I64_CLZ,
134
  WASM_INS_I64_CTZ,
135
  WASM_INS_I64_POPCNT,
136
  WASM_INS_I64_ADD,
137
  WASM_INS_I64_SUB,
138
  WASM_INS_I64_MUL,
139
  WASM_INS_I64_DIV_S,
140
  WASM_INS_I64_DIV_U,
141
  WASM_INS_I64_REM_S,
142
  WASM_INS_I64_REM_U,
143
  WASM_INS_I64_AND,
144
  WASM_INS_I64_OR,
145
  WASM_INS_I64_XOR,
146
  WASM_INS_I64_SHL,
147
  WASM_INS_I64_SHR_S,
148
  WASM_INS_I64_SHR_U,
149
  WASM_INS_I64_ROTL,
150
  WASM_INS_I64_ROTR,
151
  WASM_INS_F32_ABS,
152
  WASM_INS_F32_NEG,
153
  WASM_INS_F32_CEIL,
154
  WASM_INS_F32_FLOOR,
155
  WASM_INS_F32_TRUNC,
156
  WASM_INS_F32_NEAREST,
157
  WASM_INS_F32_SQRT,
158
  WASM_INS_F32_ADD,
159
  WASM_INS_F32_SUB,
160
  WASM_INS_F32_MUL,
161
  WASM_INS_F32_DIV,
162
  WASM_INS_F32_MIN,
163
  WASM_INS_F32_MAX,
164
  WASM_INS_F32_COPYSIGN,
165
  WASM_INS_F64_ABS,
166
  WASM_INS_F64_NEG,
167
  WASM_INS_F64_CEIL,
168
  WASM_INS_F64_FLOOR,
169
  WASM_INS_F64_TRUNC,
170
  WASM_INS_F64_NEAREST,
171
  WASM_INS_F64_SQRT,
172
  WASM_INS_F64_ADD,
173
  WASM_INS_F64_SUB,
174
  WASM_INS_F64_MUL,
175
  WASM_INS_F64_DIV,
176
  WASM_INS_F64_MIN,
177
  WASM_INS_F64_MAX,
178
  WASM_INS_F64_COPYSIGN,
179
  WASM_INS_I32_WARP_I64,
180
  WASP_INS_I32_TRUNC_S_F32,
181
  WASM_INS_I32_TRUNC_U_F32,
182
  WASM_INS_I32_TRUNC_S_F64,
183
  WASM_INS_I32_TRUNC_U_F64,
184
  WASM_INS_I64_EXTEND_S_I32,
185
  WASM_INS_I64_EXTEND_U_I32,
186
  WASM_INS_I64_TRUNC_S_F32,
187
  WASM_INS_I64_TRUNC_U_F32,
188
  WASM_INS_I64_TRUNC_S_F64,
189
  WASM_INS_I64_TRUNC_U_F64,
190
  WASM_INS_F32_CONVERT_S_I32,
191
  WASM_INS_F32_CONVERT_U_I32,
192
  WASM_INS_F32_CONVERT_S_I64,
193
  WASM_INS_F32_CONVERT_U_I64,
194
  WASM_INS_F32_DEMOTE_F64,
195
  WASM_INS_F64_CONVERT_S_I32,
196
  WASM_INS_F64_CONVERT_U_I32,
197
  WASM_INS_F64_CONVERT_S_I64,
198
  WASM_INS_F64_CONVERT_U_I64,
199
  WASM_INS_F64_PROMOTE_F32,
200
  WASM_INS_I32_REINTERPRET_F32,
201
  WASM_INS_I64_REINTERPRET_F64,
202
  WASM_INS_F32_REINTERPRET_I32,
203
  WASM_INS_F64_REINTERPRET_I64,
204
  -1,
205
  -1,
206
  -1,
207
  -1,
208
  -1,
209
  -1,
210
  -1,
211
  -1,
212
  -1,
213
  -1,
214
  -1,
215
  -1,
216
  -1,
217
  -1,
218
  -1,
219
  -1,
220
  -1,
221
  -1,
222
  -1,
223
  -1,
224
  -1,
225
  -1,
226
  -1,
227
  -1,
228
  -1,
229
  -1,
230
  -1,
231
  -1,
232
  -1,
233
  -1,
234
  -1,
235
  -1,
236
  -1,
237
  -1,
238
  -1,
239
  -1,
240
  -1,
241
  -1,
242
  -1,
243
  -1,
244
  -1,
245
  -1,
246
  -1,
247
  -1,
248
  -1,
249
  -1,
250
  -1,
251
  -1,
252
  -1,
253
  -1,
254
  -1,
255
  -1,
256
  -1,
257
  -1,
258
  -1,
259
  -1,
260
  -1,
261
  -1,
262
  -1,
263
  -1,
264
  -1,
265
  -1,
266
  -1,
267
  -1,
268
};
269
270
// Decode an unsigned LEB128-style 32-bit integer.
// input  | code: first byte of the encoded value
//        | code_len: number of readable bytes starting at code
//        | leng: out; number of bytes consumed, or (size_t)-1 on error
// return | the decoded value, or 0 on error
//
// Errors: the input ends before a byte with a clear top bit is found, the
// encoding runs past 5 bytes, or the 5th byte carries bits above bit 31.
static uint32_t get_varuint32(const uint8_t *code, size_t code_len,
            size_t *leng)
{
  uint32_t value = 0;
  size_t pos = 0;

  for (;;) {
    uint8_t byte;

    if (pos >= code_len) {
      // ran out of input before the terminating byte
      goto fail;
    }

    byte = code[pos];
    if (pos > 4 || (pos == 4 && (byte & 0x7f) > 0x0f)) {
      // too many bytes, or payload would not fit in 32 bits
      goto fail;
    }

    // each byte contributes 7 payload bits, least-significant group first
    value |= (uint32_t)(byte & 0x7f) << (pos * 7);
    pos++;

    if ((byte & 0x80) == 0) {
      // top bit clear: this was the last byte
      *leng = pos;
      return value;
    }
  }

fail:
  *leng = (size_t)-1;
  return 0;
}
301
302
// Decode an unsigned LEB128-style 64-bit integer.
// input  | code: first byte of the encoded value
//        | code_len: number of readable bytes starting at code
//        | leng: out; number of bytes consumed, or (size_t)-1 on error
// return | the decoded value, or 0 on error
//
// Errors: the input ends before a byte with a clear top bit is found, the
// encoding runs past 10 bytes, or the 10th byte carries bits above bit 63.
static uint64_t get_varuint64(const uint8_t *code, size_t code_len,
            size_t *leng)
{
  uint64_t value = 0;
  size_t pos = 0;

  for (;;) {
    uint8_t byte;

    if (pos >= code_len) {
      // ran out of input before the terminating byte
      goto fail;
    }

    byte = code[pos];
    if (pos > 9 || (pos == 9 && (byte & 0x7f) > 0x01)) {
      // too many bytes, or payload would not fit in 64 bits
      goto fail;
    }

    // each byte contributes 7 payload bits, least-significant group first
    value |= (uint64_t)(byte & 0x7f) << (pos * 7);
    pos++;

    if ((byte & 0x80) == 0) {
      // top bit clear: this was the last byte
      *leng = pos;
      return value;
    }
  }

fail:
  *leng = (size_t)-1;
  return 0;
}
334
335
// Read a fixed-width 32-bit immediate.
// input  | code : pointer to 4 readable bytes (the caller checks the length)
//        | dest : where the decoded value is stored
// return | None
//
// WebAssembly stores fixed-width immediates in little-endian byte order, so
// the value is assembled byte by byte instead of copying raw memory; a raw
// copy would yield a byte-swapped result on big-endian hosts.
static void get_uint32(const uint8_t *code, uint32_t *dest)
{
  uint32_t value = 0;
  int i;

  // start from the most significant byte (highest address)
  for (i = 3; i >= 0; i--) {
    value = (value << 8) | code[i];
  }

  // memcpy keeps the store free of alignment assumptions about dest
  memcpy(dest, &value, sizeof(value));
}
342
343
// Read a fixed-width 64-bit immediate.
// input  | code : pointer to 8 readable bytes (the caller checks the length)
//        | dest : where the decoded value is stored
// return | None
//
// WebAssembly stores fixed-width immediates in little-endian byte order, so
// the value is assembled byte by byte instead of copying raw memory; a raw
// copy would yield a byte-swapped result on big-endian hosts.
static void get_uint64(const uint8_t *code, uint64_t *dest)
{
  uint64_t value = 0;
  int i;

  // start from the most significant byte (highest address)
  for (i = 7; i >= 0; i--) {
    value = (value << 8) | code[i];
  }

  // memcpy keeps the store free of alignment assumptions about dest
  memcpy(dest, &value, sizeof(value));
}
350
351
// Read a one-byte varint7 immediate.
// input  | code : pointer to the encoded byte
//        | code_len : number of readable bytes starting at code
//        | leng : out; 1 on success, (size_t)-1 when no byte is available
// return | -1 when no byte is available or when the byte is exactly 0x40,
//        | otherwise the low 7 bits of the byte
static int8_t get_varint7(const uint8_t *code, size_t code_len, size_t *leng)
{
  if (code_len == 0) {
    *leng = (size_t)-1;
    return -1;
  }

  *leng = 1;

  // 0x40 is mapped to -1; every other byte yields its low 7 bits unchanged
  return (code[0] == 0x40) ? (int8_t)-1 : (int8_t)(code[0] & 0x7f);
}
374
375
// input  | code : code pointer start from varuint32
376
//      | code_len : start from the code pointer to the end, how long is it
377
//      | param_size : pointer of the param size
378
//      | MI : Mcinst handler in this round of disasm
379
// return   | true/false if the function successfully finished
380
static bool read_varuint32(const uint8_t *code, size_t code_len,
381
         uint16_t *param_size, MCInst *MI)
382
3.89k
{
383
3.89k
  size_t len = 0;
384
3.89k
  uint32_t data;
385
386
3.89k
  data = get_varuint32(code, code_len, &len);
387
3.89k
  if (len == -1) {
388
18
    return false;
389
18
  }
390
391
3.87k
  if (MI->flat_insn->detail) {
392
3.87k
    MI->flat_insn->detail->wasm.op_count = 1;
393
3.87k
    MI->flat_insn->detail->wasm.operands[0].type =
394
3.87k
      WASM_OP_VARUINT32;
395
3.87k
    MI->flat_insn->detail->wasm.operands[0].size = len;
396
3.87k
    MI->flat_insn->detail->wasm.operands[0].varuint32 = data;
397
3.87k
  }
398
399
3.87k
  MI->wasm_data.size = len;
400
3.87k
  MI->wasm_data.type = WASM_OP_VARUINT32;
401
3.87k
  MI->wasm_data.uint32 = data;
402
3.87k
  *param_size = len;
403
404
3.87k
  return true;
405
3.89k
}
406
407
// input  | code : code pointer start from varuint64
408
//      | code_len : start from the code pointer to the end, how long is it
409
//      | param_size : pointer of the param size
410
//      | MI : Mcinst handler in this round of disasm
411
// return   | true/false if the function successfully finished
412
static bool read_varuint64(const uint8_t *code, size_t code_len,
413
         uint16_t *param_size, MCInst *MI)
414
297
{
415
297
  size_t len = 0;
416
297
  uint64_t data;
417
418
297
  data = get_varuint64(code, code_len, &len);
419
297
  if (len == -1) {
420
12
    return false;
421
12
  }
422
423
285
  if (MI->flat_insn->detail) {
424
285
    MI->flat_insn->detail->wasm.op_count = 1;
425
285
    MI->flat_insn->detail->wasm.operands[0].type =
426
285
      WASM_OP_VARUINT64;
427
285
    MI->flat_insn->detail->wasm.operands[0].size = len;
428
285
    MI->flat_insn->detail->wasm.operands[0].varuint64 = data;
429
285
  }
430
431
285
  MI->wasm_data.size = len;
432
285
  MI->wasm_data.type = WASM_OP_VARUINT64;
433
285
  MI->wasm_data.uint64 = data;
434
285
  *param_size = len;
435
436
285
  return true;
437
297
}
438
439
// input  | code : code pointer start from memoryimmediate
440
//      | code_len : start from the code pointer to the end, how long is it
441
//      | param_size : pointer of the param size (sum of two params)
442
//      | MI : Mcinst handler in this round of disasm
443
// return   | true/false if the function successfully finished
444
static bool read_memoryimmediate(const uint8_t *code, size_t code_len,
445
         uint16_t *param_size, MCInst *MI)
446
7.70k
{
447
7.70k
  size_t tmp, len = 0;
448
7.70k
  uint32_t data[2];
449
450
7.70k
  if (MI->flat_insn->detail) {
451
7.70k
    MI->flat_insn->detail->wasm.op_count = 2;
452
7.70k
  }
453
454
7.70k
  data[0] = get_varuint32(code, code_len, &tmp);
455
7.70k
  if (tmp == -1) {
456
49
    return false;
457
49
  }
458
459
7.65k
  if (MI->flat_insn->detail) {
460
7.65k
    MI->flat_insn->detail->wasm.operands[0].type =
461
7.65k
      WASM_OP_VARUINT32;
462
7.65k
    MI->flat_insn->detail->wasm.operands[0].size = tmp;
463
7.65k
    MI->flat_insn->detail->wasm.operands[0].varuint32 = data[0];
464
7.65k
  }
465
466
7.65k
  len = tmp;
467
7.65k
  data[1] = get_varuint32(&code[len], code_len - len, &tmp);
468
469
7.65k
  if (MI->flat_insn->detail) {
470
7.65k
    MI->flat_insn->detail->wasm.operands[1].type =
471
7.65k
      WASM_OP_VARUINT32;
472
7.65k
    MI->flat_insn->detail->wasm.operands[1].size = tmp;
473
7.65k
    MI->flat_insn->detail->wasm.operands[1].varuint32 = data[1];
474
7.65k
  }
475
476
7.65k
  len += tmp;
477
7.65k
  MI->wasm_data.size = len;
478
7.65k
  MI->wasm_data.type = WASM_OP_IMM;
479
7.65k
  MI->wasm_data.immediate[0] = data[0];
480
7.65k
  MI->wasm_data.immediate[1] = data[1];
481
7.65k
  *param_size = len;
482
483
7.65k
  return true;
484
7.70k
}
485
486
// input  | code : code pointer start from uint32
487
//      | code_len : start from the code pointer to the end, how long is it
488
//      | param_size : pointer of the param size
489
//      | MI : Mcinst handler in this round of disasm
490
// return   | true/false if the function successfully finished
491
static bool read_uint32(const uint8_t *code, size_t code_len,
492
      uint16_t *param_size, MCInst *MI)
493
633
{
494
633
  if (code_len < 4) {
495
6
    return false;
496
6
  }
497
498
627
  get_uint32(code, &(MI->wasm_data.uint32));
499
500
627
  if (MI->flat_insn->detail) {
501
627
    MI->flat_insn->detail->wasm.op_count = 1;
502
627
    MI->flat_insn->detail->wasm.operands[0].type = WASM_OP_UINT32;
503
627
    MI->flat_insn->detail->wasm.operands[0].size = 4;
504
627
    get_uint32(code,
505
627
         &(MI->flat_insn->detail->wasm.operands[0].uint32));
506
627
  }
507
508
627
  MI->wasm_data.size = 4;
509
627
  MI->wasm_data.type = WASM_OP_UINT32;
510
627
  *param_size = 4;
511
512
627
  return true;
513
633
}
514
515
// input  | code : code pointer start from uint64
516
//      | code_len : start from the code pointer to the end, how long is it
517
//      | param_size : pointer of the param size
518
//      | MI : Mcinst handler in this round of disasm
519
// return   | true/false if the function successfully finished
520
static bool read_uint64(const uint8_t *code, size_t code_len,
521
      uint16_t *param_size, MCInst *MI)
522
280
{
523
280
  if (code_len < 8) {
524
9
    return false;
525
9
  }
526
527
271
  get_uint64(code, &(MI->wasm_data.uint64));
528
529
271
  if (MI->flat_insn->detail) {
530
271
    MI->flat_insn->detail->wasm.op_count = 1;
531
271
    MI->flat_insn->detail->wasm.operands[0].type = WASM_OP_UINT64;
532
271
    MI->flat_insn->detail->wasm.operands[0].size = 8;
533
271
    get_uint64(code,
534
271
         &(MI->flat_insn->detail->wasm.operands[0].uint64));
535
271
  }
536
537
271
  MI->wasm_data.size = 8;
538
271
  MI->wasm_data.type = WASM_OP_UINT64;
539
271
  *param_size = 8;
540
541
271
  return true;
542
280
}
543
544
// input  | code : code pointer start from brtable
545
//      | code_len : start from the code pointer to the end, how long is it
546
//      | param_size : pointer of the param size (sum of all param)
547
//      | MI : Mcinst handler in this round of disasm
548
// return   | true/false if the function successfully finished
549
static bool read_brtable(const uint8_t *code, size_t code_len,
550
       uint16_t *param_size, MCInst *MI)
551
987
{
552
987
  uint32_t length, default_target;
553
987
  int tmp_len = 0, i;
554
987
  size_t var_len;
555
556
  // read length
557
987
  length = get_varuint32(code, code_len, &var_len);
558
987
  if (var_len == -1) {
559
9
    return false;
560
9
  }
561
562
978
  tmp_len += var_len;
563
978
  MI->wasm_data.brtable.length = length;
564
978
  if (length >= UINT32_MAX - tmp_len) {
565
    // integer overflow check
566
1
    return false;
567
1
  }
568
977
  if (code_len < tmp_len + length) {
569
    // safety check that we have minimum enough data to read
570
54
    return false;
571
54
  }
572
  // base address + 1 byte opcode + tmp_len for number of cases = start of targets
573
923
  MI->wasm_data.brtable.address = MI->address + 1 + tmp_len;
574
575
923
  if (MI->flat_insn->detail) {
576
923
    MI->flat_insn->detail->wasm.op_count = 1;
577
923
    MI->flat_insn->detail->wasm.operands[0].type = WASM_OP_BRTABLE;
578
923
    MI->flat_insn->detail->wasm.operands[0].brtable.length =
579
923
      MI->wasm_data.brtable.length;
580
923
    MI->flat_insn->detail->wasm.operands[0].brtable.address =
581
923
      MI->wasm_data.brtable.address;
582
923
  }
583
584
  // read data
585
9.48k
  for (i = 0; i < length; i++) {
586
8.58k
    if (code_len < tmp_len) {
587
0
      return false;
588
0
    }
589
590
8.58k
    get_varuint32(code + tmp_len, code_len - tmp_len, &var_len);
591
8.58k
    if (var_len == -1) {
592
16
      return false;
593
16
    }
594
595
8.56k
    tmp_len += var_len;
596
8.56k
  }
597
598
  // read default target
599
907
  default_target =
600
907
    get_varuint32(code + tmp_len, code_len - tmp_len, &var_len);
601
907
  if (var_len == -1) {
602
25
    return false;
603
25
  }
604
605
882
  MI->wasm_data.brtable.default_target = default_target;
606
882
  MI->wasm_data.type = WASM_OP_BRTABLE;
607
882
  *param_size = tmp_len + var_len;
608
609
882
  if (MI->flat_insn->detail) {
610
882
    MI->flat_insn->detail->wasm.operands[0].size = *param_size;
611
882
    MI->flat_insn->detail->wasm.operands[0].brtable.default_target =
612
882
      MI->wasm_data.brtable.default_target;
613
882
  }
614
615
882
  return true;
616
907
}
617
618
// input  | code : code pointer start from varint7
619
//      | code_len : start from the code pointer to the end, how long is it
620
//      | param_size : pointer of the param size
621
//      | MI : Mcinst handler in this round of disasm
622
// return   | true/false if the function successfully finished
623
static bool read_varint7(const uint8_t *code, size_t code_len,
624
       uint16_t *param_size, MCInst *MI)
625
1.04k
{
626
1.04k
  size_t len = 0;
627
628
1.04k
  MI->wasm_data.type = WASM_OP_INT7;
629
1.04k
  MI->wasm_data.int7 = get_varint7(code, code_len, &len);
630
1.04k
  if (len == -1) {
631
0
    return false;
632
0
  }
633
634
1.04k
  if (MI->flat_insn->detail) {
635
1.04k
    MI->flat_insn->detail->wasm.op_count = 1;
636
1.04k
    MI->flat_insn->detail->wasm.operands[0].type = WASM_OP_INT7;
637
1.04k
    MI->flat_insn->detail->wasm.operands[0].size = 1;
638
1.04k
    MI->flat_insn->detail->wasm.operands[0].int7 =
639
1.04k
      MI->wasm_data.int7;
640
1.04k
  }
641
642
1.04k
  *param_size = len;
643
644
1.04k
  return true;
645
1.04k
}
646
647
bool WASM_getInstruction(csh ud, const uint8_t *code, size_t code_len,
648
       MCInst *MI, uint16_t *size, uint64_t address,
649
       void *inst_info)
650
64.3k
{
651
64.3k
  unsigned char opcode;
652
64.3k
  uint16_t param_size;
653
654
64.3k
  if (code_len == 0)
655
0
    return false;
656
657
64.3k
  opcode = code[0];
658
64.3k
  if (opcodes[opcode] == -1) {
659
    // invalid opcode
660
258
    return false;
661
258
  }
662
663
  // valid opcode
664
64.0k
  MI->address = address;
665
64.0k
  MI->OpcodePub = MI->Opcode = opcode;
666
667
64.0k
  if (MI->flat_insn->detail) {
668
64.0k
    memset(MI->flat_insn->detail, 0,
669
64.0k
           offsetof(cs_detail, wasm) + sizeof(cs_wasm));
670
64.0k
    WASM_get_insn_id((cs_struct *)ud, MI->flat_insn, opcode);
671
64.0k
  }
672
673
  // setup groups
674
64.0k
  switch (opcode) {
675
0
  default:
676
0
    return false;
677
678
233
  case WASM_INS_I32_CONST:
679
233
    if (code_len == 1 ||
680
229
        !read_varuint32(&code[1], code_len - 1, &param_size, MI)) {
681
7
      return false;
682
7
    }
683
684
226
    if (MI->flat_insn->detail) {
685
226
      MI->flat_insn->detail->wasm.op_count = 1;
686
226
      MI->flat_insn->detail
687
226
        ->groups[MI->flat_insn->detail->groups_count] =
688
226
        WASM_GRP_NUMBERIC;
689
226
      MI->flat_insn->detail->groups_count++;
690
226
    }
691
692
226
    *size = param_size + 1;
693
694
226
    break;
695
696
300
  case WASM_INS_I64_CONST:
697
300
    if (code_len == 1 ||
698
297
        !read_varuint64(&code[1], code_len - 1, &param_size, MI)) {
699
15
      return false;
700
15
    }
701
702
285
    if (MI->flat_insn->detail) {
703
285
      MI->flat_insn->detail->wasm.op_count = 1;
704
285
      MI->flat_insn->detail
705
285
        ->groups[MI->flat_insn->detail->groups_count] =
706
285
        WASM_GRP_NUMBERIC;
707
285
      MI->flat_insn->detail->groups_count++;
708
285
    }
709
710
285
    *size = param_size + 1;
711
712
285
    break;
713
714
634
  case WASM_INS_F32_CONST:
715
634
    if (code_len == 1 ||
716
633
        !read_uint32(&code[1], code_len - 1, &param_size, MI)) {
717
7
      return false;
718
7
    }
719
720
627
    if (MI->flat_insn->detail) {
721
627
      MI->flat_insn->detail->wasm.op_count = 1;
722
627
      MI->flat_insn->detail
723
627
        ->groups[MI->flat_insn->detail->groups_count] =
724
627
        WASM_GRP_NUMBERIC;
725
627
      MI->flat_insn->detail->groups_count++;
726
627
    }
727
728
627
    *size = param_size + 1;
729
730
627
    break;
731
732
282
  case WASM_INS_F64_CONST:
733
282
    if (code_len == 1 ||
734
280
        !read_uint64(&code[1], code_len - 1, &param_size, MI)) {
735
11
      return false;
736
11
    }
737
738
271
    if (MI->flat_insn->detail) {
739
271
      MI->flat_insn->detail->wasm.op_count = 1;
740
271
      MI->flat_insn->detail
741
271
        ->groups[MI->flat_insn->detail->groups_count] =
742
271
        WASM_GRP_NUMBERIC;
743
271
      MI->flat_insn->detail->groups_count++;
744
271
    }
745
746
271
    *size = param_size + 1;
747
748
271
    break;
749
750
1.23k
  case WASM_INS_I32_EQZ:
751
1.46k
  case WASM_INS_I32_EQ:
752
1.69k
  case WASM_INS_I32_NE:
753
1.92k
  case WASM_INS_I32_LT_S:
754
2.14k
  case WASM_INS_I32_LT_U:
755
2.35k
  case WASM_INS_I32_GT_S:
756
2.58k
  case WASM_INS_I32_GT_U:
757
2.79k
  case WASM_INS_I32_LE_S:
758
3.02k
  case WASM_INS_I32_LE_U:
759
3.27k
  case WASM_INS_I32_GE_S:
760
3.52k
  case WASM_INS_I32_GE_U:
761
3.73k
  case WASM_INS_I64_EQZ:
762
4.11k
  case WASM_INS_I64_EQ:
763
4.32k
  case WASM_INS_I64_NE:
764
4.55k
  case WASM_INS_I64_LT_S:
765
4.77k
  case WASM_INS_I64_LT_U:
766
4.98k
  case WASN_INS_I64_GT_S:
767
5.22k
  case WASM_INS_I64_GT_U:
768
5.62k
  case WASM_INS_I64_LE_S:
769
5.85k
  case WASM_INS_I64_LE_U:
770
6.07k
  case WASM_INS_I64_GE_S:
771
6.28k
  case WASM_INS_I64_GE_U:
772
7.07k
  case WASM_INS_F32_EQ:
773
7.32k
  case WASM_INS_F32_NE:
774
8.38k
  case WASM_INS_F32_LT:
775
8.61k
  case WASM_INS_F32_GT:
776
8.82k
  case WASM_INS_F32_LE:
777
9.07k
  case WASM_INS_F32_GE:
778
9.32k
  case WASM_INS_F64_EQ:
779
9.74k
  case WASM_INS_F64_NE:
780
10.0k
  case WASM_INS_F64_LT:
781
10.5k
  case WASM_INS_F64_GT:
782
10.7k
  case WASM_INS_F64_LE:
783
11.0k
  case WASM_INS_F64_GE:
784
11.3k
  case WASM_INS_I32_CLZ:
785
11.5k
  case WASM_INS_I32_CTZ:
786
11.8k
  case WASM_INS_I32_POPCNT:
787
12.0k
  case WASM_INS_I32_ADD:
788
12.3k
  case WASM_INS_I32_SUB:
789
12.6k
  case WASM_INS_I32_MUL:
790
13.4k
  case WASM_INS_I32_DIV_S:
791
13.7k
  case WASM_INS_I32_DIV_U:
792
14.1k
  case WASM_INS_I32_REM_S:
793
14.4k
  case WASM_INS_I32_REM_U:
794
14.6k
  case WASM_INS_I32_AND:
795
14.9k
  case WASM_INS_I32_OR:
796
15.2k
  case WASM_INS_I32_XOR:
797
15.5k
  case WASM_INS_I32_SHL:
798
15.7k
  case WASM_INS_I32_SHR_S:
799
16.0k
  case WASM_INS_I32_SHR_U:
800
16.2k
  case WASM_INS_I32_ROTL:
801
16.8k
  case WASM_INS_I32_ROTR:
802
17.0k
  case WASM_INS_I64_CLZ:
803
17.3k
  case WASM_INS_I64_CTZ:
804
17.6k
  case WASM_INS_I64_POPCNT:
805
17.8k
  case WASM_INS_I64_ADD:
806
18.1k
  case WASM_INS_I64_SUB:
807
18.4k
  case WASM_INS_I64_MUL:
808
18.6k
  case WASM_INS_I64_DIV_S:
809
19.2k
  case WASM_INS_I64_DIV_U:
810
19.5k
  case WASM_INS_I64_REM_S:
811
20.1k
  case WASM_INS_I64_REM_U:
812
20.3k
  case WASM_INS_I64_AND:
813
20.6k
  case WASM_INS_I64_OR:
814
20.9k
  case WASM_INS_I64_XOR:
815
21.4k
  case WASM_INS_I64_SHL:
816
22.2k
  case WASM_INS_I64_SHR_S:
817
22.4k
  case WASM_INS_I64_SHR_U:
818
22.6k
  case WASM_INS_I64_ROTL:
819
22.9k
  case WASM_INS_I64_ROTR:
820
23.1k
  case WASM_INS_F32_ABS:
821
23.7k
  case WASM_INS_F32_NEG:
822
23.9k
  case WASM_INS_F32_CEIL:
823
24.2k
  case WASM_INS_F32_FLOOR:
824
24.4k
  case WASM_INS_F32_TRUNC:
825
24.8k
  case WASM_INS_F32_NEAREST:
826
25.1k
  case WASM_INS_F32_SQRT:
827
25.6k
  case WASM_INS_F32_ADD:
828
25.8k
  case WASM_INS_F32_SUB:
829
26.0k
  case WASM_INS_F32_MUL:
830
26.3k
  case WASM_INS_F32_DIV:
831
26.6k
  case WASM_INS_F32_MIN:
832
26.8k
  case WASM_INS_F32_MAX:
833
27.0k
  case WASM_INS_F32_COPYSIGN:
834
27.3k
  case WASM_INS_F64_ABS:
835
27.5k
  case WASM_INS_F64_NEG:
836
27.8k
  case WASM_INS_F64_CEIL:
837
28.0k
  case WASM_INS_F64_FLOOR:
838
28.3k
  case WASM_INS_F64_TRUNC:
839
28.5k
  case WASM_INS_F64_NEAREST:
840
28.7k
  case WASM_INS_F64_SQRT:
841
29.0k
  case WASM_INS_F64_ADD:
842
29.3k
  case WASM_INS_F64_SUB:
843
29.6k
  case WASM_INS_F64_MUL:
844
29.9k
  case WASM_INS_F64_DIV:
845
30.3k
  case WASM_INS_F64_MIN:
846
31.0k
  case WASM_INS_F64_MAX:
847
31.2k
  case WASM_INS_F64_COPYSIGN:
848
31.6k
  case WASM_INS_I32_WARP_I64:
849
31.8k
  case WASP_INS_I32_TRUNC_S_F32:
850
32.1k
  case WASM_INS_I32_TRUNC_U_F32:
851
32.7k
  case WASM_INS_I32_TRUNC_S_F64:
852
32.9k
  case WASM_INS_I32_TRUNC_U_F64:
853
33.2k
  case WASM_INS_I64_EXTEND_S_I32:
854
33.5k
  case WASM_INS_I64_EXTEND_U_I32:
855
33.7k
  case WASM_INS_I64_TRUNC_S_F32:
856
33.9k
  case WASM_INS_I64_TRUNC_U_F32:
857
34.2k
  case WASM_INS_I64_TRUNC_S_F64:
858
38.4k
  case WASM_INS_I64_TRUNC_U_F64:
859
38.7k
  case WASM_INS_F32_CONVERT_S_I32:
860
38.9k
  case WASM_INS_F32_CONVERT_U_I32:
861
39.3k
  case WASM_INS_F32_CONVERT_S_I64:
862
39.5k
  case WASM_INS_F32_CONVERT_U_I64:
863
39.8k
  case WASM_INS_F32_DEMOTE_F64:
864
40.0k
  case WASM_INS_F64_CONVERT_S_I32:
865
40.3k
  case WASM_INS_F64_CONVERT_U_I32:
866
40.5k
  case WASM_INS_F64_CONVERT_S_I64:
867
40.7k
  case WASM_INS_F64_CONVERT_U_I64:
868
41.0k
  case WASM_INS_F64_PROMOTE_F32:
869
41.2k
  case WASM_INS_I32_REINTERPRET_F32:
870
41.4k
  case WASM_INS_I64_REINTERPRET_F64:
871
41.6k
  case WASM_INS_F32_REINTERPRET_I32:
872
41.9k
  case WASM_INS_F64_REINTERPRET_I64:
873
41.9k
    MI->wasm_data.type = WASM_OP_NONE;
874
875
41.9k
    if (MI->flat_insn->detail) {
876
41.9k
      MI->flat_insn->detail->wasm.op_count = 0;
877
41.9k
      MI->flat_insn->detail
878
41.9k
        ->groups[MI->flat_insn->detail->groups_count] =
879
41.9k
        WASM_GRP_NUMBERIC;
880
41.9k
      MI->flat_insn->detail->groups_count++;
881
41.9k
    }
882
883
41.9k
    *size = 1;
884
885
41.9k
    break;
886
887
329
  case WASM_INS_DROP:
888
576
  case WASM_INS_SELECT:
889
576
    MI->wasm_data.type = WASM_OP_NONE;
890
891
576
    if (MI->flat_insn->detail) {
892
576
      MI->flat_insn->detail->wasm.op_count = 0;
893
576
      MI->flat_insn->detail
894
576
        ->groups[MI->flat_insn->detail->groups_count] =
895
576
        WASM_GRP_PARAMETRIC;
896
576
      MI->flat_insn->detail->groups_count++;
897
576
    }
898
899
576
    *size = 1;
900
901
576
    break;
902
903
533
  case WASM_INS_GET_LOCAL:
904
1.06k
  case WASM_INS_SET_LOCAL:
905
1.29k
  case WASM_INS_TEE_LOCAL:
906
1.62k
  case WASM_INS_GET_GLOBAL:
907
1.89k
  case WASM_INS_SET_GLOBAL:
908
1.89k
    if (code_len == 1 ||
909
1.87k
        !read_varuint32(&code[1], code_len - 1, &param_size, MI)) {
910
30
      return false;
911
30
    }
912
913
1.86k
    if (MI->flat_insn->detail) {
914
1.86k
      MI->flat_insn->detail->wasm.op_count = 1;
915
1.86k
      MI->flat_insn->detail
916
1.86k
        ->groups[MI->flat_insn->detail->groups_count] =
917
1.86k
        WASM_GRP_VARIABLE;
918
1.86k
      MI->flat_insn->detail->groups_count++;
919
1.86k
    }
920
921
1.86k
    *size = param_size + 1;
922
923
1.86k
    break;
924
925
236
  case WASM_INS_I32_LOAD:
926
804
  case WASM_INS_I64_LOAD:
927
1.05k
  case WASM_INS_F32_LOAD:
928
1.32k
  case WASM_INS_F64_LOAD:
929
1.86k
  case WASM_INS_I32_LOAD8_S:
930
2.15k
  case WASM_INS_I32_LOAD8_U:
931
2.40k
  case WASM_INS_I32_LOAD16_S:
932
2.71k
  case WASM_INS_I32_LOAD16_U:
933
3.37k
  case WASM_INS_I64_LOAD8_S:
934
3.73k
  case WASM_INS_I64_LOAD8_U:
935
4.00k
  case WASM_INS_I64_LOAD16_S:
936
4.27k
  case WASM_INS_I64_LOAD16_U:
937
4.54k
  case WASM_INS_I64_LOAD32_S:
938
4.95k
  case WASM_INS_I64_LOAD32_U:
939
5.74k
  case WASM_INS_I32_STORE:
940
5.96k
  case WASM_INS_I64_STORE:
941
6.34k
  case WASM_INS_F32_STORE:
942
6.58k
  case WASM_INS_F64_STORE:
943
6.91k
  case WASM_INS_I32_STORE8:
944
7.17k
  case WASM_INS_I32_STORE16:
945
7.38k
  case WASM_INS_I64_STORE8:
946
7.60k
  case WASM_INS_I64_STORE16:
947
7.81k
  case WASM_INS_I64_STORE32:
948
7.81k
    if (code_len == 1 ||
949
7.70k
        !read_memoryimmediate(&code[1], code_len - 1, &param_size,
950
7.70k
            MI)) {
951
167
      return false;
952
167
    }
953
954
7.65k
    if (MI->flat_insn->detail) {
955
7.65k
      MI->flat_insn->detail->wasm.op_count = 2;
956
7.65k
      MI->flat_insn->detail
957
7.65k
        ->groups[MI->flat_insn->detail->groups_count] =
958
7.65k
        WASM_GRP_MEMORY;
959
7.65k
      MI->flat_insn->detail->groups_count++;
960
7.65k
    }
961
962
7.65k
    *size = param_size + 1;
963
964
7.65k
    break;
965
966
255
  case WASM_INS_CURRENT_MEMORY:
967
535
  case WASM_INS_GROW_MEMORY:
968
535
    MI->wasm_data.type = WASM_OP_NONE;
969
970
535
    if (MI->flat_insn->detail) {
971
535
      MI->flat_insn->detail->wasm.op_count = 0;
972
535
      MI->flat_insn->detail
973
535
        ->groups[MI->flat_insn->detail->groups_count] =
974
535
        WASM_GRP_MEMORY;
975
535
      MI->flat_insn->detail->groups_count++;
976
535
    }
977
978
535
    *size = 1;
979
980
535
    break;
981
982
4.87k
  case WASM_INS_UNREACHABLE:
983
5.29k
  case WASM_INS_NOP:
984
5.57k
  case WASM_INS_ELSE:
985
5.81k
  case WASM_INS_END:
986
6.04k
  case WASM_INS_RETURN:
987
6.04k
    MI->wasm_data.type = WASM_OP_NONE;
988
989
6.04k
    if (MI->flat_insn->detail) {
990
6.04k
      MI->flat_insn->detail->wasm.op_count = 0;
991
6.04k
      MI->flat_insn->detail
992
6.04k
        ->groups[MI->flat_insn->detail->groups_count] =
993
6.04k
        WASM_GRP_CONTROL;
994
6.04k
      MI->flat_insn->detail->groups_count++;
995
6.04k
    }
996
997
6.04k
    *size = 1;
998
999
6.04k
    break;
1000
1001
228
  case WASM_INS_BLOCK:
1002
774
  case WASM_INS_LOOP:
1003
1.05k
  case WASM_INS_IF:
1004
1.05k
    if (code_len == 1 ||
1005
1.04k
        !read_varint7(&code[1], code_len - 1, &param_size, MI)) {
1006
17
      return false;
1007
17
    }
1008
1009
1.04k
    if (MI->flat_insn->detail) {
1010
1.04k
      MI->flat_insn->detail->wasm.op_count = 1;
1011
1.04k
      MI->flat_insn->detail
1012
1.04k
        ->groups[MI->flat_insn->detail->groups_count] =
1013
1.04k
        WASM_GRP_CONTROL;
1014
1.04k
      MI->flat_insn->detail->groups_count++;
1015
1.04k
    }
1016
1017
1.04k
    *size = param_size + 1;
1018
1019
1.04k
    break;
1020
1021
339
  case WASM_INS_BR:
1022
1.28k
  case WASM_INS_BR_IF:
1023
1.57k
  case WASM_INS_CALL:
1024
1.81k
  case WASM_INS_CALL_INDIRECT:
1025
1.81k
    if (code_len == 1 ||
1026
1.79k
        !read_varuint32(&code[1], code_len - 1, &param_size, MI)) {
1027
32
      return false;
1028
32
    }
1029
1030
1.78k
    if (MI->flat_insn->detail) {
1031
1.78k
      MI->flat_insn->detail->wasm.op_count = 1;
1032
1.78k
      MI->flat_insn->detail
1033
1.78k
        ->groups[MI->flat_insn->detail->groups_count] =
1034
1.78k
        WASM_GRP_CONTROL;
1035
1.78k
      MI->flat_insn->detail->groups_count++;
1036
1.78k
    }
1037
1038
1.78k
    *size = param_size + 1;
1039
1040
1.78k
    break;
1041
1042
990
  case WASM_INS_BR_TABLE:
1043
990
    if (code_len == 1 ||
1044
987
        !read_brtable(&code[1], code_len - 1, &param_size, MI)) {
1045
108
      return false;
1046
108
    }
1047
1048
882
    if (MI->flat_insn->detail) {
1049
882
      MI->flat_insn->detail->wasm.op_count = 1;
1050
882
      MI->flat_insn->detail
1051
882
        ->groups[MI->flat_insn->detail->groups_count] =
1052
882
        WASM_GRP_CONTROL;
1053
882
      MI->flat_insn->detail->groups_count++;
1054
882
    }
1055
1056
882
    *size = param_size + 1;
1057
1058
882
    break;
1059
64.0k
  }
1060
1061
63.7k
  return true;
1062
64.0k
}