Coverage Report

Created: 2025-11-16 06:38

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/capstonev5/arch/BPF/BPFDisassembler.c
Line
Count
Source
1
/* Capstone Disassembly Engine */
2
/* BPF Backend by david942j <david942j@gmail.com>, 2019 */
3
4
#ifdef CAPSTONE_HAS_BPF
5
6
#include <string.h>
7
#include <stddef.h> // offsetof macro
8
9
#include "BPFConstants.h"
10
#include "BPFDisassembler.h"
11
#include "BPFMapping.h"
12
#include "../../cs_priv.h"
13
14
static uint16_t read_u16(cs_struct *ud, const uint8_t *code)
15
42.5k
{
16
42.5k
  if (MODE_IS_BIG_ENDIAN(ud->mode))
17
23.5k
    return (((uint16_t)code[0] << 8) | code[1]);
18
18.9k
  else
19
18.9k
    return (((uint16_t)code[1] << 8) | code[0]);
20
42.5k
}
21
22
static uint32_t read_u32(cs_struct *ud, const uint8_t *code)
23
14.4k
{
24
14.4k
  if (MODE_IS_BIG_ENDIAN(ud->mode))
25
7.99k
    return ((uint32_t)read_u16(ud, code) << 16) | read_u16(ud, code + 2);
26
6.44k
  else
27
6.44k
    return ((uint32_t)read_u16(ud, code + 2) << 16) | read_u16(ud, code);
28
14.4k
}
29
30
///< Malloc bpf_internal, also checks if code_len is large enough.
31
static bpf_internal *alloc_bpf_internal(size_t code_len)
32
36.0k
{
33
36.0k
  bpf_internal *bpf;
34
35
36.0k
  if (code_len < 8)
36
515
    return NULL;
37
35.5k
  bpf = cs_mem_malloc(sizeof(bpf_internal));
38
35.5k
  if (bpf == NULL)
39
0
    return NULL;
40
  /* default value */
41
35.5k
  bpf->insn_size = 8;
42
35.5k
  return bpf;
43
35.5k
}
44
45
///< Fetch a cBPF structure from code
46
static bpf_internal* fetch_cbpf(cs_struct *ud, const uint8_t *code,
47
    size_t code_len)
48
12.6k
{
49
12.6k
  bpf_internal *bpf;
50
51
12.6k
  bpf = alloc_bpf_internal(code_len);
52
12.6k
  if (bpf == NULL)
53
152
    return NULL;
54
55
12.5k
  bpf->op = read_u16(ud, code);
56
12.5k
  bpf->jt = code[2];
57
12.5k
  bpf->jf = code[3];
58
12.5k
  bpf->k = read_u32(ud, code + 4);
59
12.5k
  return bpf;
60
12.6k
}
61
62
///< Fetch an eBPF structure from code
63
static bpf_internal* fetch_ebpf(cs_struct *ud, const uint8_t *code,
64
    size_t code_len)
65
23.4k
{
66
23.4k
  bpf_internal *bpf;
67
68
23.4k
  bpf = alloc_bpf_internal(code_len);
69
23.4k
  if (bpf == NULL)
70
363
    return NULL;
71
72
23.0k
  bpf->op = (uint16_t)code[0];
73
23.0k
  bpf->dst = code[1] & 0xf;
74
23.0k
  bpf->src = (code[1] & 0xf0) >> 4;
75
76
  // eBPF has one 16-byte instruction: BPF_LD | BPF_DW | BPF_IMM,
77
  // in this case imm is combined with the next block's imm.
78
23.0k
  if (bpf->op == (BPF_CLASS_LD | BPF_SIZE_DW | BPF_MODE_IMM)) {
79
630
    if (code_len < 16) {
80
4
      cs_mem_free(bpf);
81
4
      return NULL;
82
4
    }
83
626
    bpf->k = read_u32(ud, code + 4) | (((uint64_t)read_u32(ud, code + 12)) << 32);
84
626
    bpf->insn_size = 16;
85
626
  }
86
22.4k
  else {
87
22.4k
    bpf->offset = read_u16(ud, code + 2);
88
22.4k
    bpf->k = read_u32(ud, code + 4);
89
22.4k
  }
90
23.0k
  return bpf;
91
23.0k
}
92
93
9.62k
#define CHECK_READABLE_REG(ud, reg) do { \
94
9.62k
    if (! ((reg) >= BPF_REG_R0 && (reg) <= BPF_REG_R10)) \
95
9.62k
      return false; \
96
9.62k
  } while (0)
97
98
4.91k
#define CHECK_WRITABLE_REG(ud, reg) do { \
99
4.91k
    if (! ((reg) >= BPF_REG_R0 && (reg) < BPF_REG_R10)) \
100
4.91k
      return false; \
101
4.91k
  } while (0)
102
103
9.62k
#define CHECK_READABLE_AND_PUSH(ud, MI, r) do { \
104
9.62k
    CHECK_READABLE_REG(ud, r + BPF_REG_R0); \
105
9.62k
    MCOperand_CreateReg0(MI, r + BPF_REG_R0); \
106
9.56k
  } while (0)
107
108
4.91k
#define CHECK_WRITABLE_AND_PUSH(ud, MI, r) do { \
109
4.91k
    CHECK_WRITABLE_REG(ud, r + BPF_REG_R0); \
110
4.91k
    MCOperand_CreateReg0(MI, r + BPF_REG_R0); \
111
4.91k
  } while (0)
112
113
static bool decodeLoad(cs_struct *ud, MCInst *MI, bpf_internal *bpf)
114
10.2k
{
115
10.2k
  if (!EBPF_MODE(ud)) {
116
    /*
117
     *  +-----+-----------+--------------------+
118
     *  | ldb |    [k]    |       [x+k]        |
119
     *  | ldh |    [k]    |       [x+k]        |
120
     *  +-----+-----------+--------------------+
121
     */
122
4.88k
    if (BPF_SIZE(bpf->op) == BPF_SIZE_DW)
123
4
      return false;
124
4.87k
    if (BPF_SIZE(bpf->op) == BPF_SIZE_B || BPF_SIZE(bpf->op) == BPF_SIZE_H) {
125
      /* no ldx */
126
1.03k
      if (BPF_CLASS(bpf->op) != BPF_CLASS_LD)
127
3
        return false;
128
      /* can only be BPF_ABS and BPF_IND */
129
1.03k
      if (BPF_MODE(bpf->op) == BPF_MODE_ABS) {
130
530
        MCOperand_CreateImm0(MI, bpf->k);
131
530
        return true;
132
530
      }
133
500
      else if (BPF_MODE(bpf->op) == BPF_MODE_IND) {
134
496
        MCOperand_CreateReg0(MI, BPF_REG_X);
135
496
        MCOperand_CreateImm0(MI, bpf->k);
136
496
        return true;
137
496
      }
138
4
      return false;
139
1.03k
    }
140
    /*
141
     *  +-----+----+------+------+-----+-------+
142
     *  | ld  | #k | #len | M[k] | [k] | [x+k] |
143
     *  +-----+----+------+------+-----+-------+
144
     *  | ldx | #k | #len | M[k] | 4*([k]&0xf) |
145
     *  +-----+----+------+------+-------------+
146
     */
147
3.84k
    switch (BPF_MODE(bpf->op)) {
148
1.40k
    default:
149
1.40k
      break;
150
1.41k
    case BPF_MODE_IMM:
151
1.41k
      MCOperand_CreateImm0(MI, bpf->k);
152
1.41k
      return true;
153
485
    case BPF_MODE_LEN:
154
485
      return true;
155
537
    case BPF_MODE_MEM:
156
537
      MCOperand_CreateImm0(MI, bpf->k);
157
537
      return true;
158
3.84k
    }
159
1.40k
    if (BPF_CLASS(bpf->op) == BPF_CLASS_LD) {
160
997
      if (BPF_MODE(bpf->op) == BPF_MODE_ABS) {
161
579
        MCOperand_CreateImm0(MI, bpf->k);
162
579
        return true;
163
579
      }
164
418
      else if (BPF_MODE(bpf->op) == BPF_MODE_IND) {
165
415
        MCOperand_CreateReg0(MI, BPF_REG_X);
166
415
        MCOperand_CreateImm0(MI, bpf->k);
167
415
        return true;
168
415
      }
169
997
    }
170
410
    else { /* LDX */
171
410
      if (BPF_MODE(bpf->op) == BPF_MODE_MSH) {
172
408
        MCOperand_CreateImm0(MI, bpf->k);
173
408
        return true;
174
408
      }
175
410
    }
176
5
    return false;
177
1.40k
  }
178
179
  /* eBPF mode */
180
  /*
181
   * - IMM: lddw dst, imm64
182
   * - ABS: ld{w,h,b,dw} [k]
183
   * - IND: ld{w,h,b,dw} [src+k]
184
   * - MEM: ldx{w,h,b,dw} dst, [src+off]
185
   */
186
5.37k
  if (BPF_CLASS(bpf->op) == BPF_CLASS_LD) {
187
4.07k
    switch (BPF_MODE(bpf->op)) {
188
643
    case BPF_MODE_IMM:
189
643
      if (bpf->op != (BPF_CLASS_LD | BPF_SIZE_DW | BPF_MODE_IMM))
190
17
        return false;
191
626
      CHECK_WRITABLE_AND_PUSH(ud, MI, bpf->dst);
192
624
      MCOperand_CreateImm0(MI, bpf->k);
193
624
      return true;
194
2.21k
    case BPF_MODE_ABS:
195
2.21k
      MCOperand_CreateImm0(MI, bpf->k);
196
2.21k
      return true;
197
1.20k
    case BPF_MODE_IND:
198
1.20k
      CHECK_READABLE_AND_PUSH(ud, MI, bpf->src);
199
1.20k
      MCOperand_CreateImm0(MI, bpf->k);
200
1.20k
      return true;
201
4.07k
    }
202
8
    return false;
203
204
4.07k
  }
205
  /* LDX */
206
1.29k
  if (BPF_MODE(bpf->op) == BPF_MODE_MEM) {
207
1.28k
    CHECK_WRITABLE_AND_PUSH(ud, MI, bpf->dst);
208
1.28k
    CHECK_READABLE_AND_PUSH(ud, MI, bpf->src);
209
1.28k
    MCOperand_CreateImm0(MI, bpf->offset);
210
1.28k
    return true;
211
1.28k
  }
212
10
  return false;
213
1.29k
}
214
215
static bool decodeStore(cs_struct *ud, MCInst *MI, bpf_internal *bpf)
216
4.11k
{
217
  /* in cBPF, only BPF_ST* | BPF_MEM | BPF_W is valid
218
   * while in eBPF:
219
   * - BPF_STX | BPF_XADD | BPF_{W,DW}
220
   * - BPF_ST* | BPF_MEM | BPF_{W,H,B,DW}
221
   * are valid
222
   */
223
4.11k
  if (!EBPF_MODE(ud)) {
224
    /* can only store to M[] */
225
680
    if (bpf->op != (BPF_CLASS(bpf->op) | BPF_MODE_MEM | BPF_SIZE_W))
226
7
      return false;
227
673
    MCOperand_CreateImm0(MI, bpf->k);
228
673
    return true;
229
680
  }
230
231
  /* eBPF */
232
233
3.43k
  if (BPF_MODE(bpf->op) == BPF_MODE_XADD) {
234
749
    if (BPF_CLASS(bpf->op) != BPF_CLASS_STX)
235
2
      return false;
236
747
    if (BPF_SIZE(bpf->op) != BPF_SIZE_W && BPF_SIZE(bpf->op) != BPF_SIZE_DW)
237
2
      return false;
238
    /* xadd [dst + off], src */
239
745
    CHECK_READABLE_AND_PUSH(ud, MI, bpf->dst);
240
741
    MCOperand_CreateImm0(MI, bpf->offset);
241
741
    CHECK_READABLE_AND_PUSH(ud, MI, bpf->src);
242
739
    return true;
243
741
  }
244
245
2.68k
  if (BPF_MODE(bpf->op) != BPF_MODE_MEM)
246
10
    return false;
247
248
  /* st [dst + off], src */
249
2.67k
  CHECK_READABLE_AND_PUSH(ud, MI, bpf->dst);
250
2.67k
  MCOperand_CreateImm0(MI, bpf->offset);
251
2.67k
  if (BPF_CLASS(bpf->op) == BPF_CLASS_ST)
252
1.41k
    MCOperand_CreateImm0(MI, bpf->k);
253
1.25k
  else
254
1.25k
    CHECK_READABLE_AND_PUSH(ud, MI, bpf->src);
255
2.67k
  return true;
256
2.67k
}
257
258
static bool decodeALU(cs_struct *ud, MCInst *MI, bpf_internal *bpf)
259
4.46k
{
260
  /* Set MI->Operands */
261
262
  /* cBPF */
263
4.46k
  if (!EBPF_MODE(ud)) {
264
1.42k
    if (BPF_OP(bpf->op) > BPF_ALU_XOR)
265
1
      return false;
266
    /* cBPF's NEG has no operands */
267
1.42k
    if (BPF_OP(bpf->op) == BPF_ALU_NEG)
268
259
      return true;
269
1.16k
    if (BPF_SRC(bpf->op) == BPF_SRC_K)
270
445
      MCOperand_CreateImm0(MI, bpf->k);
271
723
    else /* BPF_SRC_X */
272
723
      MCOperand_CreateReg0(MI, BPF_REG_X);
273
1.16k
    return true;
274
1.42k
  }
275
276
  /* eBPF */
277
278
3.04k
  if (BPF_OP(bpf->op) > BPF_ALU_END)
279
2
    return false;
280
  /* ALU64 class doesn't have ENDian */
281
  /* ENDian's imm must be one of 16, 32, 64 */
282
3.03k
  if (BPF_OP(bpf->op) == BPF_ALU_END) {
283
758
    if (BPF_CLASS(bpf->op) == BPF_CLASS_ALU64)
284
1
      return false;
285
757
    if (bpf->k != 16 && bpf->k != 32 && bpf->k != 64)
286
33
      return false;
287
757
  }
288
289
  /* - op dst, imm
290
   * - op dst, src
291
   * - neg dst
292
   * - le<imm> dst
293
   */
294
  /* every ALU instructions have dst op */
295
3.00k
  CHECK_WRITABLE_AND_PUSH(ud, MI, bpf->dst);
296
297
  /* special cases */
298
3.00k
  if (BPF_OP(bpf->op) == BPF_ALU_NEG)
299
264
    return true;
300
2.73k
  if (BPF_OP(bpf->op) == BPF_ALU_END) {
301
    /* bpf->k must be one of 16, 32, 64 */
302
724
    MCInst_setOpcode(MI, MCInst_getOpcode(MI) | ((uint32_t)bpf->k << 4));
303
724
    return true;
304
724
  }
305
306
  /* normal cases */
307
2.01k
  if (BPF_SRC(bpf->op) == BPF_SRC_K) {
308
1.78k
    MCOperand_CreateImm0(MI, bpf->k);
309
1.78k
  }
310
230
  else { /* BPF_SRC_X */
311
230
    CHECK_READABLE_AND_PUSH(ud, MI, bpf->src);
312
230
  }
313
2.01k
  return true;
314
2.01k
}
315
316
static bool decodeJump(cs_struct *ud, MCInst *MI, bpf_internal *bpf)
317
2.92k
{
318
  /* cBPF and eBPF are very different in class jump */
319
2.92k
  if (!EBPF_MODE(ud)) {
320
995
    if (BPF_OP(bpf->op) > BPF_JUMP_JSET)
321
1
      return false;
322
323
    /* ja is a special case of jumps */
324
994
    if (BPF_OP(bpf->op) == BPF_JUMP_JA) {
325
268
      MCOperand_CreateImm0(MI, bpf->k);
326
268
      return true;
327
268
    }
328
329
726
    if (BPF_SRC(bpf->op) == BPF_SRC_K)
330
299
      MCOperand_CreateImm0(MI, bpf->k);
331
427
    else /* BPF_SRC_X */
332
427
      MCOperand_CreateReg0(MI, BPF_REG_X);
333
726
    MCOperand_CreateImm0(MI, bpf->jt);
334
726
    MCOperand_CreateImm0(MI, bpf->jf);
335
726
  }
336
1.92k
  else {
337
1.92k
    if (BPF_OP(bpf->op) > BPF_JUMP_JSLE)
338
1
      return false;
339
340
    /* No operands for exit */
341
1.92k
    if (BPF_OP(bpf->op) == BPF_JUMP_EXIT)
342
259
      return bpf->op == (BPF_CLASS_JMP | BPF_JUMP_EXIT);
343
1.66k
    if (BPF_OP(bpf->op) == BPF_JUMP_CALL) {
344
361
      if (bpf->op == (BPF_CLASS_JMP | BPF_JUMP_CALL)) {
345
263
        MCOperand_CreateImm0(MI, bpf->k);
346
263
        return true;
347
263
      }
348
98
      if (bpf->op == (BPF_CLASS_JMP | BPF_JUMP_CALL | BPF_SRC_X)) {
349
98
        CHECK_READABLE_AND_PUSH(ud, MI, bpf->k);
350
67
        return true;
351
98
      }
352
0
      return false;
353
98
    }
354
355
    /* ja is a special case of jumps */
356
1.30k
    if (BPF_OP(bpf->op) == BPF_JUMP_JA) {
357
198
      if (BPF_SRC(bpf->op) != BPF_SRC_K)
358
1
        return false;
359
197
      MCOperand_CreateImm0(MI, bpf->offset);
360
197
      return true;
361
198
    }
362
363
    /* <j>  dst, src, +off */
364
1.11k
    CHECK_READABLE_AND_PUSH(ud, MI, bpf->dst);
365
1.10k
    if (BPF_SRC(bpf->op) == BPF_SRC_K)
366
836
      MCOperand_CreateImm0(MI, bpf->k);
367
273
    else
368
273
      CHECK_READABLE_AND_PUSH(ud, MI, bpf->src);
369
1.10k
    MCOperand_CreateImm0(MI, bpf->offset);
370
1.10k
  }
371
1.83k
  return true;
372
2.92k
}
373
374
static bool decodeReturn(cs_struct *ud, MCInst *MI, bpf_internal *bpf)
375
1.23k
{
376
  /* Here only handles the BPF_RET class in cBPF */
377
1.23k
  switch (BPF_RVAL(bpf->op)) {
378
407
  case BPF_SRC_K:
379
407
    MCOperand_CreateImm0(MI, bpf->k);
380
407
    return true;
381
421
  case BPF_SRC_X:
382
421
    MCOperand_CreateReg0(MI, BPF_REG_X);
383
421
    return true;
384
404
  case BPF_SRC_A:
385
404
    MCOperand_CreateReg0(MI, BPF_REG_A);
386
404
    return true;
387
1.23k
  }
388
2
  return false;
389
1.23k
}
390
391
static bool decodeMISC(cs_struct *ud, MCInst *MI, bpf_internal *bpf)
392
435
{
393
435
  uint16_t op = bpf->op ^ BPF_CLASS_MISC;
394
435
  return op == BPF_MISCOP_TAX || op == BPF_MISCOP_TXA;
395
435
}
396
397
///< 1. Check if the instruction is valid
398
///< 2. Set MI->opcode
399
///< 3. Set MI->Operands
400
static bool getInstruction(cs_struct *ud, MCInst *MI, bpf_internal *bpf)
401
14.0k
{
402
14.0k
  cs_detail *detail;
403
404
14.0k
  detail = MI->flat_insn->detail;
405
  // initialize detail
406
14.0k
  if (detail) {
407
14.0k
    memset(detail, 0, offsetof(cs_detail, bpf) + sizeof(cs_bpf));
408
14.0k
  }
409
410
14.0k
  MCInst_clear(MI);
411
14.0k
  MCInst_setOpcode(MI, bpf->op);
412
413
14.0k
  switch (BPF_CLASS(bpf->op)) {
414
0
  default: /* should never happen */
415
0
    return false;
416
3.07k
  case BPF_CLASS_LD:
417
4.01k
  case BPF_CLASS_LDX:
418
4.01k
    return decodeLoad(ud, MI, bpf);
419
872
  case BPF_CLASS_ST:
420
1.73k
  case BPF_CLASS_STX:
421
1.73k
    return decodeStore(ud, MI, bpf);
422
2.87k
  case BPF_CLASS_ALU:
423
2.87k
    return decodeALU(ud, MI, bpf);
424
2.92k
  case BPF_CLASS_JMP:
425
2.92k
    return decodeJump(ud, MI, bpf);
426
602
  case BPF_CLASS_RET:
427
    /* eBPF doesn't have this class */
428
602
    if (EBPF_MODE(ud))
429
1
      return false;
430
601
    return decodeReturn(ud, MI, bpf);
431
1.89k
  case BPF_CLASS_MISC:
432
  /* case BPF_CLASS_ALU64: */
433
1.89k
    if (EBPF_MODE(ud))
434
1.59k
      return decodeALU(ud, MI, bpf);
435
302
    else
436
302
      return decodeMISC(ud, MI, bpf);
437
14.0k
  }
438
14.0k
}
439
440
bool BPF_getInstruction(csh ud, const uint8_t *code, size_t code_len,
441
    MCInst *instr, uint16_t *size, uint64_t address, void *info)
442
14.1k
{
443
14.1k
  cs_struct *cs;
444
14.1k
  bpf_internal *bpf;
445
446
14.1k
  cs = (cs_struct*)ud;
447
14.1k
  if (EBPF_MODE(cs))
448
8.26k
    bpf = fetch_ebpf(cs, code, code_len);
449
5.88k
  else
450
5.88k
    bpf = fetch_cbpf(cs, code, code_len);
451
14.1k
  if (bpf == NULL)
452
94
    return false;
453
14.0k
  if (!getInstruction(cs, instr, bpf)) {
454
115
    cs_mem_free(bpf);
455
115
    return false;
456
115
  }
457
458
13.9k
  *size = bpf->insn_size;
459
13.9k
  cs_mem_free(bpf);
460
461
  return true;
462
14.0k
}
463
464
#endif