Coverage Report

Created: 2026-02-26 06:51

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/ada-url/fuzz/parse.cc
Line
Count
Source
1
#include <fuzzer/FuzzedDataProvider.h>
2
3
#include <cstdio>
4
#include <memory>
5
#include <string>
6
7
#include "ada.cpp"
8
#include "ada.h"
9
10
9.00k
bool is_valid_utf8_string(const char *buf, size_t len) {
11
9.00k
  const uint8_t *data = reinterpret_cast<const uint8_t *>(buf);
12
9.00k
  uint64_t pos = 0;
13
9.00k
  uint32_t code_point = 0;
14
35.9k
  while (pos < len) {
15
34.4k
    uint64_t next_pos = pos + 16;
16
34.4k
    if (next_pos <= len) {  // if it is safe to read 16 more bytes, check that
17
                            // they are ascii
18
23.3k
      uint64_t v1;
19
23.3k
      std::memcpy(&v1, data + pos, sizeof(uint64_t));
20
23.3k
      uint64_t v2;
21
23.3k
      std::memcpy(&v2, data + pos + sizeof(uint64_t), sizeof(uint64_t));
22
23.3k
      uint64_t v{v1 | v2};
23
23.3k
      if ((v & 0x8080808080808080) == 0) {
24
5.73k
        pos = next_pos;
25
5.73k
        continue;
26
5.73k
      }
27
23.3k
    }
28
28.6k
    unsigned char byte = data[pos];
29
81.1k
    while (byte < 0b10000000) {
30
57.7k
      if (++pos == len) {
31
5.20k
        return true;
32
5.20k
      }
33
52.5k
      byte = data[pos];
34
52.5k
    }
35
36
23.4k
    if ((byte & 0b11100000) == 0b11000000) {
37
3.14k
      next_pos = pos + 2;
38
3.14k
      if (next_pos > len) {
39
118
        return false;
40
118
      }
41
3.02k
      if ((data[pos + 1] & 0b11000000) != 0b10000000) {
42
256
        return false;
43
256
      }
44
2.76k
      code_point = (byte & 0b00011111) << 6 | (data[pos + 1] & 0b00111111);
45
2.76k
      if ((code_point < 0x80) || (0x7ff < code_point)) {
46
8
        return false;
47
8
      }
48
20.3k
    } else if ((byte & 0b11110000) == 0b11100000) {
49
18.2k
      next_pos = pos + 3;
50
18.2k
      if (next_pos > len) {
51
46
        return false;
52
46
      }
53
18.2k
      if ((data[pos + 1] & 0b11000000) != 0b10000000) {
54
112
        return false;
55
112
      }
56
18.1k
      if ((data[pos + 2] & 0b11000000) != 0b10000000) {
57
24
        return false;
58
24
      }
59
18.0k
      code_point = (byte & 0b00001111) << 12 |
60
18.0k
                   (data[pos + 1] & 0b00111111) << 6 |
61
18.0k
                   (data[pos + 2] & 0b00111111);
62
18.0k
      if ((code_point < 0x800) || (0xffff < code_point) ||
63
18.0k
          (0xd7ff < code_point && code_point < 0xe000)) {
64
10
        return false;
65
10
      }
66
18.0k
    } else if ((byte & 0b11111000) == 0b11110000) {  // 0b11110000
67
466
      next_pos = pos + 4;
68
466
      if (next_pos > len) {
69
22
        return false;
70
22
      }
71
444
      if ((data[pos + 1] & 0b11000000) != 0b10000000) {
72
74
        return false;
73
74
      }
74
370
      if ((data[pos + 2] & 0b11000000) != 0b10000000) {
75
17
        return false;
76
17
      }
77
353
      if ((data[pos + 3] & 0b11000000) != 0b10000000) {
78
12
        return false;
79
12
      }
80
341
      code_point =
81
341
          (byte & 0b00000111) << 18 | (data[pos + 1] & 0b00111111) << 12 |
82
341
          (data[pos + 2] & 0b00111111) << 6 | (data[pos + 3] & 0b00111111);
83
341
      if (code_point <= 0xffff || 0x10ffff < code_point) {
84
13
        return false;
85
13
      }
86
1.60k
    } else {
87
1.60k
      return false;
88
1.60k
    }
89
21.1k
    pos = next_pos;
90
21.1k
  }
91
1.47k
  return true;
92
9.00k
}
93
94
9.00k
extern "C" int LLVMFuzzerTestOneInput(const uint8_t *data, size_t size) {
95
9.00k
  FuzzedDataProvider fdp(data, size);
96
9.00k
  std::string source = fdp.ConsumeRandomLengthString(256);
97
98
  // volatile forces the compiler to store the results without undue
99
  // optimizations
100
9.00k
  volatile size_t length = 0;
101
102
9.00k
  auto parse_url = ada::parse<ada::url>(source);
103
9.00k
  auto parse_url_aggregator = ada::parse<ada::url_aggregator>(source);
104
105
9.00k
  if (is_valid_utf8_string(source.data(), source.length())) {
106
6.68k
    if (parse_url.has_value() ^ parse_url_aggregator.has_value()) {
107
0
      printf("Source used to parse: %s", source.c_str());
108
0
      abort();
109
0
    }
110
6.68k
  }
111
112
9.00k
  if (parse_url) {
113
3.19k
    length += parse_url->get_href().size();
114
3.19k
    length += parse_url->get_origin().size();
115
3.19k
  }
116
117
9.00k
  if (parse_url_aggregator) {
118
3.05k
    length += parse_url_aggregator->get_href().size();
119
3.05k
    length += parse_url_aggregator->get_origin().size();
120
121
3.05k
    volatile bool is_parse_url_aggregator_output_valid = false;
122
3.05k
    is_parse_url_aggregator_output_valid = parse_url_aggregator->validate();
123
124
3.05k
    assert(parse_url->get_protocol() == parse_url_aggregator->get_protocol());
125
3.05k
    assert(parse_url->get_href() == parse_url_aggregator->get_href());
126
127
3.05k
    parse_url->set_href(source);
128
3.05k
    parse_url_aggregator->set_href(source);
129
3.05k
    assert(parse_url->get_href() == parse_url_aggregator->get_href());
130
3.05k
  }
131
132
  /**
133
   * ada::parse<ada::url>
134
   */
135
9.00k
  auto out_url = ada::parse<ada::url>("https://www.ada-url.com");
136
137
9.00k
  if (out_url) {
138
9.00k
    out_url->set_protocol(source);
139
9.00k
    out_url->set_username(source);
140
9.00k
    out_url->set_password(source);
141
9.00k
    out_url->set_hostname(source);
142
9.00k
    out_url->set_host(source);
143
9.00k
    out_url->set_pathname(source);
144
9.00k
    out_url->set_search(source);
145
9.00k
    out_url->set_hash(source);
146
9.00k
    out_url->set_port(source);
147
148
    // getters
149
9.00k
    length += out_url->get_protocol().size();
150
9.00k
    length += out_url->get_username().size();
151
9.00k
    length += out_url->get_password().size();
152
9.00k
    length += out_url->get_hostname().size();
153
9.00k
    length += out_url->get_host().size();
154
9.00k
    length += out_url->get_pathname().size();
155
9.00k
    length += out_url->get_search().size();
156
9.00k
    length += out_url->get_hash().size();
157
9.00k
    length += out_url->get_origin().size();
158
9.00k
    length += out_url->get_port().size();
159
160
9.00k
    length += out_url->to_string().size();
161
9.00k
  }
162
163
  /**
164
   * ada::parse<ada::url_aggregator>
165
   */
166
9.00k
  auto out_aggregator =
167
9.00k
      ada::parse<ada::url_aggregator>("https://www.ada-url.com");
168
169
9.00k
  if (out_aggregator) {
170
9.00k
    out_aggregator->set_protocol(source);
171
9.00k
    out_aggregator->set_username(source);
172
9.00k
    out_aggregator->set_password(source);
173
9.00k
    out_aggregator->set_hostname(source);
174
9.00k
    out_aggregator->set_host(source);
175
9.00k
    out_aggregator->set_pathname(source);
176
9.00k
    out_aggregator->set_search(source);
177
9.00k
    out_aggregator->set_hash(source);
178
9.00k
    out_aggregator->set_port(source);
179
180
    // getters
181
9.00k
    length += out_aggregator->get_protocol().size();
182
9.00k
    length += out_aggregator->get_username().size();
183
9.00k
    length += out_aggregator->get_password().size();
184
9.00k
    length += out_aggregator->get_hostname().size();
185
9.00k
    length += out_aggregator->get_host().size();
186
9.00k
    length += out_aggregator->get_pathname().size();
187
9.00k
    length += out_aggregator->get_search().size();
188
9.00k
    length += out_aggregator->get_hash().size();
189
9.00k
    length += out_aggregator->get_origin().size();
190
9.00k
    length += out_aggregator->get_port().size();
191
192
9.00k
    length += out_aggregator->to_string().size();
193
194
9.00k
    volatile bool is_output_valid = false;
195
9.00k
    is_output_valid = out_aggregator->validate();
196
197
    // Printing due to dead-code elimination
198
9.00k
    printf("diagram %s\n", out_aggregator->to_diagram().c_str());
199
200
    // clear methods
201
9.00k
    out_aggregator->clear_port();
202
9.00k
    out_aggregator->clear_search();
203
9.00k
    out_aggregator->clear_hash();
204
9.00k
  }
205
206
  /**
207
   * Node.js specific
208
   */
209
9.00k
  length += ada::href_from_file(source).size();
210
211
  /**
212
   * Others
213
   */
214
9.00k
  bool is_valid = ada::checkers::verify_dns_length(source);
215
216
  // Only used for avoiding dead-code elimination
217
9.00k
  if (is_valid) {
218
6.95k
    printf("dns length is valid\n");
219
6.95k
  }
220
221
  // Only used for avoiding dead-code elimination
222
9.00k
  printf("length of url is %zu\n", length);
223
224
9.00k
  return 0;
225
9.00k
}  // extern "C" int LLVMFuzzerTestOneInput(const uint8_t *data, size_t size) {