/src/openssl33/ssl/priority_queue.c
Line | Count | Source (jump to first uncovered line) |
1 | | /* |
2 | | * Copyright 2022-2023 The OpenSSL Project Authors. All Rights Reserved. |
3 | | * |
4 | | * Licensed under the Apache License 2.0 (the "License"). You may not use |
5 | | * this file except in compliance with the License. You can obtain a copy |
6 | | * in the file LICENSE in the source distribution or at |
7 | | * https://www.openssl.org/source/license.html |
8 | | */ |
9 | | |
10 | | #include <openssl/crypto.h> |
11 | | #include <openssl/err.h> |
12 | | #include <assert.h> |
13 | | #include "internal/priority_queue.h" |
14 | | #include "internal/safe_math.h" |
15 | | #include "internal/numbers.h" |
16 | | |
17 | | OSSL_SAFE_MATH_UNSIGNED(size_t, size_t) |
18 | | |
19 | | /* |
20 | | * Fundamental operations: |
21 | | * Binary Heap Fibonacci Heap |
22 | | * Get smallest O(1) O(1) |
23 | | * Delete any O(log n) O(log n) average but worst O(n) |
24 | | * Insert O(log n) O(1) |
25 | | * |
26 | | * Not supported: |
27 | | * Merge two structures O(log n) O(1) |
28 | | * Decrease key O(log n) O(1) |
29 | | * Increase key O(log n) ? |
30 | | * |
31 | | * The Fibonacci heap is quite a bit more complicated to implement and has |
32 | | * larger overhead in practice. We favour the binary heap here. A multi-way |
33 | | * (ternary or quaternary) heap might elicit a performance advantage via better |
34 | | * cache access patterns. |
35 | | */ |
36 | | |
37 | | struct pq_heap_st { |
38 | | void *data; /* User supplied data pointer */ |
39 | | size_t index; /* Constant index in elements[] */ |
40 | | }; |
41 | | |
42 | | struct pq_elem_st { |
43 | | size_t posn; /* Current index in heap[] or link in free list */ |
44 | | #ifndef NDEBUG |
45 | | int used; /* Debug flag indicating that this is in use */ |
46 | | #endif |
47 | | }; |
48 | | |
49 | | struct ossl_pqueue_st |
50 | | { |
51 | | struct pq_heap_st *heap; |
52 | | struct pq_elem_st *elements; |
53 | | int (*compare)(const void *, const void *); |
54 | | size_t htop; /* Highest used heap element */ |
55 | | size_t hmax; /* Allocated heap & element space */ |
56 | | size_t freelist; /* Index into elements[], start of free element list */ |
57 | | }; |
58 | | |
59 | | /* |
60 | | * The initial and maximum number of elements in the heap. |
61 | | */ |
62 | | static const size_t min_nodes = 8; |
63 | | static const size_t max_nodes = |
64 | | SIZE_MAX / (sizeof(struct pq_heap_st) > sizeof(struct pq_elem_st) |
65 | | ? sizeof(struct pq_heap_st) : sizeof(struct pq_elem_st)); |
66 | | |
67 | | #ifndef NDEBUG |
68 | | /* Some basic sanity checking of the data structure */ |
69 | | # define ASSERT_USED(pq, idx) \ |
70 | 92.2M | assert(pq->elements[pq->heap[idx].index].used); \ |
71 | 89.0M | assert(pq->elements[pq->heap[idx].index].posn == idx) |
72 | | # define ASSERT_ELEM_USED(pq, elem) \ |
73 | 2.41M | assert(pq->elements[elem].used) |
74 | | #else |
75 | | # define ASSERT_USED(pq, idx) |
76 | | # define ASSERT_ELEM_USED(pq, elem) |
77 | | #endif |
78 | | |
79 | | /* |
80 | | * Calculate the array growth based on the target size. |
81 | | * |
82 | | * The growth factor is a rational number and is defined by a numerator |
83 | | * and a denominator. According to Andrew Koenig in his paper "Why Are |
84 | | * Vectors Efficient?" from JOOP 11(5) 1998, this factor should be less |
85 | | * than the golden ratio (1.618...). |
86 | | * |
87 | | * We use an expansion factor of 8 / 5 = 1.6 |
88 | | */ |
89 | | static ossl_inline size_t compute_pqueue_growth(size_t target, size_t current) |
90 | 48.5k | { |
91 | 48.5k | int err = 0; |
92 | | |
93 | 97.1k | while (current < target) { |
94 | 48.5k | if (current >= max_nodes) |
95 | 0 | return 0; |
96 | | |
97 | 48.5k | current = safe_muldiv_size_t(current, 8, 5, &err); |
98 | 48.5k | if (err) |
99 | 0 | return 0; |
100 | 48.5k | if (current >= max_nodes) |
101 | 0 | current = max_nodes; |
102 | 48.5k | } |
103 | 48.5k | return current; |
104 | 48.5k | } |
105 | | |
106 | | static ossl_inline void pqueue_swap_elem(OSSL_PQUEUE *pq, size_t i, size_t j) |
107 | 16.1M | { |
108 | 16.1M | struct pq_heap_st *h = pq->heap, t_h; |
109 | 16.1M | struct pq_elem_st *e = pq->elements; |
110 | | |
111 | 16.1M | ASSERT_USED(pq, i); |
112 | 32.2M | ASSERT_USED(pq, j); |
113 | | |
114 | 16.1M | t_h = h[i]; |
115 | 16.1M | h[i] = h[j]; |
116 | 16.1M | h[j] = t_h; |
117 | | |
118 | 16.1M | e[h[i].index].posn = i; |
119 | 16.1M | e[h[j].index].posn = j; |
120 | 16.1M | } |
121 | | |
122 | | static ossl_inline void pqueue_move_elem(OSSL_PQUEUE *pq, size_t from, size_t to) |
123 | 3.10M | { |
124 | 3.10M | struct pq_heap_st *h = pq->heap; |
125 | 3.10M | struct pq_elem_st *e = pq->elements; |
126 | | |
127 | 3.10M | ASSERT_USED(pq, from); |
128 | | |
129 | 3.10M | h[to] = h[from]; |
130 | 3.10M | e[h[to].index].posn = to; |
131 | 3.10M | } |
132 | | |
133 | | /* |
134 | | * Force the specified element to the front of the heap. This breaks |
135 | | * the heap partial ordering pre-condition. |
136 | | */ |
137 | | static ossl_inline void pqueue_force_bottom(OSSL_PQUEUE *pq, size_t n) |
138 | 0 | { |
139 | 0 | ASSERT_USED(pq, n); |
140 | 0 | while (n > 0) { |
141 | 0 | const size_t p = (n - 1) / 2; |
142 | |
|
143 | 0 | ASSERT_USED(pq, p); |
144 | 0 | pqueue_swap_elem(pq, n, p); |
145 | 0 | n = p; |
146 | 0 | } |
147 | 0 | } |
148 | | |
149 | | /* |
150 | | * Move an element down to its correct position to restore the partial |
151 | | * order pre-condition. |
152 | | */ |
153 | | static ossl_inline void pqueue_move_down(OSSL_PQUEUE *pq, size_t n) |
154 | 3.64M | { |
155 | 3.64M | struct pq_heap_st *h = pq->heap; |
156 | | |
157 | 3.64M | ASSERT_USED(pq, n); |
158 | 5.07M | while (n > 0) { |
159 | 4.49M | const size_t p = (n - 1) / 2; |
160 | | |
161 | 4.49M | ASSERT_USED(pq, p); |
162 | 4.49M | if (pq->compare(h[n].data, h[p].data) >= 0) |
163 | 3.06M | break; |
164 | 1.42M | pqueue_swap_elem(pq, n, p); |
165 | 1.42M | n = p; |
166 | 1.42M | } |
167 | 3.64M | } |
168 | | |
169 | | /* |
170 | | * Move an element up to its correct position to restore the partial |
171 | | * order pre-condition. |
172 | | */ |
173 | | static ossl_inline void pqueue_move_up(OSSL_PQUEUE *pq, size_t n) |
174 | 3.10M | { |
175 | 3.10M | struct pq_heap_st *h = pq->heap; |
176 | 3.10M | size_t p = n * 2 + 1; |
177 | | |
178 | 3.10M | ASSERT_USED(pq, n); |
179 | 3.10M | if (pq->htop > p + 1) { |
180 | 2.97M | ASSERT_USED(pq, p); |
181 | 5.94M | ASSERT_USED(pq, p + 1); |
182 | 2.97M | if (pq->compare(h[p].data, h[p + 1].data) > 0) |
183 | 606k | p++; |
184 | 2.97M | } |
185 | 17.8M | while (pq->htop > p && pq->compare(h[p].data, h[n].data) < 0) { |
186 | 14.7M | ASSERT_USED(pq, p); |
187 | 14.7M | pqueue_swap_elem(pq, n, p); |
188 | 14.7M | n = p; |
189 | 14.7M | p = n * 2 + 1; |
190 | 14.7M | if (pq->htop > p + 1) { |
191 | 13.5M | ASSERT_USED(pq, p + 1); |
192 | 13.5M | if (pq->compare(h[p].data, h[p + 1].data) > 0) |
193 | 6.32M | p++; |
194 | 13.5M | } |
195 | 14.7M | } |
196 | 3.10M | } |
197 | | |
198 | | int ossl_pqueue_push(OSSL_PQUEUE *pq, void *data, size_t *elem) |
199 | 3.64M | { |
200 | 3.64M | size_t n, m; |
201 | | |
202 | 3.64M | if (!ossl_pqueue_reserve(pq, 1)) |
203 | 0 | return 0; |
204 | | |
205 | 3.64M | n = pq->htop++; |
206 | 3.64M | m = pq->freelist; |
207 | 3.64M | pq->freelist = pq->elements[m].posn; |
208 | | |
209 | 3.64M | pq->heap[n].data = data; |
210 | 3.64M | pq->heap[n].index = m; |
211 | | |
212 | 3.64M | pq->elements[m].posn = n; |
213 | 3.64M | #ifndef NDEBUG |
214 | 3.64M | pq->elements[m].used = 1; |
215 | 3.64M | #endif |
216 | 3.64M | pqueue_move_down(pq, n); |
217 | 3.64M | if (elem != NULL) |
218 | 3.64M | *elem = m; |
219 | 3.64M | return 1; |
220 | 3.64M | } |
221 | | |
222 | | void *ossl_pqueue_peek(const OSSL_PQUEUE *pq) |
223 | 10.6M | { |
224 | 10.6M | if (pq->htop > 0) { |
225 | 2.62M | ASSERT_USED(pq, 0); |
226 | 2.62M | return pq->heap->data; |
227 | 2.62M | } |
228 | 8.04M | return NULL; |
229 | 10.6M | } |
230 | | |
231 | | void *ossl_pqueue_pop(OSSL_PQUEUE *pq) |
232 | 6.35M | { |
233 | 6.35M | void *res; |
234 | 6.35M | size_t elem; |
235 | | |
236 | 6.35M | if (pq == NULL || pq->htop == 0) |
237 | 3.20M | return NULL; |
238 | | |
239 | 6.35M | ASSERT_USED(pq, 0); |
240 | 3.15M | res = pq->heap->data; |
241 | 3.15M | elem = pq->heap->index; |
242 | | |
243 | 3.15M | if (--pq->htop != 0) { |
244 | 3.10M | pqueue_move_elem(pq, pq->htop, 0); |
245 | 3.10M | pqueue_move_up(pq, 0); |
246 | 3.10M | } |
247 | | |
248 | 3.15M | pq->elements[elem].posn = pq->freelist; |
249 | 3.15M | pq->freelist = elem; |
250 | 3.15M | #ifndef NDEBUG |
251 | 3.15M | pq->elements[elem].used = 0; |
252 | 3.15M | #endif |
253 | 3.15M | return res; |
254 | 6.30M | } |
255 | | |
256 | | void *ossl_pqueue_remove(OSSL_PQUEUE *pq, size_t elem) |
257 | 2.41M | { |
258 | 2.41M | size_t n; |
259 | | |
260 | 2.41M | if (pq == NULL || elem >= pq->hmax || pq->htop == 0) |
261 | 0 | return 0; |
262 | | |
263 | 2.41M | ASSERT_ELEM_USED(pq, elem); |
264 | 2.41M | n = pq->elements[elem].posn; |
265 | | |
266 | 2.41M | ASSERT_USED(pq, n); |
267 | | |
268 | 2.41M | if (n == pq->htop - 1) { |
269 | 494k | pq->elements[elem].posn = pq->freelist; |
270 | 494k | pq->freelist = elem; |
271 | 494k | #ifndef NDEBUG |
272 | 494k | pq->elements[elem].used = 0; |
273 | 494k | #endif |
274 | 494k | return pq->heap[--pq->htop].data; |
275 | 494k | } |
276 | 1.91M | if (n > 0) |
277 | 0 | pqueue_force_bottom(pq, n); |
278 | 1.91M | return ossl_pqueue_pop(pq); |
279 | 2.41M | } |
280 | | |
281 | | static void pqueue_add_freelist(OSSL_PQUEUE *pq, size_t from) |
282 | 3.24M | { |
283 | 3.24M | struct pq_elem_st *e = pq->elements; |
284 | 3.24M | size_t i; |
285 | | |
286 | 3.24M | #ifndef NDEBUG |
287 | 32.1M | for (i = from; i < pq->hmax; i++) |
288 | 28.9M | e[i].used = 0; |
289 | 3.24M | #endif |
290 | 3.24M | e[from].posn = pq->freelist; |
291 | 28.9M | for (i = from + 1; i < pq->hmax; i++) |
292 | 25.6M | e[i].posn = i - 1; |
293 | 3.24M | pq->freelist = pq->hmax - 1; |
294 | 3.24M | } |
295 | | |
296 | | int ossl_pqueue_reserve(OSSL_PQUEUE *pq, size_t n) |
297 | 3.64M | { |
298 | 3.64M | size_t new_max, cur_max; |
299 | 3.64M | struct pq_heap_st *h; |
300 | 3.64M | struct pq_elem_st *e; |
301 | | |
302 | 3.64M | if (pq == NULL) |
303 | 0 | return 0; |
304 | 3.64M | cur_max = pq->hmax; |
305 | 3.64M | if (pq->htop + n < cur_max) |
306 | 3.59M | return 1; |
307 | | |
308 | 48.5k | new_max = compute_pqueue_growth(n + cur_max, cur_max); |
309 | 48.5k | if (new_max == 0) { |
310 | 0 | ERR_raise(ERR_LIB_SSL, ERR_R_INTERNAL_ERROR); |
311 | 0 | return 0; |
312 | 0 | } |
313 | | |
314 | 48.5k | h = OPENSSL_realloc(pq->heap, new_max * sizeof(*pq->heap)); |
315 | 48.5k | if (h == NULL) |
316 | 0 | return 0; |
317 | 48.5k | pq->heap = h; |
318 | | |
319 | 48.5k | e = OPENSSL_realloc(pq->elements, new_max * sizeof(*pq->elements)); |
320 | 48.5k | if (e == NULL) |
321 | 0 | return 0; |
322 | 48.5k | pq->elements = e; |
323 | | |
324 | 48.5k | pq->hmax = new_max; |
325 | 48.5k | pqueue_add_freelist(pq, cur_max); |
326 | 48.5k | return 1; |
327 | 48.5k | } |
328 | | |
329 | | OSSL_PQUEUE *ossl_pqueue_new(int (*compare)(const void *, const void *)) |
330 | 3.20M | { |
331 | 3.20M | OSSL_PQUEUE *pq; |
332 | | |
333 | 3.20M | if (compare == NULL) |
334 | 0 | return NULL; |
335 | | |
336 | 3.20M | pq = OPENSSL_malloc(sizeof(*pq)); |
337 | 3.20M | if (pq == NULL) |
338 | 0 | return NULL; |
339 | 3.20M | pq->compare = compare; |
340 | 3.20M | pq->hmax = min_nodes; |
341 | 3.20M | pq->htop = 0; |
342 | 3.20M | pq->freelist = 0; |
343 | 3.20M | pq->heap = OPENSSL_malloc(sizeof(*pq->heap) * min_nodes); |
344 | 3.20M | pq->elements = OPENSSL_malloc(sizeof(*pq->elements) * min_nodes); |
345 | 3.20M | if (pq->heap == NULL || pq->elements == NULL) { |
346 | 0 | ossl_pqueue_free(pq); |
347 | 0 | return NULL; |
348 | 0 | } |
349 | 3.20M | pqueue_add_freelist(pq, 0); |
350 | 3.20M | return pq; |
351 | 3.20M | } |
352 | | |
353 | | void ossl_pqueue_free(OSSL_PQUEUE *pq) |
354 | 3.20M | { |
355 | 3.20M | if (pq != NULL) { |
356 | 3.20M | OPENSSL_free(pq->heap); |
357 | 3.20M | OPENSSL_free(pq->elements); |
358 | 3.20M | OPENSSL_free(pq); |
359 | 3.20M | } |
360 | 3.20M | } |
361 | | |
362 | | void ossl_pqueue_pop_free(OSSL_PQUEUE *pq, void (*freefunc)(void *)) |
363 | 0 | { |
364 | 0 | size_t i; |
365 | |
|
366 | 0 | if (pq != NULL) { |
367 | 0 | for (i = 0; i < pq->htop; i++) |
368 | 0 | (*freefunc)(pq->heap[i].data); |
369 | 0 | ossl_pqueue_free(pq); |
370 | 0 | } |
371 | 0 | } |
372 | | |
373 | | size_t ossl_pqueue_num(const OSSL_PQUEUE *pq) |
374 | 4.79M | { |
375 | 4.79M | return pq != NULL ? pq->htop : 0; |
376 | 4.79M | } |