Line | Count | Source (jump to first uncovered line) |
1 | | #define USE_THE_REPOSITORY_VARIABLE |
2 | | |
3 | | #include "git-compat-util.h" |
4 | | #include "pseudo-merge.h" |
5 | | #include "date.h" |
6 | | #include "oid-array.h" |
7 | | #include "strbuf.h" |
8 | | #include "config.h" |
9 | | #include "string-list.h" |
10 | | #include "refs.h" |
11 | | #include "pack-bitmap.h" |
12 | | #include "commit.h" |
13 | | #include "alloc.h" |
14 | | #include "progress.h" |
15 | | #include "hex.h" |
16 | | |
17 | 0 | #define DEFAULT_PSEUDO_MERGE_DECAY 1.0 |
18 | 0 | #define DEFAULT_PSEUDO_MERGE_MAX_MERGES 64 |
19 | 0 | #define DEFAULT_PSEUDO_MERGE_SAMPLE_RATE 1 |
20 | 0 | #define DEFAULT_PSEUDO_MERGE_THRESHOLD approxidate("1.week.ago") |
21 | 0 | #define DEFAULT_PSEUDO_MERGE_STABLE_THRESHOLD approxidate("1.month.ago") |
22 | 0 | #define DEFAULT_PSEUDO_MERGE_STABLE_SIZE 512 |
23 | | |
24 | | static double gitexp(double base, int exp) |
25 | 0 | { |
26 | 0 | double result = 1; |
27 | 0 | while (1) { |
28 | 0 | if (exp % 2) |
29 | 0 | result *= base; |
30 | 0 | exp >>= 1; |
31 | 0 | if (!exp) |
32 | 0 | break; |
33 | 0 | base *= base; |
34 | 0 | } |
35 | 0 | return result; |
36 | 0 | } |
37 | | |
38 | | static uint32_t pseudo_merge_group_size(const struct pseudo_merge_group *group, |
39 | | const struct pseudo_merge_matches *matches, |
40 | | uint32_t i) |
41 | 0 | { |
42 | 0 | double C = 0.0f; |
43 | 0 | uint32_t n; |
44 | | |
45 | | /* |
46 | | * The size of pseudo-merge groups decays according to a power series, |
47 | | * which looks like: |
48 | | * |
49 | | * f(n) = C * n^-k |
50 | | * |
51 | | * , where 'n' is the n-th pseudo-merge group, 'f(n)' is its size, 'k' |
52 | | * is the decay rate, and 'C' is a scaling value. |
53 | | * |
54 | | * The value of C depends on the number of groups, decay rate, and total |
55 | | * number of commits. It is computed such that if there are M and N |
56 | | * total groups and commits, respectively, that: |
57 | | * |
58 | | * N = f(0) + f(1) + ... f(M-1) |
59 | | * |
60 | | * Rearranging to isolate C, we get: |
61 | | * |
62 | | * N = \sum_{n=1}^M C / n^k |
63 | | * |
64 | | * N / C = \sum_{n=1}^M n^-k |
65 | | * |
66 | | * C = N / \sum_{n=1}^M n^-k |
67 | | * |
68 | | * For example, if we have a decay rate of 'k' being equal to 1.5, 'N' |
69 | | * total commits equal to 10,000, and 'M' being equal to 6 groups, then |
70 | | * the (rounded) group sizes are: |
71 | | * |
72 | | * { 5469, 1934, 1053, 684, 489, 372 } |
73 | | * |
74 | | * increasing the number of total groups, say to 10, scales the group |
75 | | * sizes appropriately: |
76 | | * |
77 | | * { 5012, 1772, 964, 626, 448, 341, 271, 221, 186, 158 } |
78 | | */ |
79 | 0 | for (n = 0; n < group->max_merges; n++) |
80 | 0 | C += 1.0 / gitexp(n + 1, group->decay); |
81 | 0 | C = matches->unstable_nr / C; |
82 | |
|
83 | 0 | return (uint32_t)((C / gitexp(i + 1, group->decay)) + 0.5); |
84 | 0 | } |
85 | | |
86 | | static void pseudo_merge_group_init(struct pseudo_merge_group *group) |
87 | 0 | { |
88 | 0 | memset(group, 0, sizeof(struct pseudo_merge_group)); |
89 | |
|
90 | 0 | strmap_init_with_options(&group->matches, NULL, 0); |
91 | |
|
92 | 0 | group->decay = DEFAULT_PSEUDO_MERGE_DECAY; |
93 | 0 | group->max_merges = DEFAULT_PSEUDO_MERGE_MAX_MERGES; |
94 | 0 | group->sample_rate = DEFAULT_PSEUDO_MERGE_SAMPLE_RATE; |
95 | 0 | group->threshold = DEFAULT_PSEUDO_MERGE_THRESHOLD; |
96 | 0 | group->stable_threshold = DEFAULT_PSEUDO_MERGE_STABLE_THRESHOLD; |
97 | 0 | group->stable_size = DEFAULT_PSEUDO_MERGE_STABLE_SIZE; |
98 | 0 | } |
99 | | |
100 | | static int pseudo_merge_config(const char *var, const char *value, |
101 | | const struct config_context *ctx, |
102 | | void *cb_data) |
103 | 0 | { |
104 | 0 | struct string_list *list = cb_data; |
105 | 0 | struct string_list_item *item; |
106 | 0 | struct pseudo_merge_group *group; |
107 | 0 | struct strbuf buf = STRBUF_INIT; |
108 | 0 | const char *sub, *key; |
109 | 0 | size_t sub_len; |
110 | 0 | int ret = 0; |
111 | |
|
112 | 0 | if (parse_config_key(var, "bitmappseudomerge", &sub, &sub_len, &key)) |
113 | 0 | goto done; |
114 | | |
115 | 0 | if (!sub_len) |
116 | 0 | goto done; |
117 | | |
118 | 0 | strbuf_add(&buf, sub, sub_len); |
119 | |
|
120 | 0 | item = string_list_lookup(list, buf.buf); |
121 | 0 | if (!item) { |
122 | 0 | item = string_list_insert(list, buf.buf); |
123 | |
|
124 | 0 | item->util = xmalloc(sizeof(struct pseudo_merge_group)); |
125 | 0 | pseudo_merge_group_init(item->util); |
126 | 0 | } |
127 | |
|
128 | 0 | group = item->util; |
129 | |
|
130 | 0 | if (!strcmp(key, "pattern")) { |
131 | 0 | struct strbuf re = STRBUF_INIT; |
132 | |
|
133 | 0 | free(group->pattern); |
134 | 0 | if (*value != '^') |
135 | 0 | strbuf_addch(&re, '^'); |
136 | 0 | strbuf_addstr(&re, value); |
137 | |
|
138 | 0 | group->pattern = xcalloc(1, sizeof(regex_t)); |
139 | 0 | if (regcomp(group->pattern, re.buf, REG_EXTENDED)) |
140 | 0 | die(_("failed to load pseudo-merge regex for %s: '%s'"), |
141 | 0 | sub, re.buf); |
142 | | |
143 | 0 | strbuf_release(&re); |
144 | 0 | } else if (!strcmp(key, "decay")) { |
145 | 0 | group->decay = git_config_double(var, value, ctx->kvi); |
146 | 0 | if (group->decay < 0) { |
147 | 0 | warning(_("%s must be non-negative, using default"), var); |
148 | 0 | group->decay = DEFAULT_PSEUDO_MERGE_DECAY; |
149 | 0 | } |
150 | 0 | } else if (!strcmp(key, "samplerate")) { |
151 | 0 | group->sample_rate = git_config_double(var, value, ctx->kvi); |
152 | 0 | if (!(0 <= group->sample_rate && group->sample_rate <= 1)) { |
153 | 0 | warning(_("%s must be between 0 and 1, using default"), var); |
154 | 0 | group->sample_rate = DEFAULT_PSEUDO_MERGE_SAMPLE_RATE; |
155 | 0 | } |
156 | 0 | } else if (!strcmp(key, "threshold")) { |
157 | 0 | if (git_config_expiry_date(&group->threshold, var, value)) { |
158 | 0 | ret = -1; |
159 | 0 | goto done; |
160 | 0 | } |
161 | 0 | } else if (!strcmp(key, "maxmerges")) { |
162 | 0 | group->max_merges = git_config_int(var, value, ctx->kvi); |
163 | 0 | if (group->max_merges < 0) { |
164 | 0 | warning(_("%s must be non-negative, using default"), var); |
165 | 0 | group->max_merges = DEFAULT_PSEUDO_MERGE_MAX_MERGES; |
166 | 0 | } |
167 | 0 | } else if (!strcmp(key, "stablethreshold")) { |
168 | 0 | if (git_config_expiry_date(&group->stable_threshold, var, value)) { |
169 | 0 | ret = -1; |
170 | 0 | goto done; |
171 | 0 | } |
172 | 0 | } else if (!strcmp(key, "stablesize")) { |
173 | 0 | group->stable_size = git_config_int(var, value, ctx->kvi); |
174 | 0 | if (group->stable_size <= 0) { |
175 | 0 | warning(_("%s must be positive, using default"), var); |
176 | 0 | group->stable_size = DEFAULT_PSEUDO_MERGE_STABLE_SIZE; |
177 | 0 | } |
178 | 0 | } |
179 | | |
180 | 0 | done: |
181 | 0 | strbuf_release(&buf); |
182 | |
|
183 | 0 | return ret; |
184 | 0 | } |
185 | | |
186 | | void load_pseudo_merges_from_config(struct repository *r, |
187 | | struct string_list *list) |
188 | 0 | { |
189 | 0 | struct string_list_item *item; |
190 | |
|
191 | 0 | repo_config(r, pseudo_merge_config, list); |
192 | |
|
193 | 0 | for_each_string_list_item(item, list) { |
194 | 0 | struct pseudo_merge_group *group = item->util; |
195 | 0 | if (!group->pattern) |
196 | 0 | die(_("pseudo-merge group '%s' missing required pattern"), |
197 | 0 | item->string); |
198 | 0 | if (group->threshold < group->stable_threshold) |
199 | 0 | die(_("pseudo-merge group '%s' has unstable threshold " |
200 | 0 | "before stable one"), item->string); |
201 | 0 | } |
202 | 0 | } |
203 | | |
204 | | static int find_pseudo_merge_group_for_ref(const char *refname, |
205 | | const char *referent UNUSED, |
206 | | const struct object_id *oid, |
207 | | int flags UNUSED, |
208 | | void *_data) |
209 | 0 | { |
210 | 0 | struct bitmap_writer *writer = _data; |
211 | 0 | struct object_id peeled; |
212 | 0 | struct commit *c; |
213 | 0 | uint32_t i; |
214 | 0 | int has_bitmap; |
215 | |
|
216 | 0 | if (!peel_iterated_oid(the_repository, oid, &peeled)) |
217 | 0 | oid = &peeled; |
218 | |
|
219 | 0 | c = lookup_commit(the_repository, oid); |
220 | 0 | if (!c) |
221 | 0 | return 0; |
222 | 0 | if (!packlist_find(writer->to_pack, oid)) |
223 | 0 | return 0; |
224 | | |
225 | 0 | has_bitmap = bitmap_writer_has_bitmapped_object_id(writer, oid); |
226 | |
|
227 | 0 | for (i = 0; i < writer->pseudo_merge_groups.nr; i++) { |
228 | 0 | struct pseudo_merge_group *group; |
229 | 0 | struct pseudo_merge_matches *matches; |
230 | 0 | struct strbuf group_name = STRBUF_INIT; |
231 | 0 | regmatch_t captures[16]; |
232 | 0 | size_t j; |
233 | |
|
234 | 0 | group = writer->pseudo_merge_groups.items[i].util; |
235 | 0 | if (regexec(group->pattern, refname, ARRAY_SIZE(captures), |
236 | 0 | captures, 0)) |
237 | 0 | continue; |
238 | | |
239 | 0 | if (captures[ARRAY_SIZE(captures) - 1].rm_so != -1) |
240 | 0 | warning(_("pseudo-merge regex from config has too many capture " |
241 | 0 | "groups (max=%"PRIuMAX")"), |
242 | 0 | (uintmax_t)ARRAY_SIZE(captures) - 2); |
243 | |
|
244 | 0 | for (j = !!group->pattern->re_nsub; j < ARRAY_SIZE(captures); j++) { |
245 | 0 | regmatch_t *match = &captures[j]; |
246 | 0 | if (match->rm_so == -1) |
247 | 0 | continue; |
248 | | |
249 | 0 | if (group_name.len) |
250 | 0 | strbuf_addch(&group_name, '-'); |
251 | |
|
252 | 0 | strbuf_add(&group_name, refname + match->rm_so, |
253 | 0 | match->rm_eo - match->rm_so); |
254 | 0 | } |
255 | |
|
256 | 0 | matches = strmap_get(&group->matches, group_name.buf); |
257 | 0 | if (!matches) { |
258 | 0 | matches = xcalloc(1, sizeof(*matches)); |
259 | 0 | strmap_put(&group->matches, strbuf_detach(&group_name, NULL), |
260 | 0 | matches); |
261 | 0 | } |
262 | |
|
263 | 0 | if (c->date <= group->stable_threshold) { |
264 | 0 | ALLOC_GROW(matches->stable, matches->stable_nr + 1, |
265 | 0 | matches->stable_alloc); |
266 | 0 | matches->stable[matches->stable_nr++] = c; |
267 | 0 | } else if (c->date <= group->threshold && !has_bitmap) { |
268 | 0 | ALLOC_GROW(matches->unstable, matches->unstable_nr + 1, |
269 | 0 | matches->unstable_alloc); |
270 | 0 | matches->unstable[matches->unstable_nr++] = c; |
271 | 0 | } |
272 | |
|
273 | 0 | strbuf_release(&group_name); |
274 | 0 | } |
275 | |
|
276 | 0 | return 0; |
277 | 0 | } |
278 | | |
279 | | static struct commit *push_pseudo_merge(struct pseudo_merge_group *group) |
280 | 0 | { |
281 | 0 | struct commit *merge; |
282 | |
|
283 | 0 | ALLOC_GROW(group->merges, group->merges_nr + 1, group->merges_alloc); |
284 | |
|
285 | 0 | merge = alloc_commit_node(the_repository); |
286 | 0 | merge->object.parsed = 1; |
287 | 0 | merge->object.flags |= BITMAP_PSEUDO_MERGE; |
288 | |
|
289 | 0 | group->merges[group->merges_nr++] = merge; |
290 | |
|
291 | 0 | return merge; |
292 | 0 | } |
293 | | |
294 | | static struct pseudo_merge_commit_idx *pseudo_merge_idx(kh_oid_map_t *pseudo_merge_commits, |
295 | | const struct object_id *oid) |
296 | | |
297 | 0 | { |
298 | 0 | struct pseudo_merge_commit_idx *pmc; |
299 | 0 | int hash_ret; |
300 | 0 | khiter_t hash_pos = kh_put_oid_map(pseudo_merge_commits, *oid, |
301 | 0 | &hash_ret); |
302 | |
|
303 | 0 | if (hash_ret) { |
304 | 0 | CALLOC_ARRAY(pmc, 1); |
305 | 0 | kh_value(pseudo_merge_commits, hash_pos) = pmc; |
306 | 0 | } else { |
307 | 0 | pmc = kh_value(pseudo_merge_commits, hash_pos); |
308 | 0 | } |
309 | |
|
310 | 0 | return pmc; |
311 | 0 | } |
312 | | |
313 | 0 | #define MIN_PSEUDO_MERGE_SIZE 8 |
314 | | |
315 | | static void select_pseudo_merges_1(struct bitmap_writer *writer, |
316 | | struct pseudo_merge_group *group, |
317 | | struct pseudo_merge_matches *matches) |
318 | 0 | { |
319 | 0 | uint32_t i, j; |
320 | 0 | uint32_t stable_merges_nr; |
321 | |
|
322 | 0 | if (!matches->stable_nr && !matches->unstable_nr) |
323 | 0 | return; /* all tips in this group already have bitmaps */ |
324 | | |
325 | 0 | stable_merges_nr = matches->stable_nr / group->stable_size; |
326 | 0 | if (matches->stable_nr % group->stable_size) |
327 | 0 | stable_merges_nr++; |
328 | | |
329 | | /* make stable_merges_nr pseudo merges for stable commits */ |
330 | 0 | for (i = 0, j = 0; i < stable_merges_nr; i++) { |
331 | 0 | struct commit *merge; |
332 | 0 | struct commit_list **p; |
333 | |
|
334 | 0 | merge = push_pseudo_merge(group); |
335 | 0 | p = &merge->parents; |
336 | | |
337 | | /* |
338 | | * For each pseudo-merge created above, add parents to the |
339 | | * allocated commit node from the stable set of commits |
340 | | * (un-bitmapped, newer than the stable threshold). |
341 | | */ |
342 | 0 | do { |
343 | 0 | struct commit *c; |
344 | 0 | struct pseudo_merge_commit_idx *pmc; |
345 | |
|
346 | 0 | if (j >= matches->stable_nr) |
347 | 0 | break; |
348 | | |
349 | 0 | c = matches->stable[j++]; |
350 | | /* |
351 | | * Here and below, make sure that we keep our mapping of |
352 | | * commits -> pseudo-merge(s) which include the key'd |
353 | | * commit up-to-date. |
354 | | */ |
355 | 0 | pmc = pseudo_merge_idx(writer->pseudo_merge_commits, |
356 | 0 | &c->object.oid); |
357 | |
|
358 | 0 | ALLOC_GROW(pmc->pseudo_merge, pmc->nr + 1, pmc->alloc); |
359 | |
|
360 | 0 | pmc->pseudo_merge[pmc->nr++] = writer->pseudo_merges_nr; |
361 | 0 | p = commit_list_append(c, p); |
362 | 0 | } while (j % group->stable_size); |
363 | | |
364 | 0 | if (merge->parents) { |
365 | 0 | bitmap_writer_push_commit(writer, merge, 1); |
366 | 0 | writer->pseudo_merges_nr++; |
367 | 0 | } |
368 | 0 | } |
369 | | |
370 | | /* make up to group->max_merges pseudo merges for unstable commits */ |
371 | 0 | for (i = 0, j = 0; i < group->max_merges; i++) { |
372 | 0 | struct commit *merge; |
373 | 0 | struct commit_list **p; |
374 | 0 | uint32_t size, end; |
375 | |
|
376 | 0 | merge = push_pseudo_merge(group); |
377 | 0 | p = &merge->parents; |
378 | |
|
379 | 0 | size = pseudo_merge_group_size(group, matches, i); |
380 | 0 | end = size < MIN_PSEUDO_MERGE_SIZE ? matches->unstable_nr : j + size; |
381 | | |
382 | | /* |
383 | | * For each pseudo-merge commit created above, add parents to |
384 | | * the allocated commit node from the unstable set of commits |
385 | | * (newer than the stable threshold). |
386 | | * |
387 | | * Account for the sample rate, since not every candidate from |
388 | | * the set of stable commits will be included as a pseudo-merge |
389 | | * parent. |
390 | | */ |
391 | 0 | for (; j < end && j < matches->unstable_nr; j++) { |
392 | 0 | struct commit *c = matches->unstable[j]; |
393 | 0 | struct pseudo_merge_commit_idx *pmc; |
394 | |
|
395 | 0 | if (j % (uint32_t)(1.0 / group->sample_rate)) |
396 | 0 | continue; |
397 | | |
398 | 0 | pmc = pseudo_merge_idx(writer->pseudo_merge_commits, |
399 | 0 | &c->object.oid); |
400 | |
|
401 | 0 | ALLOC_GROW(pmc->pseudo_merge, pmc->nr + 1, pmc->alloc); |
402 | |
|
403 | 0 | pmc->pseudo_merge[pmc->nr++] = writer->pseudo_merges_nr; |
404 | 0 | p = commit_list_append(c, p); |
405 | 0 | } |
406 | |
|
407 | 0 | if (merge->parents) { |
408 | 0 | bitmap_writer_push_commit(writer, merge, 1); |
409 | 0 | writer->pseudo_merges_nr++; } |
410 | 0 | if (end >= matches->unstable_nr) |
411 | 0 | break; |
412 | 0 | } |
413 | 0 | } |
414 | | |
415 | | static int commit_date_cmp(const void *va, const void *vb) |
416 | 0 | { |
417 | 0 | timestamp_t a = (*(const struct commit **)va)->date; |
418 | 0 | timestamp_t b = (*(const struct commit **)vb)->date; |
419 | |
|
420 | 0 | if (a < b) |
421 | 0 | return -1; |
422 | 0 | else if (a > b) |
423 | 0 | return 1; |
424 | 0 | return 0; |
425 | 0 | } |
426 | | |
427 | | static void sort_pseudo_merge_matches(struct pseudo_merge_matches *matches) |
428 | 0 | { |
429 | 0 | QSORT(matches->stable, matches->stable_nr, commit_date_cmp); |
430 | 0 | QSORT(matches->unstable, matches->unstable_nr, commit_date_cmp); |
431 | 0 | } |
432 | | |
433 | | void select_pseudo_merges(struct bitmap_writer *writer) |
434 | 0 | { |
435 | 0 | struct progress *progress = NULL; |
436 | 0 | uint32_t i; |
437 | |
|
438 | 0 | if (!writer->pseudo_merge_groups.nr) |
439 | 0 | return; |
440 | | |
441 | 0 | if (writer->show_progress) |
442 | 0 | progress = start_progress("Selecting pseudo-merge commits", |
443 | 0 | writer->pseudo_merge_groups.nr); |
444 | |
|
445 | 0 | refs_for_each_ref(get_main_ref_store(the_repository), |
446 | 0 | find_pseudo_merge_group_for_ref, writer); |
447 | |
|
448 | 0 | for (i = 0; i < writer->pseudo_merge_groups.nr; i++) { |
449 | 0 | struct pseudo_merge_group *group; |
450 | 0 | struct hashmap_iter iter; |
451 | 0 | struct strmap_entry *e; |
452 | |
|
453 | 0 | group = writer->pseudo_merge_groups.items[i].util; |
454 | 0 | strmap_for_each_entry(&group->matches, &iter, e) { |
455 | 0 | struct pseudo_merge_matches *matches = e->value; |
456 | |
|
457 | 0 | sort_pseudo_merge_matches(matches); |
458 | |
|
459 | 0 | select_pseudo_merges_1(writer, group, matches); |
460 | 0 | } |
461 | |
|
462 | 0 | display_progress(progress, i + 1); |
463 | 0 | } |
464 | |
|
465 | 0 | stop_progress(&progress); |
466 | 0 | } |
467 | | |
468 | | void free_pseudo_merge_map(struct pseudo_merge_map *pm) |
469 | 0 | { |
470 | 0 | uint32_t i; |
471 | 0 | for (i = 0; i < pm->nr; i++) { |
472 | 0 | ewah_pool_free(pm->v[i].commits); |
473 | 0 | ewah_pool_free(pm->v[i].bitmap); |
474 | 0 | } |
475 | 0 | free(pm->v); |
476 | 0 | } |
477 | | |
478 | | struct pseudo_merge_commit_ext { |
479 | | uint32_t nr; |
480 | | const unsigned char *ptr; |
481 | | }; |
482 | | |
483 | | static int pseudo_merge_ext_at(const struct pseudo_merge_map *pm, |
484 | | struct pseudo_merge_commit_ext *ext, size_t at) |
485 | 0 | { |
486 | 0 | if (at >= pm->map_size) |
487 | 0 | return error(_("extended pseudo-merge read out-of-bounds " |
488 | 0 | "(%"PRIuMAX" >= %"PRIuMAX")"), |
489 | 0 | (uintmax_t)at, (uintmax_t)pm->map_size); |
490 | 0 | if (at + 4 >= pm->map_size) |
491 | 0 | return error(_("extended pseudo-merge entry is too short " |
492 | 0 | "(%"PRIuMAX" >= %"PRIuMAX")"), |
493 | 0 | (uintmax_t)(at + 4), (uintmax_t)pm->map_size); |
494 | | |
495 | 0 | ext->nr = get_be32(pm->map + at); |
496 | 0 | ext->ptr = pm->map + at + sizeof(uint32_t); |
497 | |
|
498 | 0 | return 0; |
499 | 0 | } |
500 | | |
501 | | struct ewah_bitmap *pseudo_merge_bitmap(const struct pseudo_merge_map *pm, |
502 | | struct pseudo_merge *merge) |
503 | 0 | { |
504 | 0 | if (!merge->loaded_commits) |
505 | 0 | BUG("cannot use unloaded pseudo-merge bitmap"); |
506 | | |
507 | 0 | if (!merge->loaded_bitmap) { |
508 | 0 | size_t at = merge->bitmap_at; |
509 | |
|
510 | 0 | merge->bitmap = read_bitmap(pm->map, pm->map_size, &at); |
511 | 0 | merge->loaded_bitmap = 1; |
512 | 0 | } |
513 | |
|
514 | 0 | return merge->bitmap; |
515 | 0 | } |
516 | | |
517 | | struct pseudo_merge *use_pseudo_merge(const struct pseudo_merge_map *pm, |
518 | | struct pseudo_merge *merge) |
519 | 0 | { |
520 | 0 | if (!merge->loaded_commits) { |
521 | 0 | size_t pos = merge->at; |
522 | |
|
523 | 0 | merge->commits = read_bitmap(pm->map, pm->map_size, &pos); |
524 | 0 | merge->bitmap_at = pos; |
525 | 0 | merge->loaded_commits = 1; |
526 | 0 | } |
527 | 0 | return merge; |
528 | 0 | } |
529 | | |
530 | | static struct pseudo_merge *pseudo_merge_at(const struct pseudo_merge_map *pm, |
531 | | struct object_id *oid, |
532 | | size_t want) |
533 | 0 | { |
534 | 0 | size_t lo = 0; |
535 | 0 | size_t hi = pm->nr; |
536 | |
|
537 | 0 | while (lo < hi) { |
538 | 0 | size_t mi = lo + (hi - lo) / 2; |
539 | 0 | size_t got = pm->v[mi].at; |
540 | |
|
541 | 0 | if (got == want) |
542 | 0 | return use_pseudo_merge(pm, &pm->v[mi]); |
543 | 0 | else if (got < want) |
544 | 0 | hi = mi; |
545 | 0 | else |
546 | 0 | lo = mi + 1; |
547 | 0 | } |
548 | | |
549 | 0 | warning(_("could not find pseudo-merge for commit %s at offset %"PRIuMAX), |
550 | 0 | oid_to_hex(oid), (uintmax_t)want); |
551 | |
|
552 | 0 | return NULL; |
553 | 0 | } |
554 | | |
555 | | struct pseudo_merge_commit { |
556 | | uint32_t commit_pos; |
557 | | uint64_t pseudo_merge_ofs; |
558 | | }; |
559 | | |
560 | 0 | #define PSEUDO_MERGE_COMMIT_RAWSZ (sizeof(uint32_t)+sizeof(uint64_t)) |
561 | | |
562 | | static void read_pseudo_merge_commit_at(struct pseudo_merge_commit *merge, |
563 | | const unsigned char *at) |
564 | 0 | { |
565 | 0 | merge->commit_pos = get_be32(at); |
566 | 0 | merge->pseudo_merge_ofs = get_be64(at + sizeof(uint32_t)); |
567 | 0 | } |
568 | | |
569 | | static int nth_pseudo_merge_ext(const struct pseudo_merge_map *pm, |
570 | | struct pseudo_merge_commit_ext *ext, |
571 | | struct pseudo_merge_commit *merge, |
572 | | uint32_t n) |
573 | 0 | { |
574 | 0 | size_t ofs; |
575 | |
|
576 | 0 | if (n >= ext->nr) |
577 | 0 | return error(_("extended pseudo-merge lookup out-of-bounds " |
578 | 0 | "(%"PRIu32" >= %"PRIu32")"), n, ext->nr); |
579 | | |
580 | 0 | ofs = get_be64(ext->ptr + st_mult(n, sizeof(uint64_t))); |
581 | 0 | if (ofs >= pm->map_size) |
582 | 0 | return error(_("out-of-bounds read: (%"PRIuMAX" >= %"PRIuMAX")"), |
583 | 0 | (uintmax_t)ofs, (uintmax_t)pm->map_size); |
584 | | |
585 | 0 | read_pseudo_merge_commit_at(merge, pm->map + ofs); |
586 | |
|
587 | 0 | return 0; |
588 | 0 | } |
589 | | |
590 | | static unsigned apply_pseudo_merge(const struct pseudo_merge_map *pm, |
591 | | struct pseudo_merge *merge, |
592 | | struct bitmap *result, |
593 | | struct bitmap *roots) |
594 | 0 | { |
595 | 0 | if (merge->satisfied) |
596 | 0 | return 0; |
597 | | |
598 | 0 | if (!ewah_bitmap_is_subset(merge->commits, roots ? roots : result)) |
599 | 0 | return 0; |
600 | | |
601 | 0 | bitmap_or_ewah(result, pseudo_merge_bitmap(pm, merge)); |
602 | 0 | if (roots) |
603 | 0 | bitmap_or_ewah(roots, pseudo_merge_bitmap(pm, merge)); |
604 | 0 | merge->satisfied = 1; |
605 | |
|
606 | 0 | return 1; |
607 | 0 | } |
608 | | |
609 | | static int pseudo_merge_commit_cmp(const void *va, const void *vb) |
610 | 0 | { |
611 | 0 | struct pseudo_merge_commit merge; |
612 | 0 | uint32_t key = *(uint32_t*)va; |
613 | |
|
614 | 0 | read_pseudo_merge_commit_at(&merge, vb); |
615 | |
|
616 | 0 | if (key < merge.commit_pos) |
617 | 0 | return -1; |
618 | 0 | if (key > merge.commit_pos) |
619 | 0 | return 1; |
620 | 0 | return 0; |
621 | 0 | } |
622 | | |
623 | | static struct pseudo_merge_commit *find_pseudo_merge(const struct pseudo_merge_map *pm, |
624 | | uint32_t pos) |
625 | 0 | { |
626 | 0 | if (!pm->commits_nr) |
627 | 0 | return NULL; |
628 | | |
629 | 0 | return bsearch(&pos, pm->commits, pm->commits_nr, |
630 | 0 | PSEUDO_MERGE_COMMIT_RAWSZ, pseudo_merge_commit_cmp); |
631 | 0 | } |
632 | | |
633 | | int apply_pseudo_merges_for_commit(const struct pseudo_merge_map *pm, |
634 | | struct bitmap *result, |
635 | | struct commit *commit, uint32_t commit_pos) |
636 | 0 | { |
637 | 0 | struct pseudo_merge *merge; |
638 | 0 | struct pseudo_merge_commit *merge_commit; |
639 | 0 | int ret = 0; |
640 | |
|
641 | 0 | merge_commit = find_pseudo_merge(pm, commit_pos); |
642 | 0 | if (!merge_commit) |
643 | 0 | return 0; |
644 | | |
645 | 0 | if (merge_commit->pseudo_merge_ofs & ((uint64_t)1<<63)) { |
646 | 0 | struct pseudo_merge_commit_ext ext = { 0 }; |
647 | 0 | off_t ofs = merge_commit->pseudo_merge_ofs & ~((uint64_t)1<<63); |
648 | 0 | uint32_t i; |
649 | |
|
650 | 0 | if (pseudo_merge_ext_at(pm, &ext, ofs) < -1) { |
651 | 0 | warning(_("could not read extended pseudo-merge table " |
652 | 0 | "for commit %s"), |
653 | 0 | oid_to_hex(&commit->object.oid)); |
654 | 0 | return ret; |
655 | 0 | } |
656 | | |
657 | 0 | for (i = 0; i < ext.nr; i++) { |
658 | 0 | if (nth_pseudo_merge_ext(pm, &ext, merge_commit, i) < 0) |
659 | 0 | return ret; |
660 | | |
661 | 0 | merge = pseudo_merge_at(pm, &commit->object.oid, |
662 | 0 | merge_commit->pseudo_merge_ofs); |
663 | |
|
664 | 0 | if (!merge) |
665 | 0 | return ret; |
666 | | |
667 | 0 | if (apply_pseudo_merge(pm, merge, result, NULL)) |
668 | 0 | ret++; |
669 | 0 | } |
670 | 0 | } else { |
671 | 0 | merge = pseudo_merge_at(pm, &commit->object.oid, |
672 | 0 | merge_commit->pseudo_merge_ofs); |
673 | |
|
674 | 0 | if (!merge) |
675 | 0 | return ret; |
676 | | |
677 | 0 | if (apply_pseudo_merge(pm, merge, result, NULL)) |
678 | 0 | ret++; |
679 | 0 | } |
680 | | |
681 | 0 | if (ret) |
682 | 0 | cascade_pseudo_merges(pm, result, NULL); |
683 | |
|
684 | 0 | return ret; |
685 | 0 | } |
686 | | |
687 | | int cascade_pseudo_merges(const struct pseudo_merge_map *pm, |
688 | | struct bitmap *result, |
689 | | struct bitmap *roots) |
690 | 0 | { |
691 | 0 | unsigned any_satisfied; |
692 | 0 | int ret = 0; |
693 | |
|
694 | 0 | do { |
695 | 0 | struct pseudo_merge *merge; |
696 | 0 | uint32_t i; |
697 | |
|
698 | 0 | any_satisfied = 0; |
699 | |
|
700 | 0 | for (i = 0; i < pm->nr; i++) { |
701 | 0 | merge = use_pseudo_merge(pm, &pm->v[i]); |
702 | 0 | if (apply_pseudo_merge(pm, merge, result, roots)) { |
703 | 0 | any_satisfied |= 1; |
704 | 0 | ret++; |
705 | 0 | } |
706 | 0 | } |
707 | 0 | } while (any_satisfied); |
708 | |
|
709 | 0 | return ret; |
710 | 0 | } |
711 | | |
712 | | struct pseudo_merge *pseudo_merge_for_parents(const struct pseudo_merge_map *pm, |
713 | | struct bitmap *parents) |
714 | 0 | { |
715 | 0 | struct pseudo_merge *match = NULL; |
716 | 0 | size_t i; |
717 | |
|
718 | 0 | if (!pm->nr) |
719 | 0 | return NULL; |
720 | | |
721 | | /* |
722 | | * NOTE: this loop is quadratic in the worst-case (where no |
723 | | * matching pseudo-merge bitmaps are found), but in practice |
724 | | * this is OK for a few reasons: |
725 | | * |
726 | | * - Rejecting pseudo-merge bitmaps that do not match the |
727 | | * given commit is done quickly (i.e. `bitmap_equals_ewah()` |
728 | | * returns early when we know the two bitmaps aren't equal. |
729 | | * |
730 | | * - Already matched pseudo-merge bitmaps (which we track with |
731 | | * the `->satisfied` bit here) are skipped as potential |
732 | | * candidates. |
733 | | * |
734 | | * - The number of pseudo-merges should be small (in the |
735 | | * hundreds for most repositories). |
736 | | * |
737 | | * If in the future this semi-quadratic behavior does become a |
738 | | * problem, another approach would be to keep track of which |
739 | | * pseudo-merges are still "viable" after enumerating the |
740 | | * pseudo-merge commit's parents: |
741 | | * |
742 | | * - A pseudo-merge bitmap becomes non-viable when the bit(s) |
743 | | * corresponding to one or more parent(s) of the given |
744 | | * commit are not set in a candidate pseudo-merge's commits |
745 | | * bitmap. |
746 | | * |
747 | | * - After processing all bits, enumerate the remaining set of |
748 | | * viable pseudo-merge bitmaps, and check that their |
749 | | * popcount() matches the number of parents in the given |
750 | | * commit. |
751 | | */ |
752 | 0 | for (i = 0; i < pm->nr; i++) { |
753 | 0 | struct pseudo_merge *candidate = use_pseudo_merge(pm, &pm->v[i]); |
754 | 0 | if (!candidate || candidate->satisfied) |
755 | 0 | continue; |
756 | 0 | if (!bitmap_equals_ewah(parents, candidate->commits)) |
757 | 0 | continue; |
758 | | |
759 | 0 | match = candidate; |
760 | 0 | match->satisfied = 1; |
761 | 0 | break; |
762 | 0 | } |
763 | |
|
764 | 0 | return match; |
765 | 0 | } |