Line | Count | Source (jump to first uncovered line) |
1 | | #define USE_THE_REPOSITORY_VARIABLE |
2 | | |
3 | | #include "git-compat-util.h" |
4 | | #include "tag.h" |
5 | | #include "commit.h" |
6 | | #include "commit-graph.h" |
7 | | #include "environment.h" |
8 | | #include "gettext.h" |
9 | | #include "hex.h" |
10 | | #include "repository.h" |
11 | | #include "object-name.h" |
12 | | #include "object-store-ll.h" |
13 | | #include "utf8.h" |
14 | | #include "diff.h" |
15 | | #include "revision.h" |
16 | | #include "notes.h" |
17 | | #include "alloc.h" |
18 | | #include "gpg-interface.h" |
19 | | #include "mergesort.h" |
20 | | #include "commit-slab.h" |
21 | | #include "prio-queue.h" |
22 | | #include "hash-lookup.h" |
23 | | #include "wt-status.h" |
24 | | #include "advice.h" |
25 | | #include "refs.h" |
26 | | #include "commit-reach.h" |
27 | | #include "setup.h" |
28 | | #include "shallow.h" |
29 | | #include "tree.h" |
30 | | #include "hook.h" |
31 | | #include "parse.h" |
32 | | #include "object-file-convert.h" |
33 | | |
34 | | static struct commit_extra_header *read_commit_extra_header_lines(const char *buf, size_t len, const char **); |
35 | | |
36 | | int save_commit_buffer = 1; /* when nonzero, repo_parse_commit_internal() caches the raw buffer of each successfully parsed commit */ |
37 | | int no_graft_file_deprecated_advice; /* when nonzero, read_graft_file() skips the graft-file deprecation advice */ |
38 | | |
39 | | const char *commit_type = "commit"; |
40 | | |
41 | | struct commit *lookup_commit_reference_gently(struct repository *r, |
42 | | const struct object_id *oid, int quiet) |
43 | 0 | { |
44 | 0 | struct object *obj = deref_tag(r, |
45 | 0 | parse_object(r, oid), |
46 | 0 | NULL, 0); |
47 | |
|
48 | 0 | if (!obj) |
49 | 0 | return NULL; |
50 | 0 | return object_as_type(obj, OBJ_COMMIT, quiet); |
51 | 0 | } |
52 | | |
/* Same as lookup_commit_reference_gently() with quiet set to 0. */
struct commit *lookup_commit_reference(struct repository *r, const struct object_id *oid)
{
	const int quiet = 0;

	return lookup_commit_reference_gently(r, oid, quiet);
}
57 | | |
58 | | struct commit *lookup_commit_or_die(const struct object_id *oid, const char *ref_name) |
59 | 0 | { |
60 | 0 | struct commit *c = lookup_commit_reference(the_repository, oid); |
61 | 0 | if (!c) |
62 | 0 | die(_("could not parse %s"), ref_name); |
63 | 0 | if (!oideq(oid, &c->object.oid)) { |
64 | 0 | warning(_("%s %s is not a commit!"), |
65 | 0 | ref_name, oid_to_hex(oid)); |
66 | 0 | } |
67 | 0 | return c; |
68 | 0 | } |
69 | | |
70 | | struct commit *lookup_commit_object(struct repository *r, |
71 | | const struct object_id *oid) |
72 | 0 | { |
73 | 0 | struct object *obj = parse_object(r, oid); |
74 | 0 | return obj ? object_as_type(obj, OBJ_COMMIT, 0) : NULL; |
75 | |
|
76 | 0 | } |
77 | | |
78 | | struct commit *lookup_commit(struct repository *r, const struct object_id *oid) |
79 | 0 | { |
80 | 0 | struct object *obj = lookup_object(r, oid); |
81 | 0 | if (!obj) |
82 | 0 | return create_object(r, oid, alloc_commit_node(r)); |
83 | 0 | return object_as_type(obj, OBJ_COMMIT, 0); |
84 | 0 | } |
85 | | |
/* Same as lookup_commit_reference_by_name_gently() with quiet set to 0. */
struct commit *lookup_commit_reference_by_name(const char *name)
{
	const int quiet = 0;

	return lookup_commit_reference_by_name_gently(name, quiet);
}
90 | | |
91 | | struct commit *lookup_commit_reference_by_name_gently(const char *name, |
92 | | int quiet) |
93 | 0 | { |
94 | 0 | struct object_id oid; |
95 | 0 | struct commit *commit; |
96 | |
|
97 | 0 | if (repo_get_oid_committish(the_repository, name, &oid)) |
98 | 0 | return NULL; |
99 | 0 | commit = lookup_commit_reference_gently(the_repository, &oid, quiet); |
100 | 0 | if (repo_parse_commit(the_repository, commit)) |
101 | 0 | return NULL; |
102 | 0 | return commit; |
103 | 0 | } |
104 | | |
105 | | static timestamp_t parse_commit_date(const char *buf, const char *tail) |
106 | 0 | { |
107 | 0 | const char *dateptr; |
108 | 0 | const char *eol; |
109 | |
|
110 | 0 | if (buf + 6 >= tail) |
111 | 0 | return 0; |
112 | 0 | if (memcmp(buf, "author", 6)) |
113 | 0 | return 0; |
114 | 0 | while (buf < tail && *buf++ != '\n') |
115 | 0 | /* nada */; |
116 | 0 | if (buf + 9 >= tail) |
117 | 0 | return 0; |
118 | 0 | if (memcmp(buf, "committer", 9)) |
119 | 0 | return 0; |
120 | | |
121 | | /* |
122 | | * Jump to end-of-line so that we can walk backwards to find the |
123 | | * end-of-email ">". This is more forgiving of malformed cases |
124 | | * because unexpected characters tend to be in the name and email |
125 | | * fields. |
126 | | */ |
127 | 0 | eol = memchr(buf, '\n', tail - buf); |
128 | 0 | if (!eol) |
129 | 0 | return 0; |
130 | 0 | dateptr = eol; |
131 | 0 | while (dateptr > buf && dateptr[-1] != '>') |
132 | 0 | dateptr--; |
133 | 0 | if (dateptr == buf) |
134 | 0 | return 0; |
135 | | |
136 | | /* |
137 | | * Trim leading whitespace, but make sure we have at least one |
138 | | * non-whitespace character, as parse_timestamp() will otherwise walk |
139 | | * right past the newline we found in "eol" when skipping whitespace |
140 | | * itself. |
141 | | * |
142 | | * In theory it would be sufficient to allow any character not matched |
143 | | * by isspace(), but there's a catch: our isspace() does not |
144 | | * necessarily match the behavior of parse_timestamp(), as the latter |
145 | | * is implemented by system routines which match more exotic control |
146 | | * codes, or even locale-dependent sequences. |
147 | | * |
148 | | * Since we expect the timestamp to be a number, we can check for that. |
149 | | * Anything else (e.g., a non-numeric token like "foo") would just |
150 | | * cause parse_timestamp() to return 0 anyway. |
151 | | */ |
152 | 0 | while (dateptr < eol && isspace(*dateptr)) |
153 | 0 | dateptr++; |
154 | 0 | if (!isdigit(*dateptr) && *dateptr != '-') |
155 | 0 | return 0; |
156 | | |
157 | | /* |
158 | | * We know there is at least one digit (or dash), so we'll begin |
159 | | * parsing there and stop at worst case at eol. |
160 | | * |
161 | | * Note that we may feed parse_timestamp() extra characters here if the |
162 | | * commit is malformed, and it will parse as far as it can. For |
163 | | * example, "123foo456" would return "123". That might be questionable |
164 | | * (versus returning "0"), but it would help in a hypothetical case |
165 | | * like "123456+0100", where the whitespace from the timezone is |
166 | | * missing. Since such syntactic errors may be baked into history and |
167 | | * hard to correct now, let's err on trying to make our best guess |
168 | | * here, rather than insist on perfect syntax. |
169 | | */ |
170 | 0 | return parse_timestamp(dateptr, NULL, 10); |
171 | 0 | } |
172 | | |
173 | | static const struct object_id *commit_graft_oid_access(size_t index, const void *table) |
174 | 0 | { |
175 | 0 | const struct commit_graft * const *commit_graft_table = table; |
176 | 0 | return &commit_graft_table[index]->oid; |
177 | 0 | } |
178 | | |
179 | | int commit_graft_pos(struct repository *r, const struct object_id *oid) |
180 | 0 | { |
181 | 0 | return oid_pos(oid, r->parsed_objects->grafts, |
182 | 0 | r->parsed_objects->grafts_nr, |
183 | 0 | commit_graft_oid_access); |
184 | 0 | } |
185 | | |
186 | | static void unparse_commit(struct repository *r, const struct object_id *oid) |
187 | 0 | { |
188 | 0 | struct commit *c = lookup_commit(r, oid); |
189 | |
|
190 | 0 | if (!c->object.parsed) |
191 | 0 | return; |
192 | 0 | free_commit_list(c->parents); |
193 | 0 | c->parents = NULL; |
194 | 0 | c->object.parsed = 0; |
195 | 0 | } |
196 | | |
197 | | int register_commit_graft(struct repository *r, struct commit_graft *graft, |
198 | | int ignore_dups) |
199 | 0 | { |
200 | 0 | int pos = commit_graft_pos(r, &graft->oid); |
201 | |
|
202 | 0 | if (0 <= pos) { |
203 | 0 | if (ignore_dups) |
204 | 0 | free(graft); |
205 | 0 | else { |
206 | 0 | free(r->parsed_objects->grafts[pos]); |
207 | 0 | r->parsed_objects->grafts[pos] = graft; |
208 | 0 | } |
209 | 0 | return 1; |
210 | 0 | } |
211 | 0 | pos = -pos - 1; |
212 | 0 | ALLOC_GROW(r->parsed_objects->grafts, |
213 | 0 | r->parsed_objects->grafts_nr + 1, |
214 | 0 | r->parsed_objects->grafts_alloc); |
215 | 0 | r->parsed_objects->grafts_nr++; |
216 | 0 | if (pos < r->parsed_objects->grafts_nr) |
217 | 0 | memmove(r->parsed_objects->grafts + pos + 1, |
218 | 0 | r->parsed_objects->grafts + pos, |
219 | 0 | (r->parsed_objects->grafts_nr - pos - 1) * |
220 | 0 | sizeof(*r->parsed_objects->grafts)); |
221 | 0 | r->parsed_objects->grafts[pos] = graft; |
222 | 0 | unparse_commit(r, &graft->oid); |
223 | 0 | return 0; |
224 | 0 | } |
225 | | |
226 | | struct commit_graft *read_graft_line(struct strbuf *line) |
227 | 0 | { |
228 | | /* The format is just "Commit Parent1 Parent2 ...\n" */ |
229 | 0 | int i, phase; |
230 | 0 | const char *tail = NULL; |
231 | 0 | struct commit_graft *graft = NULL; |
232 | 0 | struct object_id dummy_oid, *oid; |
233 | |
|
234 | 0 | strbuf_rtrim(line); |
235 | 0 | if (!line->len || line->buf[0] == '#') |
236 | 0 | return NULL; |
237 | | /* |
238 | | * phase 0 verifies line, counts hashes in line and allocates graft |
239 | | * phase 1 fills graft |
240 | | */ |
241 | 0 | for (phase = 0; phase < 2; phase++) { |
242 | 0 | oid = graft ? &graft->oid : &dummy_oid; |
243 | 0 | if (parse_oid_hex(line->buf, oid, &tail)) |
244 | 0 | goto bad_graft_data; |
245 | 0 | for (i = 0; *tail != '\0'; i++) { |
246 | 0 | oid = graft ? &graft->parent[i] : &dummy_oid; |
247 | 0 | if (!isspace(*tail++) || parse_oid_hex(tail, oid, &tail)) |
248 | 0 | goto bad_graft_data; |
249 | 0 | } |
250 | 0 | if (!graft) { |
251 | 0 | graft = xmalloc(st_add(sizeof(*graft), |
252 | 0 | st_mult(sizeof(struct object_id), i))); |
253 | 0 | graft->nr_parent = i; |
254 | 0 | } |
255 | 0 | } |
256 | 0 | return graft; |
257 | | |
258 | 0 | bad_graft_data: |
259 | 0 | error("bad graft data: %s", line->buf); |
260 | 0 | assert(!graft); |
261 | 0 | return NULL; |
262 | 0 | } |
263 | | |
264 | | static int read_graft_file(struct repository *r, const char *graft_file) |
265 | 0 | { |
266 | 0 | FILE *fp = fopen_or_warn(graft_file, "r"); |
267 | 0 | struct strbuf buf = STRBUF_INIT; |
268 | 0 | if (!fp) |
269 | 0 | return -1; |
270 | 0 | if (!no_graft_file_deprecated_advice && |
271 | 0 | advice_enabled(ADVICE_GRAFT_FILE_DEPRECATED)) |
272 | 0 | advise(_("Support for <GIT_DIR>/info/grafts is deprecated\n" |
273 | 0 | "and will be removed in a future Git version.\n" |
274 | 0 | "\n" |
275 | 0 | "Please use \"git replace --convert-graft-file\"\n" |
276 | 0 | "to convert the grafts into replace refs.\n" |
277 | 0 | "\n" |
278 | 0 | "Turn this message off by running\n" |
279 | 0 | "\"git config advice.graftFileDeprecated false\"")); |
280 | 0 | while (!strbuf_getwholeline(&buf, fp, '\n')) { |
281 | | /* The format is just "Commit Parent1 Parent2 ...\n" */ |
282 | 0 | struct commit_graft *graft = read_graft_line(&buf); |
283 | 0 | if (!graft) |
284 | 0 | continue; |
285 | 0 | if (register_commit_graft(r, graft, 1)) |
286 | 0 | error("duplicate graft data: %s", buf.buf); |
287 | 0 | } |
288 | 0 | fclose(fp); |
289 | 0 | strbuf_release(&buf); |
290 | 0 | return 0; |
291 | 0 | } |
292 | | |
293 | | void prepare_commit_graft(struct repository *r) |
294 | 0 | { |
295 | 0 | char *graft_file; |
296 | |
|
297 | 0 | if (r->parsed_objects->commit_graft_prepared) |
298 | 0 | return; |
299 | 0 | if (!startup_info->have_repository) |
300 | 0 | return; |
301 | | |
302 | 0 | graft_file = get_graft_file(r); |
303 | 0 | read_graft_file(r, graft_file); |
304 | | /* make sure shallows are read */ |
305 | 0 | is_repository_shallow(r); |
306 | 0 | r->parsed_objects->commit_graft_prepared = 1; |
307 | 0 | } |
308 | | |
309 | | struct commit_graft *lookup_commit_graft(struct repository *r, const struct object_id *oid) |
310 | 0 | { |
311 | 0 | int pos; |
312 | 0 | prepare_commit_graft(r); |
313 | 0 | pos = commit_graft_pos(r, oid); |
314 | 0 | if (pos < 0) |
315 | 0 | return NULL; |
316 | 0 | return r->parsed_objects->grafts[pos]; |
317 | 0 | } |
318 | | |
319 | | int for_each_commit_graft(each_commit_graft_fn fn, void *cb_data) |
320 | 0 | { |
321 | 0 | int i, ret; |
322 | 0 | for (i = ret = 0; i < the_repository->parsed_objects->grafts_nr && !ret; i++) |
323 | 0 | ret = fn(the_repository->parsed_objects->grafts[i], cb_data); |
324 | 0 | return ret; |
325 | 0 | } |
326 | | |
327 | | void reset_commit_grafts(struct repository *r) |
328 | 0 | { |
329 | 0 | int i; |
330 | |
|
331 | 0 | for (i = 0; i < r->parsed_objects->grafts_nr; i++) { |
332 | 0 | unparse_commit(r, &r->parsed_objects->grafts[i]->oid); |
333 | 0 | free(r->parsed_objects->grafts[i]); |
334 | 0 | } |
335 | 0 | r->parsed_objects->grafts_nr = 0; |
336 | 0 | r->parsed_objects->commit_graft_prepared = 0; |
337 | 0 | } |
338 | | |
339 | | struct commit_buffer { /* per-commit entry of the buffer slab, filled by set_commit_buffer() */ |
340 | | void *buffer; /* cached data; released and NULLed by free_commit_buffer() */ |
341 | | unsigned long size; /* size recorded together with buffer */ |
342 | | }; |
343 | | define_commit_slab(buffer_slab, struct commit_buffer); |
344 | | |
345 | | struct buffer_slab *allocate_commit_buffer_slab(void) |
346 | 0 | { |
347 | 0 | struct buffer_slab *bs = xmalloc(sizeof(*bs)); |
348 | 0 | init_buffer_slab(bs); |
349 | 0 | return bs; |
350 | 0 | } |
351 | | |
/* Clear the slab with clear_buffer_slab() and free the slab itself. */
void free_commit_buffer_slab(struct buffer_slab *bs)
{
	struct buffer_slab *slab = bs;

	clear_buffer_slab(slab);
	free(slab);
}
357 | | |
358 | | void set_commit_buffer(struct repository *r, struct commit *commit, void *buffer, unsigned long size) |
359 | 0 | { |
360 | 0 | struct commit_buffer *v = buffer_slab_at( |
361 | 0 | r->parsed_objects->buffer_slab, commit); |
362 | 0 | v->buffer = buffer; |
363 | 0 | v->size = size; |
364 | 0 | } |
365 | | |
366 | | const void *get_cached_commit_buffer(struct repository *r, const struct commit *commit, unsigned long *sizep) |
367 | 0 | { |
368 | 0 | struct commit_buffer *v = buffer_slab_peek( |
369 | 0 | r->parsed_objects->buffer_slab, commit); |
370 | 0 | if (!v) { |
371 | 0 | if (sizep) |
372 | 0 | *sizep = 0; |
373 | 0 | return NULL; |
374 | 0 | } |
375 | 0 | if (sizep) |
376 | 0 | *sizep = v->size; |
377 | 0 | return v->buffer; |
378 | 0 | } |
379 | | |
380 | | const void *repo_get_commit_buffer(struct repository *r, |
381 | | const struct commit *commit, |
382 | | unsigned long *sizep) |
383 | 0 | { |
384 | 0 | const void *ret = get_cached_commit_buffer(r, commit, sizep); |
385 | 0 | if (!ret) { |
386 | 0 | enum object_type type; |
387 | 0 | unsigned long size; |
388 | 0 | ret = repo_read_object_file(r, &commit->object.oid, &type, &size); |
389 | 0 | if (!ret) |
390 | 0 | die("cannot read commit object %s", |
391 | 0 | oid_to_hex(&commit->object.oid)); |
392 | 0 | if (type != OBJ_COMMIT) |
393 | 0 | die("expected commit for %s, got %s", |
394 | 0 | oid_to_hex(&commit->object.oid), type_name(type)); |
395 | 0 | if (sizep) |
396 | 0 | *sizep = size; |
397 | 0 | } |
398 | 0 | return ret; |
399 | 0 | } |
400 | | |
401 | | void repo_unuse_commit_buffer(struct repository *r, |
402 | | const struct commit *commit, |
403 | | const void *buffer) |
404 | 0 | { |
405 | 0 | struct commit_buffer *v = buffer_slab_peek( |
406 | 0 | r->parsed_objects->buffer_slab, commit); |
407 | 0 | if (!(v && v->buffer == buffer)) |
408 | 0 | free((void *)buffer); |
409 | 0 | } |
410 | | |
411 | | void free_commit_buffer(struct parsed_object_pool *pool, struct commit *commit) |
412 | 0 | { |
413 | 0 | struct commit_buffer *v = buffer_slab_peek( |
414 | 0 | pool->buffer_slab, commit); |
415 | 0 | if (v) { |
416 | 0 | FREE_AND_NULL(v->buffer); |
417 | 0 | v->size = 0; |
418 | 0 | } |
419 | 0 | } |
420 | | |
421 | | static inline void set_commit_tree(struct commit *c, struct tree *t) |
422 | 0 | { |
423 | 0 | c->maybe_tree = t; |
424 | 0 | } |
425 | | |
426 | | struct tree *repo_get_commit_tree(struct repository *r, |
427 | | const struct commit *commit) |
428 | 0 | { |
429 | 0 | if (commit->maybe_tree || !commit->object.parsed) |
430 | 0 | return commit->maybe_tree; |
431 | | |
432 | 0 | if (commit_graph_position(commit) != COMMIT_NOT_FROM_GRAPH) |
433 | 0 | return get_commit_tree_in_graph(r, commit); |
434 | | |
435 | 0 | return NULL; |
436 | 0 | } |
437 | | |
438 | | struct object_id *get_commit_tree_oid(const struct commit *commit) |
439 | 0 | { |
440 | 0 | struct tree *tree = repo_get_commit_tree(the_repository, commit); |
441 | 0 | return tree ? &tree->object.oid : NULL; |
442 | 0 | } |
443 | | |
444 | | void release_commit_memory(struct parsed_object_pool *pool, struct commit *c) |
445 | 0 | { |
446 | 0 | set_commit_tree(c, NULL); |
447 | 0 | free_commit_buffer(pool, c); |
448 | 0 | c->index = 0; |
449 | 0 | free_commit_list(c->parents); |
450 | |
|
451 | 0 | c->object.parsed = 0; |
452 | 0 | } |
453 | | |
454 | | const void *detach_commit_buffer(struct commit *commit, unsigned long *sizep) |
455 | 0 | { |
456 | 0 | struct commit_buffer *v = buffer_slab_peek( |
457 | 0 | the_repository->parsed_objects->buffer_slab, commit); |
458 | 0 | void *ret; |
459 | |
|
460 | 0 | if (!v) { |
461 | 0 | if (sizep) |
462 | 0 | *sizep = 0; |
463 | 0 | return NULL; |
464 | 0 | } |
465 | 0 | ret = v->buffer; |
466 | 0 | if (sizep) |
467 | 0 | *sizep = v->size; |
468 | |
|
469 | 0 | v->buffer = NULL; |
470 | 0 | v->size = 0; |
471 | 0 | return ret; |
472 | 0 | } |
473 | | |
474 | | int parse_commit_buffer(struct repository *r, struct commit *item, const void *buffer, unsigned long size, int check_graph) |
475 | 0 | { |
476 | 0 | const char *tail = buffer; |
477 | 0 | const char *bufptr = buffer; |
478 | 0 | struct object_id parent; |
479 | 0 | struct commit_list **pptr; |
480 | 0 | struct commit_graft *graft; |
481 | 0 | const int tree_entry_len = the_hash_algo->hexsz + 5; |
482 | 0 | const int parent_entry_len = the_hash_algo->hexsz + 7; |
483 | 0 | struct tree *tree; |
484 | |
|
485 | 0 | if (item->object.parsed) |
486 | 0 | return 0; |
487 | | /* |
488 | | * Presumably this is leftover from an earlier failed parse; |
489 | | * clear it out in preparation for us re-parsing (we'll hit the |
490 | | * same error, but that's good, since it lets our caller know |
491 | | * the result cannot be trusted. |
492 | | */ |
493 | 0 | free_commit_list(item->parents); |
494 | 0 | item->parents = NULL; |
495 | |
|
496 | 0 | tail += size; |
497 | 0 | if (tail <= bufptr + tree_entry_len + 1 || memcmp(bufptr, "tree ", 5) || |
498 | 0 | bufptr[tree_entry_len] != '\n') |
499 | 0 | return error("bogus commit object %s", oid_to_hex(&item->object.oid)); |
500 | 0 | if (get_oid_hex(bufptr + 5, &parent) < 0) |
501 | 0 | return error("bad tree pointer in commit %s", |
502 | 0 | oid_to_hex(&item->object.oid)); |
503 | 0 | tree = lookup_tree(r, &parent); |
504 | 0 | if (!tree) |
505 | 0 | return error("bad tree pointer %s in commit %s", |
506 | 0 | oid_to_hex(&parent), |
507 | 0 | oid_to_hex(&item->object.oid)); |
508 | 0 | set_commit_tree(item, tree); |
509 | 0 | bufptr += tree_entry_len + 1; /* "tree " + "hex sha1" + "\n" */ |
510 | 0 | pptr = &item->parents; |
511 | |
|
512 | 0 | graft = lookup_commit_graft(r, &item->object.oid); |
513 | 0 | if (graft) |
514 | 0 | r->parsed_objects->substituted_parent = 1; |
515 | 0 | while (bufptr + parent_entry_len < tail && !memcmp(bufptr, "parent ", 7)) { |
516 | 0 | struct commit *new_parent; |
517 | |
|
518 | 0 | if (tail <= bufptr + parent_entry_len + 1 || |
519 | 0 | get_oid_hex(bufptr + 7, &parent) || |
520 | 0 | bufptr[parent_entry_len] != '\n') |
521 | 0 | return error("bad parents in commit %s", oid_to_hex(&item->object.oid)); |
522 | 0 | bufptr += parent_entry_len + 1; |
523 | | /* |
524 | | * The clone is shallow if nr_parent < 0, and we must |
525 | | * not traverse its real parents even when we unhide them. |
526 | | */ |
527 | 0 | if (graft && (graft->nr_parent < 0 || !grafts_keep_true_parents)) |
528 | 0 | continue; |
529 | 0 | new_parent = lookup_commit(r, &parent); |
530 | 0 | if (!new_parent) |
531 | 0 | return error("bad parent %s in commit %s", |
532 | 0 | oid_to_hex(&parent), |
533 | 0 | oid_to_hex(&item->object.oid)); |
534 | 0 | pptr = &commit_list_insert(new_parent, pptr)->next; |
535 | 0 | } |
536 | 0 | if (graft) { |
537 | 0 | int i; |
538 | 0 | struct commit *new_parent; |
539 | 0 | for (i = 0; i < graft->nr_parent; i++) { |
540 | 0 | new_parent = lookup_commit(r, |
541 | 0 | &graft->parent[i]); |
542 | 0 | if (!new_parent) |
543 | 0 | return error("bad graft parent %s in commit %s", |
544 | 0 | oid_to_hex(&graft->parent[i]), |
545 | 0 | oid_to_hex(&item->object.oid)); |
546 | 0 | pptr = &commit_list_insert(new_parent, pptr)->next; |
547 | 0 | } |
548 | 0 | } |
549 | 0 | item->date = parse_commit_date(bufptr, tail); |
550 | |
|
551 | 0 | if (check_graph) |
552 | 0 | load_commit_graph_info(r, item); |
553 | |
|
554 | 0 | item->object.parsed = 1; |
555 | 0 | return 0; |
556 | 0 | } |
557 | | |
558 | | int repo_parse_commit_internal(struct repository *r, |
559 | | struct commit *item, |
560 | | int quiet_on_missing, |
561 | | int use_commit_graph) |
562 | 0 | { |
563 | 0 | enum object_type type; |
564 | 0 | void *buffer; |
565 | 0 | unsigned long size; |
566 | 0 | struct object_info oi = { |
567 | 0 | .typep = &type, |
568 | 0 | .sizep = &size, |
569 | 0 | .contentp = &buffer, |
570 | 0 | }; |
571 | | /* |
572 | | * Git does not support partial clones that exclude commits, so set |
573 | | * OBJECT_INFO_SKIP_FETCH_OBJECT to fail fast when an object is missing. |
574 | | */ |
575 | 0 | int flags = OBJECT_INFO_LOOKUP_REPLACE | OBJECT_INFO_SKIP_FETCH_OBJECT | |
576 | 0 | OBJECT_INFO_DIE_IF_CORRUPT; |
577 | 0 | int ret; |
578 | |
|
579 | 0 | if (!item) |
580 | 0 | return -1; |
581 | 0 | if (item->object.parsed) |
582 | 0 | return 0; |
583 | 0 | if (use_commit_graph && parse_commit_in_graph(r, item)) { |
584 | 0 | static int commit_graph_paranoia = -1; |
585 | |
|
586 | 0 | if (commit_graph_paranoia == -1) |
587 | 0 | commit_graph_paranoia = git_env_bool(GIT_COMMIT_GRAPH_PARANOIA, 0); |
588 | |
|
589 | 0 | if (commit_graph_paranoia && !has_object(r, &item->object.oid, 0)) { |
590 | 0 | unparse_commit(r, &item->object.oid); |
591 | 0 | return quiet_on_missing ? -1 : |
592 | 0 | error(_("commit %s exists in commit-graph but not in the object database"), |
593 | 0 | oid_to_hex(&item->object.oid)); |
594 | 0 | } |
595 | | |
596 | 0 | return 0; |
597 | 0 | } |
598 | | |
599 | 0 | if (oid_object_info_extended(r, &item->object.oid, &oi, flags) < 0) |
600 | 0 | return quiet_on_missing ? -1 : |
601 | 0 | error("Could not read %s", |
602 | 0 | oid_to_hex(&item->object.oid)); |
603 | 0 | if (type != OBJ_COMMIT) { |
604 | 0 | free(buffer); |
605 | 0 | return error("Object %s not a commit", |
606 | 0 | oid_to_hex(&item->object.oid)); |
607 | 0 | } |
608 | | |
609 | 0 | ret = parse_commit_buffer(r, item, buffer, size, 0); |
610 | 0 | if (save_commit_buffer && !ret) { |
611 | 0 | set_commit_buffer(r, item, buffer, size); |
612 | 0 | return 0; |
613 | 0 | } |
614 | 0 | free(buffer); |
615 | 0 | return ret; |
616 | 0 | } |
617 | | |
/* repo_parse_commit_internal() with use of the commit-graph enabled. */
int repo_parse_commit_gently(struct repository *r,
			     struct commit *item, int quiet_on_missing)
{
	const int use_commit_graph = 1;

	return repo_parse_commit_internal(r, item, quiet_on_missing,
					  use_commit_graph);
}
623 | | |
624 | | void parse_commit_or_die(struct commit *item) |
625 | 0 | { |
626 | 0 | if (repo_parse_commit(the_repository, item)) |
627 | 0 | die("unable to parse commit %s", |
628 | 0 | item ? oid_to_hex(&item->object.oid) : "(null)"); |
629 | 0 | } |
630 | | |
/*
 * Locate the first line that follows the first empty line (two
 * consecutive newlines) in commit_buffer, skipping further blank lines.
 * *subject is set to the start of that line and its length, excluding
 * the newline, is returned.  Without an empty line in the buffer,
 * *subject points at the terminating NUL and 0 is returned.
 */
int find_commit_subject(const char *commit_buffer, const char **subject)
{
	const char *start = commit_buffer;
	const char *end;

	for (; *start; start++) {
		if (start[0] == '\n' && start[1] == '\n')
			break;
	}

	if (!*start) {
		end = start;
	} else {
		start = skip_blank_lines(start + 2);
		end = strchrnul(start, '\n');
	}

	*subject = start;

	return end - start;
}
648 | | |
/*
 * Return the number of bytes at the start of body that precede the first
 * position at which skip_blank_lines() skips something, walking one line
 * at a time; the whole length if that never happens.
 */
size_t commit_subject_length(const char *body)
{
	const char *pos;

	for (pos = body; *pos; ) {
		if (skip_blank_lines(pos) != pos)
			break;
		/* Advance to the start of the next line, if there is one. */
		pos = strchrnul(pos, '\n');
		if (*pos)
			pos++;
	}
	return pos - body;
}
662 | | |
663 | | struct commit_list *commit_list_insert(struct commit *item, struct commit_list **list_p) |
664 | 0 | { |
665 | 0 | struct commit_list *new_list = xmalloc(sizeof(struct commit_list)); |
666 | 0 | new_list->item = item; |
667 | 0 | new_list->next = *list_p; |
668 | 0 | *list_p = new_list; |
669 | 0 | return new_list; |
670 | 0 | } |
671 | | |
672 | | int commit_list_contains(struct commit *item, struct commit_list *list) |
673 | 0 | { |
674 | 0 | while (list) { |
675 | 0 | if (list->item == item) |
676 | 0 | return 1; |
677 | 0 | list = list->next; |
678 | 0 | } |
679 | | |
680 | 0 | return 0; |
681 | 0 | } |
682 | | |
683 | | unsigned commit_list_count(const struct commit_list *l) |
684 | 0 | { |
685 | 0 | unsigned c = 0; |
686 | 0 | for (; l; l = l->next ) |
687 | 0 | c++; |
688 | 0 | return c; |
689 | 0 | } |
690 | | |
691 | | struct commit_list *copy_commit_list(const struct commit_list *list) |
692 | 0 | { |
693 | 0 | struct commit_list *head = NULL; |
694 | 0 | struct commit_list **pp = &head; |
695 | 0 | while (list) { |
696 | 0 | pp = commit_list_append(list->item, pp); |
697 | 0 | list = list->next; |
698 | 0 | } |
699 | 0 | return head; |
700 | 0 | } |
701 | | |
702 | | struct commit_list *reverse_commit_list(struct commit_list *list) |
703 | 0 | { |
704 | 0 | struct commit_list *next = NULL, *current, *backup; |
705 | 0 | for (current = list; current; current = backup) { |
706 | 0 | backup = current->next; |
707 | 0 | current->next = next; |
708 | 0 | next = current; |
709 | 0 | } |
710 | 0 | return next; |
711 | 0 | } |
712 | | |
/* Free every node of list; the commits themselves are left untouched. */
void free_commit_list(struct commit_list *list)
{
	struct commit_list *rest = list;

	while (rest)
		pop_commit(&rest);
}
718 | | |
719 | | struct commit_list * commit_list_insert_by_date(struct commit *item, struct commit_list **list) |
720 | 0 | { |
721 | 0 | struct commit_list **pp = list; |
722 | 0 | struct commit_list *p; |
723 | 0 | while ((p = *pp) != NULL) { |
724 | 0 | if (p->item->date < item->date) { |
725 | 0 | break; |
726 | 0 | } |
727 | 0 | pp = &p->next; |
728 | 0 | } |
729 | 0 | return commit_list_insert(item, pp); |
730 | 0 | } |
731 | | |
732 | | static int commit_list_compare_by_date(const struct commit_list *a, |
733 | | const struct commit_list *b) |
734 | 0 | { |
735 | 0 | timestamp_t a_date = a->item->date; |
736 | 0 | timestamp_t b_date = b->item->date; |
737 | 0 | if (a_date < b_date) |
738 | 0 | return 1; |
739 | 0 | if (a_date > b_date) |
740 | 0 | return -1; |
741 | 0 | return 0; |
742 | 0 | } |
743 | | |
744 | | DEFINE_LIST_SORT(static, commit_list_sort, struct commit_list, next); |
745 | | |
746 | | void commit_list_sort_by_date(struct commit_list **list) |
747 | 0 | { |
748 | 0 | commit_list_sort(list, commit_list_compare_by_date); |
749 | 0 | } |
750 | | |
751 | | struct commit *pop_most_recent_commit(struct commit_list **list, |
752 | | unsigned int mark) |
753 | 0 | { |
754 | 0 | struct commit *ret = pop_commit(list); |
755 | 0 | struct commit_list *parents = ret->parents; |
756 | |
|
757 | 0 | while (parents) { |
758 | 0 | struct commit *commit = parents->item; |
759 | 0 | if (!repo_parse_commit(the_repository, commit) && !(commit->object.flags & mark)) { |
760 | 0 | commit->object.flags |= mark; |
761 | 0 | commit_list_insert_by_date(commit, list); |
762 | 0 | } |
763 | 0 | parents = parents->next; |
764 | 0 | } |
765 | 0 | return ret; |
766 | 0 | } |
767 | | |
768 | | static void clear_commit_marks_1(struct commit_list **plist, |
769 | | struct commit *commit, unsigned int mark) |
770 | 0 | { |
771 | 0 | while (commit) { |
772 | 0 | struct commit_list *parents; |
773 | |
|
774 | 0 | if (!(mark & commit->object.flags)) |
775 | 0 | return; |
776 | | |
777 | 0 | commit->object.flags &= ~mark; |
778 | |
|
779 | 0 | parents = commit->parents; |
780 | 0 | if (!parents) |
781 | 0 | return; |
782 | | |
783 | 0 | while ((parents = parents->next)) { |
784 | 0 | if (parents->item->object.flags & mark) |
785 | 0 | commit_list_insert(parents->item, plist); |
786 | 0 | } |
787 | |
|
788 | 0 | commit = commit->parents->item; |
789 | 0 | } |
790 | 0 | } |
791 | | |
/*
 * Clear mark from the nr commits in the array commit and from what
 * clear_commit_marks_1() reaches from them, using an explicit list of
 * pending commits instead of recursion.
 */
void clear_commit_marks_many(int nr, struct commit **commit, unsigned int mark)
{
	struct commit_list *pending = NULL;
	struct commit **cur = commit;

	while (nr--)
		clear_commit_marks_1(&pending, *cur++, mark);

	while (pending) {
		struct commit *next = pop_commit(&pending);

		clear_commit_marks_1(&pending, next, mark);
	}
}
803 | | |
/* Single-commit convenience wrapper around clear_commit_marks_many(). */
void clear_commit_marks(struct commit *commit, unsigned int mark)
{
	struct commit *start = commit;

	clear_commit_marks_many(1, &start, mark);
}
808 | | |
809 | | struct commit *pop_commit(struct commit_list **stack) |
810 | 0 | { |
811 | 0 | struct commit_list *top = *stack; |
812 | 0 | struct commit *item = top ? top->item : NULL; |
813 | |
|
814 | 0 | if (top) { |
815 | 0 | *stack = top->next; |
816 | 0 | free(top); |
817 | 0 | } |
818 | 0 | return item; |
819 | 0 | } |
820 | | |
821 | | /* |
822 | | * Topological sort support |
823 | | */ |
824 | | |
825 | | /* count number of children that have not been emitted */ |
826 | | define_commit_slab(indegree_slab, int); |
827 | | |
828 | | define_commit_slab(author_date_slab, timestamp_t); /* per-commit author timestamp, written by record_author_date() */ |
829 | | |
830 | | void record_author_date(struct author_date_slab *author_date, |
831 | | struct commit *commit) |
832 | 0 | { |
833 | 0 | const char *buffer = repo_get_commit_buffer(the_repository, commit, |
834 | 0 | NULL); |
835 | 0 | struct ident_split ident; |
836 | 0 | const char *ident_line; |
837 | 0 | size_t ident_len; |
838 | 0 | char *date_end; |
839 | 0 | timestamp_t date; |
840 | |
|
841 | 0 | ident_line = find_commit_header(buffer, "author", &ident_len); |
842 | 0 | if (!ident_line) |
843 | 0 | goto fail_exit; /* no author line */ |
844 | 0 | if (split_ident_line(&ident, ident_line, ident_len) || |
845 | 0 | !ident.date_begin || !ident.date_end) |
846 | 0 | goto fail_exit; /* malformed "author" line */ |
847 | | |
848 | 0 | date = parse_timestamp(ident.date_begin, &date_end, 10); |
849 | 0 | if (date_end != ident.date_end) |
850 | 0 | goto fail_exit; /* malformed date */ |
851 | 0 | *(author_date_slab_at(author_date, commit)) = date; |
852 | |
|
853 | 0 | fail_exit: |
854 | 0 | repo_unuse_commit_buffer(the_repository, commit, buffer); |
855 | 0 | } |
856 | | |
857 | | int compare_commits_by_author_date(const void *a_, const void *b_, |
858 | | void *cb_data) |
859 | 0 | { |
860 | 0 | const struct commit *a = a_, *b = b_; |
861 | 0 | struct author_date_slab *author_date = cb_data; |
862 | 0 | timestamp_t a_date = *(author_date_slab_at(author_date, a)); |
863 | 0 | timestamp_t b_date = *(author_date_slab_at(author_date, b)); |
864 | | |
865 | | /* newer commits with larger date first */ |
866 | 0 | if (a_date < b_date) |
867 | 0 | return 1; |
868 | 0 | else if (a_date > b_date) |
869 | 0 | return -1; |
870 | 0 | return 0; |
871 | 0 | } |
872 | | |
873 | | int compare_commits_by_gen_then_commit_date(const void *a_, const void *b_, |
874 | | void *unused UNUSED) |
875 | 0 | { |
876 | 0 | const struct commit *a = a_, *b = b_; |
877 | 0 | const timestamp_t generation_a = commit_graph_generation(a), |
878 | 0 | generation_b = commit_graph_generation(b); |
879 | | |
880 | | /* newer commits first */ |
881 | 0 | if (generation_a < generation_b) |
882 | 0 | return 1; |
883 | 0 | else if (generation_a > generation_b) |
884 | 0 | return -1; |
885 | | |
886 | | /* use date as a heuristic when generations are equal */ |
887 | 0 | if (a->date < b->date) |
888 | 0 | return 1; |
889 | 0 | else if (a->date > b->date) |
890 | 0 | return -1; |
891 | 0 | return 0; |
892 | 0 | } |
893 | | |
894 | | int compare_commits_by_commit_date(const void *a_, const void *b_, |
895 | | void *unused UNUSED) |
896 | 0 | { |
897 | 0 | const struct commit *a = a_, *b = b_; |
898 | | /* newer commits with larger date first */ |
899 | 0 | if (a->date < b->date) |
900 | 0 | return 1; |
901 | 0 | else if (a->date > b->date) |
902 | 0 | return -1; |
903 | 0 | return 0; |
904 | 0 | } |
905 | | |
906 | | /* |
907 | | * Performs an in-place topological sort on the list supplied. |
908 | | */ |
909 | | void sort_in_topological_order(struct commit_list **list, enum rev_sort_order sort_order) |
910 | 0 | { |
911 | 0 | struct commit_list *next, *orig = *list; |
912 | 0 | struct commit_list **pptr; |
913 | 0 | struct indegree_slab indegree; |
914 | 0 | struct prio_queue queue; |
915 | 0 | struct commit *commit; |
916 | 0 | struct author_date_slab author_date; |
917 | |
|
918 | 0 | if (!orig) |
919 | 0 | return; |
920 | 0 | *list = NULL; |
921 | |
|
922 | 0 | init_indegree_slab(&indegree); |
923 | 0 | memset(&queue, '\0', sizeof(queue)); |
924 | |
|
925 | 0 | switch (sort_order) { |
926 | 0 | default: /* REV_SORT_IN_GRAPH_ORDER */ |
927 | 0 | queue.compare = NULL; |
928 | 0 | break; |
929 | 0 | case REV_SORT_BY_COMMIT_DATE: |
930 | 0 | queue.compare = compare_commits_by_commit_date; |
931 | 0 | break; |
932 | 0 | case REV_SORT_BY_AUTHOR_DATE: |
933 | 0 | init_author_date_slab(&author_date); |
934 | 0 | queue.compare = compare_commits_by_author_date; |
935 | 0 | queue.cb_data = &author_date; |
936 | 0 | break; |
937 | 0 | } |
938 | | |
939 | | /* Mark them and clear the indegree */ |
940 | 0 | for (next = orig; next; next = next->next) { |
941 | 0 | struct commit *commit = next->item; |
942 | 0 | *(indegree_slab_at(&indegree, commit)) = 1; |
943 | | /* also record the author dates, if needed */ |
944 | 0 | if (sort_order == REV_SORT_BY_AUTHOR_DATE) |
945 | 0 | record_author_date(&author_date, commit); |
946 | 0 | } |
947 | | |
948 | | /* update the indegree */ |
949 | 0 | for (next = orig; next; next = next->next) { |
950 | 0 | struct commit_list *parents = next->item->parents; |
951 | 0 | while (parents) { |
952 | 0 | struct commit *parent = parents->item; |
953 | 0 | int *pi = indegree_slab_at(&indegree, parent); |
954 | |
|
955 | 0 | if (*pi) |
956 | 0 | (*pi)++; |
957 | 0 | parents = parents->next; |
958 | 0 | } |
959 | 0 | } |
960 | | |
961 | | /* |
962 | | * find the tips |
963 | | * |
964 | | * tips are nodes not reachable from any other node in the list |
965 | | * |
966 | | * the tips serve as a starting set for the work queue. |
967 | | */ |
968 | 0 | for (next = orig; next; next = next->next) { |
969 | 0 | struct commit *commit = next->item; |
970 | |
|
971 | 0 | if (*(indegree_slab_at(&indegree, commit)) == 1) |
972 | 0 | prio_queue_put(&queue, commit); |
973 | 0 | } |
974 | | |
975 | | /* |
976 | | * This is unfortunate; the initial tips need to be shown |
977 | | * in the order given from the revision traversal machinery. |
978 | | */ |
979 | 0 | if (sort_order == REV_SORT_IN_GRAPH_ORDER) |
980 | 0 | prio_queue_reverse(&queue); |
981 | | |
982 | | /* We no longer need the commit list */ |
983 | 0 | free_commit_list(orig); |
984 | |
|
985 | 0 | pptr = list; |
986 | 0 | *list = NULL; |
987 | 0 | while ((commit = prio_queue_get(&queue)) != NULL) { |
988 | 0 | struct commit_list *parents; |
989 | |
|
990 | 0 | for (parents = commit->parents; parents ; parents = parents->next) { |
991 | 0 | struct commit *parent = parents->item; |
992 | 0 | int *pi = indegree_slab_at(&indegree, parent); |
993 | |
|
994 | 0 | if (!*pi) |
995 | 0 | continue; |
996 | | |
997 | | /* |
998 | | * parents are only enqueued for emission |
999 | | * when all their children have been emitted thereby |
1000 | | * guaranteeing topological order. |
1001 | | */ |
1002 | 0 | if (--(*pi) == 1) |
1003 | 0 | prio_queue_put(&queue, parent); |
1004 | 0 | } |
1005 | | /* |
1006 | | * all children of commit have already been |
1007 | | * emitted. we can emit it now. |
1008 | | */ |
1009 | 0 | *(indegree_slab_at(&indegree, commit)) = 0; |
1010 | |
|
1011 | 0 | pptr = &commit_list_insert(commit, pptr)->next; |
1012 | 0 | } |
1013 | |
|
1014 | 0 | clear_indegree_slab(&indegree); |
1015 | 0 | clear_prio_queue(&queue); |
1016 | 0 | if (sort_order == REV_SORT_BY_AUTHOR_DATE) |
1017 | 0 | clear_author_date_slab(&author_date); |
1018 | 0 | } |
1019 | | |
/*
 * Accumulator used while walking a reflog in get_fork_point().
 */
struct rev_collect {
	/* growable array of collected commits (grown with ALLOC_GROW) */
	struct commit **commit;
	/* number of entries used in "commit" */
	int nr;
	/* number of entries allocated for "commit" */
	int alloc;
	/*
	 * set before the walk; while set, the next reflog entry seen also
	 * contributes its old object id, after which the flag is cleared
	 */
	unsigned int initial : 1;
};
1026 | | |
1027 | | static void add_one_commit(struct object_id *oid, struct rev_collect *revs) |
1028 | 0 | { |
1029 | 0 | struct commit *commit; |
1030 | |
|
1031 | 0 | if (is_null_oid(oid)) |
1032 | 0 | return; |
1033 | | |
1034 | 0 | commit = lookup_commit(the_repository, oid); |
1035 | 0 | if (!commit || |
1036 | 0 | (commit->object.flags & TMP_MARK) || |
1037 | 0 | repo_parse_commit(the_repository, commit)) |
1038 | 0 | return; |
1039 | | |
1040 | 0 | ALLOC_GROW(revs->commit, revs->nr + 1, revs->alloc); |
1041 | 0 | revs->commit[revs->nr++] = commit; |
1042 | 0 | commit->object.flags |= TMP_MARK; |
1043 | 0 | } |
1044 | | |
1045 | | static int collect_one_reflog_ent(struct object_id *ooid, struct object_id *noid, |
1046 | | const char *ident UNUSED, |
1047 | | timestamp_t timestamp UNUSED, int tz UNUSED, |
1048 | | const char *message UNUSED, void *cbdata) |
1049 | 0 | { |
1050 | 0 | struct rev_collect *revs = cbdata; |
1051 | |
|
1052 | 0 | if (revs->initial) { |
1053 | 0 | revs->initial = 0; |
1054 | 0 | add_one_commit(ooid, revs); |
1055 | 0 | } |
1056 | 0 | add_one_commit(noid, revs); |
1057 | 0 | return 0; |
1058 | 0 | } |
1059 | | |
1060 | | struct commit *get_fork_point(const char *refname, struct commit *commit) |
1061 | 0 | { |
1062 | 0 | struct object_id oid; |
1063 | 0 | struct rev_collect revs; |
1064 | 0 | struct commit_list *bases = NULL; |
1065 | 0 | int i; |
1066 | 0 | struct commit *ret = NULL; |
1067 | 0 | char *full_refname; |
1068 | |
|
1069 | 0 | switch (repo_dwim_ref(the_repository, refname, strlen(refname), &oid, |
1070 | 0 | &full_refname, 0)) { |
1071 | 0 | case 0: |
1072 | 0 | die("No such ref: '%s'", refname); |
1073 | 0 | case 1: |
1074 | 0 | break; /* good */ |
1075 | 0 | default: |
1076 | 0 | die("Ambiguous refname: '%s'", refname); |
1077 | 0 | } |
1078 | | |
1079 | 0 | memset(&revs, 0, sizeof(revs)); |
1080 | 0 | revs.initial = 1; |
1081 | 0 | refs_for_each_reflog_ent(get_main_ref_store(the_repository), |
1082 | 0 | full_refname, collect_one_reflog_ent, &revs); |
1083 | |
|
1084 | 0 | if (!revs.nr) |
1085 | 0 | add_one_commit(&oid, &revs); |
1086 | |
|
1087 | 0 | for (i = 0; i < revs.nr; i++) |
1088 | 0 | revs.commit[i]->object.flags &= ~TMP_MARK; |
1089 | |
|
1090 | 0 | if (repo_get_merge_bases_many(the_repository, commit, revs.nr, |
1091 | 0 | revs.commit, &bases) < 0) |
1092 | 0 | exit(128); |
1093 | | |
1094 | | /* |
1095 | | * There should be one and only one merge base, when we found |
1096 | | * a common ancestor among reflog entries. |
1097 | | */ |
1098 | 0 | if (!bases || bases->next) |
1099 | 0 | goto cleanup_return; |
1100 | | |
1101 | | /* And the found one must be one of the reflog entries */ |
1102 | 0 | for (i = 0; i < revs.nr; i++) |
1103 | 0 | if (&bases->item->object == &revs.commit[i]->object) |
1104 | 0 | break; /* found */ |
1105 | 0 | if (revs.nr <= i) |
1106 | 0 | goto cleanup_return; |
1107 | | |
1108 | 0 | ret = bases->item; |
1109 | |
|
1110 | 0 | cleanup_return: |
1111 | 0 | free(revs.commit); |
1112 | 0 | free_commit_list(bases); |
1113 | 0 | free(full_refname); |
1114 | 0 | return ret; |
1115 | 0 | } |
1116 | | |
/*
 * Names of the commit header that carries the signature, indexed by
 * hash algorithm identifier (the value of hash_algo_by_ptr()).
 * Slot 0 has no header name.
 */
static const char *gpg_sig_headers[] = {
	NULL,
	"gpgsig",
	"gpgsig-sha256",
};
1125 | | |
1126 | | int add_header_signature(struct strbuf *buf, struct strbuf *sig, const struct git_hash_algo *algo) |
1127 | 0 | { |
1128 | 0 | int inspos, copypos; |
1129 | 0 | const char *eoh; |
1130 | 0 | const char *gpg_sig_header = gpg_sig_headers[hash_algo_by_ptr(algo)]; |
1131 | 0 | int gpg_sig_header_len = strlen(gpg_sig_header); |
1132 | | |
1133 | | /* find the end of the header */ |
1134 | 0 | eoh = strstr(buf->buf, "\n\n"); |
1135 | 0 | if (!eoh) |
1136 | 0 | inspos = buf->len; |
1137 | 0 | else |
1138 | 0 | inspos = eoh - buf->buf + 1; |
1139 | |
|
1140 | 0 | for (copypos = 0; sig->buf[copypos]; ) { |
1141 | 0 | const char *bol = sig->buf + copypos; |
1142 | 0 | const char *eol = strchrnul(bol, '\n'); |
1143 | 0 | int len = (eol - bol) + !!*eol; |
1144 | |
|
1145 | 0 | if (!copypos) { |
1146 | 0 | strbuf_insert(buf, inspos, gpg_sig_header, gpg_sig_header_len); |
1147 | 0 | inspos += gpg_sig_header_len; |
1148 | 0 | } |
1149 | 0 | strbuf_insertstr(buf, inspos++, " "); |
1150 | 0 | strbuf_insert(buf, inspos, bol, len); |
1151 | 0 | inspos += len; |
1152 | 0 | copypos += len; |
1153 | 0 | } |
1154 | 0 | return 0; |
1155 | 0 | } |
1156 | | |
/*
 * Sign "buf" and store the result in "sig".  A NULL or empty "keyid"
 * selects the key returned by get_signing_key().
 *
 * Returns 0 on success and -1 when sign_buffer() reports failure.
 */
static int sign_commit_to_strbuf(struct strbuf *sig, struct strbuf *buf, const char *keyid)
{
	const char *key = (keyid && *keyid) ? keyid : get_signing_key();

	return sign_buffer(buf, sig, key) ? -1 : 0;
}
1165 | | |
1166 | | int parse_signed_commit(const struct commit *commit, |
1167 | | struct strbuf *payload, struct strbuf *signature, |
1168 | | const struct git_hash_algo *algop) |
1169 | 0 | { |
1170 | 0 | unsigned long size; |
1171 | 0 | const char *buffer = repo_get_commit_buffer(the_repository, commit, |
1172 | 0 | &size); |
1173 | 0 | int ret = parse_buffer_signed_by_header(buffer, size, payload, signature, algop); |
1174 | |
|
1175 | 0 | repo_unuse_commit_buffer(the_repository, commit, buffer); |
1176 | 0 | return ret; |
1177 | 0 | } |
1178 | | |
1179 | | int parse_buffer_signed_by_header(const char *buffer, |
1180 | | unsigned long size, |
1181 | | struct strbuf *payload, |
1182 | | struct strbuf *signature, |
1183 | | const struct git_hash_algo *algop) |
1184 | 0 | { |
1185 | 0 | int in_signature = 0, saw_signature = 0, other_signature = 0; |
1186 | 0 | const char *line, *tail, *p; |
1187 | 0 | const char *gpg_sig_header = gpg_sig_headers[hash_algo_by_ptr(algop)]; |
1188 | |
|
1189 | 0 | line = buffer; |
1190 | 0 | tail = buffer + size; |
1191 | 0 | while (line < tail) { |
1192 | 0 | const char *sig = NULL; |
1193 | 0 | const char *next = memchr(line, '\n', tail - line); |
1194 | |
|
1195 | 0 | next = next ? next + 1 : tail; |
1196 | 0 | if (in_signature && line[0] == ' ') |
1197 | 0 | sig = line + 1; |
1198 | 0 | else if (skip_prefix(line, gpg_sig_header, &p) && |
1199 | 0 | *p == ' ') { |
1200 | 0 | sig = line + strlen(gpg_sig_header) + 1; |
1201 | 0 | other_signature = 0; |
1202 | 0 | } |
1203 | 0 | else if (starts_with(line, "gpgsig")) |
1204 | 0 | other_signature = 1; |
1205 | 0 | else if (other_signature && line[0] != ' ') |
1206 | 0 | other_signature = 0; |
1207 | 0 | if (sig) { |
1208 | 0 | strbuf_add(signature, sig, next - sig); |
1209 | 0 | saw_signature = 1; |
1210 | 0 | in_signature = 1; |
1211 | 0 | } else { |
1212 | 0 | if (*line == '\n') |
1213 | | /* dump the whole remainder of the buffer */ |
1214 | 0 | next = tail; |
1215 | 0 | if (!other_signature) |
1216 | 0 | strbuf_add(payload, line, next - line); |
1217 | 0 | in_signature = 0; |
1218 | 0 | } |
1219 | 0 | line = next; |
1220 | 0 | } |
1221 | 0 | return saw_signature; |
1222 | 0 | } |
1223 | | |
1224 | | int remove_signature(struct strbuf *buf) |
1225 | 0 | { |
1226 | 0 | const char *line = buf->buf; |
1227 | 0 | const char *tail = buf->buf + buf->len; |
1228 | 0 | int in_signature = 0; |
1229 | 0 | struct sigbuf { |
1230 | 0 | const char *start; |
1231 | 0 | const char *end; |
1232 | 0 | } sigs[2], *sigp = &sigs[0]; |
1233 | 0 | int i; |
1234 | 0 | const char *orig_buf = buf->buf; |
1235 | |
|
1236 | 0 | memset(sigs, 0, sizeof(sigs)); |
1237 | |
|
1238 | 0 | while (line < tail) { |
1239 | 0 | const char *next = memchr(line, '\n', tail - line); |
1240 | 0 | next = next ? next + 1 : tail; |
1241 | |
|
1242 | 0 | if (in_signature && line[0] == ' ') |
1243 | 0 | sigp->end = next; |
1244 | 0 | else if (starts_with(line, "gpgsig")) { |
1245 | 0 | int i; |
1246 | 0 | for (i = 1; i < GIT_HASH_NALGOS; i++) { |
1247 | 0 | const char *p; |
1248 | 0 | if (skip_prefix(line, gpg_sig_headers[i], &p) && |
1249 | 0 | *p == ' ') { |
1250 | 0 | sigp->start = line; |
1251 | 0 | sigp->end = next; |
1252 | 0 | in_signature = 1; |
1253 | 0 | } |
1254 | 0 | } |
1255 | 0 | } else { |
1256 | 0 | if (*line == '\n') |
1257 | | /* dump the whole remainder of the buffer */ |
1258 | 0 | next = tail; |
1259 | 0 | if (in_signature && sigp - sigs != ARRAY_SIZE(sigs)) |
1260 | 0 | sigp++; |
1261 | 0 | in_signature = 0; |
1262 | 0 | } |
1263 | 0 | line = next; |
1264 | 0 | } |
1265 | |
|
1266 | 0 | for (i = ARRAY_SIZE(sigs) - 1; i >= 0; i--) |
1267 | 0 | if (sigs[i].start) |
1268 | 0 | strbuf_remove(buf, sigs[i].start - orig_buf, sigs[i].end - sigs[i].start); |
1269 | |
|
1270 | 0 | return sigs[0].start != NULL; |
1271 | 0 | } |
1272 | | |
1273 | | static void handle_signed_tag(const struct commit *parent, struct commit_extra_header ***tail) |
1274 | 0 | { |
1275 | 0 | struct merge_remote_desc *desc; |
1276 | 0 | struct commit_extra_header *mergetag; |
1277 | 0 | char *buf; |
1278 | 0 | unsigned long size; |
1279 | 0 | enum object_type type; |
1280 | 0 | struct strbuf payload = STRBUF_INIT; |
1281 | 0 | struct strbuf signature = STRBUF_INIT; |
1282 | |
|
1283 | 0 | desc = merge_remote_util(parent); |
1284 | 0 | if (!desc || !desc->obj) |
1285 | 0 | return; |
1286 | 0 | buf = repo_read_object_file(the_repository, &desc->obj->oid, &type, |
1287 | 0 | &size); |
1288 | 0 | if (!buf || type != OBJ_TAG) |
1289 | 0 | goto free_return; |
1290 | 0 | if (!parse_signature(buf, size, &payload, &signature)) |
1291 | 0 | goto free_return; |
1292 | | /* |
1293 | | * We could verify this signature and either omit the tag when |
1294 | | * it does not validate, but the integrator may not have the |
1295 | | * public key of the signer of the tag being merged, while a |
1296 | | * later auditor may have it while auditing, so let's not run |
1297 | | * verify-signed-buffer here for now... |
1298 | | * |
1299 | | * if (verify_signed_buffer(buf, len, buf + len, size - len, ...)) |
1300 | | * warn("warning: signed tag unverified."); |
1301 | | */ |
1302 | 0 | CALLOC_ARRAY(mergetag, 1); |
1303 | 0 | mergetag->key = xstrdup("mergetag"); |
1304 | 0 | mergetag->value = buf; |
1305 | 0 | mergetag->len = size; |
1306 | |
|
1307 | 0 | **tail = mergetag; |
1308 | 0 | *tail = &mergetag->next; |
1309 | 0 | strbuf_release(&payload); |
1310 | 0 | strbuf_release(&signature); |
1311 | 0 | return; |
1312 | | |
1313 | 0 | free_return: |
1314 | 0 | free(buf); |
1315 | 0 | } |
1316 | | |
1317 | | int check_commit_signature(const struct commit *commit, struct signature_check *sigc) |
1318 | 0 | { |
1319 | 0 | struct strbuf payload = STRBUF_INIT; |
1320 | 0 | struct strbuf signature = STRBUF_INIT; |
1321 | 0 | int ret = 1; |
1322 | |
|
1323 | 0 | sigc->result = 'N'; |
1324 | |
|
1325 | 0 | if (parse_signed_commit(commit, &payload, &signature, the_hash_algo) <= 0) |
1326 | 0 | goto out; |
1327 | | |
1328 | 0 | sigc->payload_type = SIGNATURE_PAYLOAD_COMMIT; |
1329 | 0 | sigc->payload = strbuf_detach(&payload, &sigc->payload_len); |
1330 | 0 | ret = check_signature(sigc, signature.buf, signature.len); |
1331 | |
|
1332 | 0 | out: |
1333 | 0 | strbuf_release(&payload); |
1334 | 0 | strbuf_release(&signature); |
1335 | |
|
1336 | 0 | return ret; |
1337 | 0 | } |
1338 | | |
1339 | | void verify_merge_signature(struct commit *commit, int verbosity, |
1340 | | int check_trust) |
1341 | 0 | { |
1342 | 0 | char hex[GIT_MAX_HEXSZ + 1]; |
1343 | 0 | struct signature_check signature_check; |
1344 | 0 | int ret; |
1345 | 0 | memset(&signature_check, 0, sizeof(signature_check)); |
1346 | |
|
1347 | 0 | ret = check_commit_signature(commit, &signature_check); |
1348 | |
|
1349 | 0 | repo_find_unique_abbrev_r(the_repository, hex, &commit->object.oid, |
1350 | 0 | DEFAULT_ABBREV); |
1351 | 0 | switch (signature_check.result) { |
1352 | 0 | case 'G': |
1353 | 0 | if (ret || (check_trust && signature_check.trust_level < TRUST_MARGINAL)) |
1354 | 0 | die(_("Commit %s has an untrusted GPG signature, " |
1355 | 0 | "allegedly by %s."), hex, signature_check.signer); |
1356 | 0 | break; |
1357 | 0 | case 'B': |
1358 | 0 | die(_("Commit %s has a bad GPG signature " |
1359 | 0 | "allegedly by %s."), hex, signature_check.signer); |
1360 | 0 | default: /* 'N' */ |
1361 | 0 | die(_("Commit %s does not have a GPG signature."), hex); |
1362 | 0 | } |
1363 | 0 | if (verbosity >= 0 && signature_check.result == 'G') |
1364 | 0 | printf(_("Commit %s has a good GPG signature by %s\n"), |
1365 | 0 | hex, signature_check.signer); |
1366 | |
|
1367 | 0 | signature_check_clear(&signature_check); |
1368 | 0 | } |
1369 | | |
1370 | | void append_merge_tag_headers(const struct commit_list *parents, |
1371 | | struct commit_extra_header ***tail) |
1372 | 0 | { |
1373 | 0 | while (parents) { |
1374 | 0 | const struct commit *parent = parents->item; |
1375 | 0 | handle_signed_tag(parent, tail); |
1376 | 0 | parents = parents->next; |
1377 | 0 | } |
1378 | 0 | } |
1379 | | |
1380 | | static int convert_commit_extra_headers(const struct commit_extra_header *orig, |
1381 | | struct commit_extra_header **result) |
1382 | 0 | { |
1383 | 0 | const struct git_hash_algo *compat = the_repository->compat_hash_algo; |
1384 | 0 | const struct git_hash_algo *algo = the_repository->hash_algo; |
1385 | 0 | struct commit_extra_header *extra = NULL, **tail = &extra; |
1386 | 0 | struct strbuf out = STRBUF_INIT; |
1387 | 0 | while (orig) { |
1388 | 0 | struct commit_extra_header *new; |
1389 | 0 | CALLOC_ARRAY(new, 1); |
1390 | 0 | if (!strcmp(orig->key, "mergetag")) { |
1391 | 0 | if (convert_object_file(&out, algo, compat, |
1392 | 0 | orig->value, orig->len, |
1393 | 0 | OBJ_TAG, 1)) { |
1394 | 0 | free(new); |
1395 | 0 | free_commit_extra_headers(extra); |
1396 | 0 | return -1; |
1397 | 0 | } |
1398 | 0 | new->key = xstrdup("mergetag"); |
1399 | 0 | new->value = strbuf_detach(&out, &new->len); |
1400 | 0 | } else { |
1401 | 0 | new->key = xstrdup(orig->key); |
1402 | 0 | new->len = orig->len; |
1403 | 0 | new->value = xmemdupz(orig->value, orig->len); |
1404 | 0 | } |
1405 | 0 | *tail = new; |
1406 | 0 | tail = &new->next; |
1407 | 0 | orig = orig->next; |
1408 | 0 | } |
1409 | 0 | *result = extra; |
1410 | 0 | return 0; |
1411 | 0 | } |
1412 | | |
1413 | | static void add_extra_header(struct strbuf *buffer, |
1414 | | const struct commit_extra_header *extra) |
1415 | 0 | { |
1416 | 0 | strbuf_addstr(buffer, extra->key); |
1417 | 0 | if (extra->len) |
1418 | 0 | strbuf_add_lines(buffer, " ", extra->value, extra->len); |
1419 | 0 | else |
1420 | 0 | strbuf_addch(buffer, '\n'); |
1421 | 0 | } |
1422 | | |
1423 | | struct commit_extra_header *read_commit_extra_headers(struct commit *commit, |
1424 | | const char **exclude) |
1425 | 0 | { |
1426 | 0 | struct commit_extra_header *extra = NULL; |
1427 | 0 | unsigned long size; |
1428 | 0 | const char *buffer = repo_get_commit_buffer(the_repository, commit, |
1429 | 0 | &size); |
1430 | 0 | extra = read_commit_extra_header_lines(buffer, size, exclude); |
1431 | 0 | repo_unuse_commit_buffer(the_repository, commit, buffer); |
1432 | 0 | return extra; |
1433 | 0 | } |
1434 | | |
1435 | | int for_each_mergetag(each_mergetag_fn fn, struct commit *commit, void *data) |
1436 | 0 | { |
1437 | 0 | struct commit_extra_header *extra, *to_free; |
1438 | 0 | int res = 0; |
1439 | |
|
1440 | 0 | to_free = read_commit_extra_headers(commit, NULL); |
1441 | 0 | for (extra = to_free; !res && extra; extra = extra->next) { |
1442 | 0 | if (strcmp(extra->key, "mergetag")) |
1443 | 0 | continue; /* not a merge tag */ |
1444 | 0 | res = fn(commit, extra, data); |
1445 | 0 | } |
1446 | 0 | free_commit_extra_headers(to_free); |
1447 | 0 | return res; |
1448 | 0 | } |
1449 | | |
/*
 * Return 1 if the "len" bytes at "field" are exactly one of the
 * standard commit header names ("tree", "parent", "author",
 * "committer", "encoding"), 0 otherwise.  "field" does not need to be
 * NUL-terminated.
 */
static inline int standard_header_field(const char *field, size_t len)
{
	static const struct {
		const char *name;
		size_t len;
	} known[] = {
		{ "tree", 4 },
		{ "parent", 6 },
		{ "author", 6 },
		{ "committer", 9 },
		{ "encoding", 8 },
	};
	size_t i;

	for (i = 0; i < sizeof(known) / sizeof(known[0]); i++) {
		if (len != known[i].len)
			continue;
		if (!memcmp(field, known[i].name, len))
			return 1;
	}
	return 0;
}
1458 | | |
/*
 * Return 1 if the "len" bytes at "field" exactly match one of the
 * strings in the NULL-terminated array "exclude", 0 otherwise.
 * A NULL "exclude" excludes nothing.
 */
static int excluded_header_field(const char *field, size_t len, const char **exclude)
{
	const char **entry;

	if (!exclude)
		return 0;

	for (entry = exclude; *entry; entry++) {
		if (strlen(*entry) != len)
			continue;
		if (!memcmp(field, *entry, len))
			return 1;
	}
	return 0;
}
1472 | | |
1473 | | static struct commit_extra_header *read_commit_extra_header_lines( |
1474 | | const char *buffer, size_t size, |
1475 | | const char **exclude) |
1476 | 0 | { |
1477 | 0 | struct commit_extra_header *extra = NULL, **tail = &extra, *it = NULL; |
1478 | 0 | const char *line, *next, *eof, *eob; |
1479 | 0 | struct strbuf buf = STRBUF_INIT; |
1480 | |
|
1481 | 0 | for (line = buffer, eob = line + size; |
1482 | 0 | line < eob && *line != '\n'; |
1483 | 0 | line = next) { |
1484 | 0 | next = memchr(line, '\n', eob - line); |
1485 | 0 | next = next ? next + 1 : eob; |
1486 | 0 | if (*line == ' ') { |
1487 | | /* continuation */ |
1488 | 0 | if (it) |
1489 | 0 | strbuf_add(&buf, line + 1, next - (line + 1)); |
1490 | 0 | continue; |
1491 | 0 | } |
1492 | 0 | if (it) |
1493 | 0 | it->value = strbuf_detach(&buf, &it->len); |
1494 | 0 | strbuf_reset(&buf); |
1495 | 0 | it = NULL; |
1496 | |
|
1497 | 0 | eof = memchr(line, ' ', next - line); |
1498 | 0 | if (!eof) |
1499 | 0 | eof = next; |
1500 | 0 | else if (standard_header_field(line, eof - line) || |
1501 | 0 | excluded_header_field(line, eof - line, exclude)) |
1502 | 0 | continue; |
1503 | | |
1504 | 0 | CALLOC_ARRAY(it, 1); |
1505 | 0 | it->key = xmemdupz(line, eof-line); |
1506 | 0 | *tail = it; |
1507 | 0 | tail = &it->next; |
1508 | 0 | if (eof + 1 < next) |
1509 | 0 | strbuf_add(&buf, eof + 1, next - (eof + 1)); |
1510 | 0 | } |
1511 | 0 | if (it) |
1512 | 0 | it->value = strbuf_detach(&buf, &it->len); |
1513 | 0 | return extra; |
1514 | 0 | } |
1515 | | |
1516 | | void free_commit_extra_headers(struct commit_extra_header *extra) |
1517 | 0 | { |
1518 | 0 | while (extra) { |
1519 | 0 | struct commit_extra_header *next = extra->next; |
1520 | 0 | free(extra->key); |
1521 | 0 | free(extra->value); |
1522 | 0 | free(extra); |
1523 | 0 | extra = next; |
1524 | 0 | } |
1525 | 0 | } |
1526 | | |
/*
 * Create a commit object through commit_tree_extended(), with no
 * explicit committer and with the "mergetag" headers gathered from
 * "parents" as its extra headers.  Returns what
 * commit_tree_extended() returns.
 */
int commit_tree(const char *msg, size_t msg_len, const struct object_id *tree,
		const struct commit_list *parents, struct object_id *ret,
		const char *author, const char *sign_commit)
{
	struct commit_extra_header *mergetags = NULL;
	struct commit_extra_header **tail = &mergetags;
	int status;

	append_merge_tag_headers(parents, &tail);
	status = commit_tree_extended(msg, msg_len, tree, parents, ret, author,
				      NULL, sign_commit, mergetags);
	free_commit_extra_headers(mergetags);
	return status;
}
1540 | | |
/*
 * Scan the "len" bytes at "buf" and return the offset of the first
 * byte that starts an invalid UTF-8 sequence, or -1 if the whole
 * buffer is acceptable.
 *
 * Besides malformed and truncated sequences, this rejects overlong
 * encodings, values above U+10FFFF, surrogates and the non-characters
 * U+xxFFFE, U+xxFFFF and U+FDD0..U+FDEF.
 */
static int find_invalid_utf8(const char *buf, int len)
{
	static const unsigned int max_codepoint[] = {
		0x7f, 0x7ff, 0xffff, 0x10ffff
	};
	const unsigned char *base = (const unsigned char *)buf;
	const unsigned char *p = base;
	int remaining = len;

	while (remaining) {
		const int lead_at = (int)(p - base);
		unsigned char lead = *p++;
		unsigned int cp, lowest, highest;
		int extra = 0;
		int k;

		remaining--;

		/* Simple US-ASCII? No worries. */
		if (lead < 0x80)
			continue;

		/*
		 * Count how many more high bits are set: that's how
		 * many more bytes this sequence should have.
		 */
		for (; lead & 0x40; lead <<= 1)
			extra++;

		/*
		 * Must be between 1 and 3 more bytes.  Longer sequences result in
		 * codepoints beyond U+10FFFF, which are guaranteed never to exist.
		 */
		if (extra < 1 || extra > 3)
			return lead_at;

		/* Do we *have* that many bytes? */
		if (remaining < extra)
			return lead_at;

		/*
		 * Place the encoded bits at the bottom of the value and compute the
		 * valid range for a sequence of this length.
		 */
		cp = (lead & 0x7f) >> extra;
		lowest = max_codepoint[extra - 1] + 1;
		highest = max_codepoint[extra];

		remaining -= extra;

		/* And verify that they are good continuation bytes */
		for (k = 0; k < extra; k++) {
			const unsigned char cont = *p++;

			cp = (cp << 6) | (cont & 0x3f);
			if ((cont & 0xc0) != 0x80)
				return lead_at;
		}

		/* Reject codepoints that are out of range for the sequence length. */
		if (cp < lowest || cp > highest)
			return lead_at;
		/* Surrogates are only for UTF-16 and cannot be encoded in UTF-8. */
		if ((cp & 0x1ff800) == 0xd800)
			return lead_at;
		/* U+xxFFFE and U+xxFFFF are guaranteed non-characters. */
		if ((cp & 0xfffe) == 0xfffe)
			return lead_at;
		/* So are anything in the range U+FDD0..U+FDEF. */
		if (cp >= 0xfdd0 && cp <= 0xfdef)
			return lead_at;
	}
	return -1;
}
1618 | | |
1619 | | /* |
1620 | | * This verifies that the buffer is in proper utf8 format. |
1621 | | * |
1622 | | * If it isn't, it assumes any non-utf8 characters are Latin1, |
1623 | | * and does the conversion. |
1624 | | */ |
1625 | | static int verify_utf8(struct strbuf *buf) |
1626 | 0 | { |
1627 | 0 | int ok = 1; |
1628 | 0 | long pos = 0; |
1629 | |
|
1630 | 0 | for (;;) { |
1631 | 0 | int bad; |
1632 | 0 | unsigned char c; |
1633 | 0 | unsigned char replace[2]; |
1634 | |
|
1635 | 0 | bad = find_invalid_utf8(buf->buf + pos, buf->len - pos); |
1636 | 0 | if (bad < 0) |
1637 | 0 | return ok; |
1638 | 0 | pos += bad; |
1639 | 0 | ok = 0; |
1640 | 0 | c = buf->buf[pos]; |
1641 | 0 | strbuf_remove(buf, pos, 1); |
1642 | | |
1643 | | /* We know 'c' must be in the range 128-255 */ |
1644 | 0 | replace[0] = 0xc0 + (c >> 6); |
1645 | 0 | replace[1] = 0x80 + (c & 0x3f); |
1646 | 0 | strbuf_insert(buf, pos, replace, 2); |
1647 | 0 | pos += 2; |
1648 | 0 | } |
1649 | 0 | } |
1650 | | |
/*
 * Warning printed (after translation) by commit_tree_extended() when
 * the commit text is expected to be UTF-8 but had to be fixed up by
 * verify_utf8().
 */
static const char commit_utf8_warn[] =
N_("Warning: commit message did not conform to UTF-8.\n"
   "You may want to amend it after fixing the message, or set the config\n"
   "variable i18n.commitEncoding to the encoding your project uses.\n");
1655 | | |
1656 | | static void write_commit_tree(struct strbuf *buffer, const char *msg, size_t msg_len, |
1657 | | const struct object_id *tree, |
1658 | | const struct object_id *parents, size_t parents_len, |
1659 | | const char *author, const char *committer, |
1660 | | const struct commit_extra_header *extra) |
1661 | 0 | { |
1662 | 0 | int encoding_is_utf8; |
1663 | 0 | size_t i; |
1664 | | |
1665 | | /* Not having i18n.commitencoding is the same as having utf-8 */ |
1666 | 0 | encoding_is_utf8 = is_encoding_utf8(git_commit_encoding); |
1667 | |
|
1668 | 0 | strbuf_grow(buffer, 8192); /* should avoid reallocs for the headers */ |
1669 | 0 | strbuf_addf(buffer, "tree %s\n", oid_to_hex(tree)); |
1670 | | |
1671 | | /* |
1672 | | * NOTE! This ordering means that the same exact tree merged with a |
1673 | | * different order of parents will be a _different_ changeset even |
1674 | | * if everything else stays the same. |
1675 | | */ |
1676 | 0 | for (i = 0; i < parents_len; i++) |
1677 | 0 | strbuf_addf(buffer, "parent %s\n", oid_to_hex(&parents[i])); |
1678 | | |
1679 | | /* Person/date information */ |
1680 | 0 | if (!author) |
1681 | 0 | author = git_author_info(IDENT_STRICT); |
1682 | 0 | strbuf_addf(buffer, "author %s\n", author); |
1683 | 0 | if (!committer) |
1684 | 0 | committer = git_committer_info(IDENT_STRICT); |
1685 | 0 | strbuf_addf(buffer, "committer %s\n", committer); |
1686 | 0 | if (!encoding_is_utf8) |
1687 | 0 | strbuf_addf(buffer, "encoding %s\n", git_commit_encoding); |
1688 | |
|
1689 | 0 | while (extra) { |
1690 | 0 | add_extra_header(buffer, extra); |
1691 | 0 | extra = extra->next; |
1692 | 0 | } |
1693 | 0 | strbuf_addch(buffer, '\n'); |
1694 | | |
1695 | | /* And add the comment */ |
1696 | 0 | strbuf_add(buffer, msg, msg_len); |
1697 | 0 | } |
1698 | | |
1699 | | int commit_tree_extended(const char *msg, size_t msg_len, |
1700 | | const struct object_id *tree, |
1701 | | const struct commit_list *parents, struct object_id *ret, |
1702 | | const char *author, const char *committer, |
1703 | | const char *sign_commit, |
1704 | | const struct commit_extra_header *extra) |
1705 | 0 | { |
1706 | 0 | struct repository *r = the_repository; |
1707 | 0 | int result = 0; |
1708 | 0 | int encoding_is_utf8; |
1709 | 0 | struct strbuf buffer = STRBUF_INIT, compat_buffer = STRBUF_INIT; |
1710 | 0 | struct strbuf sig = STRBUF_INIT, compat_sig = STRBUF_INIT; |
1711 | 0 | struct object_id *parent_buf = NULL, *compat_oid = NULL; |
1712 | 0 | struct object_id compat_oid_buf; |
1713 | 0 | size_t i, nparents; |
1714 | | |
1715 | | /* Not having i18n.commitencoding is the same as having utf-8 */ |
1716 | 0 | encoding_is_utf8 = is_encoding_utf8(git_commit_encoding); |
1717 | |
|
1718 | 0 | assert_oid_type(tree, OBJ_TREE); |
1719 | |
|
1720 | 0 | if (memchr(msg, '\0', msg_len)) |
1721 | 0 | return error("a NUL byte in commit log message not allowed."); |
1722 | | |
1723 | 0 | nparents = commit_list_count(parents); |
1724 | 0 | CALLOC_ARRAY(parent_buf, nparents); |
1725 | 0 | i = 0; |
1726 | 0 | for (const struct commit_list *p = parents; p; p = p->next) |
1727 | 0 | oidcpy(&parent_buf[i++], &p->item->object.oid); |
1728 | |
|
1729 | 0 | write_commit_tree(&buffer, msg, msg_len, tree, parent_buf, nparents, author, committer, extra); |
1730 | 0 | if (sign_commit && sign_commit_to_strbuf(&sig, &buffer, sign_commit)) { |
1731 | 0 | result = -1; |
1732 | 0 | goto out; |
1733 | 0 | } |
1734 | 0 | if (r->compat_hash_algo) { |
1735 | 0 | struct commit_extra_header *compat_extra = NULL; |
1736 | 0 | struct object_id mapped_tree; |
1737 | 0 | struct object_id *mapped_parents; |
1738 | |
|
1739 | 0 | CALLOC_ARRAY(mapped_parents, nparents); |
1740 | |
|
1741 | 0 | if (repo_oid_to_algop(r, tree, r->compat_hash_algo, &mapped_tree)) { |
1742 | 0 | result = -1; |
1743 | 0 | free(mapped_parents); |
1744 | 0 | goto out; |
1745 | 0 | } |
1746 | 0 | for (i = 0; i < nparents; i++) |
1747 | 0 | if (repo_oid_to_algop(r, &parent_buf[i], r->compat_hash_algo, &mapped_parents[i])) { |
1748 | 0 | result = -1; |
1749 | 0 | free(mapped_parents); |
1750 | 0 | goto out; |
1751 | 0 | } |
1752 | 0 | if (convert_commit_extra_headers(extra, &compat_extra)) { |
1753 | 0 | result = -1; |
1754 | 0 | free(mapped_parents); |
1755 | 0 | goto out; |
1756 | 0 | } |
1757 | 0 | write_commit_tree(&compat_buffer, msg, msg_len, &mapped_tree, |
1758 | 0 | mapped_parents, nparents, author, committer, compat_extra); |
1759 | 0 | free_commit_extra_headers(compat_extra); |
1760 | 0 | free(mapped_parents); |
1761 | |
|
1762 | 0 | if (sign_commit && sign_commit_to_strbuf(&compat_sig, &compat_buffer, sign_commit)) { |
1763 | 0 | result = -1; |
1764 | 0 | goto out; |
1765 | 0 | } |
1766 | 0 | } |
1767 | | |
1768 | 0 | if (sign_commit) { |
1769 | 0 | struct sig_pairs { |
1770 | 0 | struct strbuf *sig; |
1771 | 0 | const struct git_hash_algo *algo; |
1772 | 0 | } bufs [2] = { |
1773 | 0 | { &compat_sig, r->compat_hash_algo }, |
1774 | 0 | { &sig, r->hash_algo }, |
1775 | 0 | }; |
1776 | 0 | int i; |
1777 | | |
1778 | | /* |
1779 | | * We write algorithms in the order they were implemented in |
1780 | | * Git to produce a stable hash when multiple algorithms are |
1781 | | * used. |
1782 | | */ |
1783 | 0 | if (r->compat_hash_algo && hash_algo_by_ptr(bufs[0].algo) > hash_algo_by_ptr(bufs[1].algo)) |
1784 | 0 | SWAP(bufs[0], bufs[1]); |
1785 | | |
1786 | | /* |
1787 | | * We traverse each algorithm in order, and apply the signature |
1788 | | * to each buffer. |
1789 | | */ |
1790 | 0 | for (i = 0; i < ARRAY_SIZE(bufs); i++) { |
1791 | 0 | if (!bufs[i].algo) |
1792 | 0 | continue; |
1793 | 0 | add_header_signature(&buffer, bufs[i].sig, bufs[i].algo); |
1794 | 0 | if (r->compat_hash_algo) |
1795 | 0 | add_header_signature(&compat_buffer, bufs[i].sig, bufs[i].algo); |
1796 | 0 | } |
1797 | 0 | } |
1798 | | |
1799 | | /* And check the encoding. */ |
1800 | 0 | if (encoding_is_utf8 && (!verify_utf8(&buffer) || !verify_utf8(&compat_buffer))) |
1801 | 0 | fprintf(stderr, _(commit_utf8_warn)); |
1802 | |
|
1803 | 0 | if (r->compat_hash_algo) { |
1804 | 0 | hash_object_file(r->compat_hash_algo, compat_buffer.buf, compat_buffer.len, |
1805 | 0 | OBJ_COMMIT, &compat_oid_buf); |
1806 | 0 | compat_oid = &compat_oid_buf; |
1807 | 0 | } |
1808 | |
|
1809 | 0 | result = write_object_file_flags(buffer.buf, buffer.len, OBJ_COMMIT, |
1810 | 0 | ret, compat_oid, 0); |
1811 | 0 | out: |
1812 | 0 | free(parent_buf); |
1813 | 0 | strbuf_release(&buffer); |
1814 | 0 | strbuf_release(&compat_buffer); |
1815 | 0 | strbuf_release(&sig); |
1816 | 0 | strbuf_release(&compat_sig); |
1817 | 0 | return result; |
1818 | 0 | } |
1819 | | |
/*
 * Per-commit side table that associates a commit with a
 * "struct merge_remote_desc *".  It is read by merge_remote_util() and
 * written by set_merge_remote_desc().
 *
 * NOTE(review): the first argument to COMMIT_SLAB_INIT is presumably the
 * slab stride (one pointer per commit) -- confirm against commit-slab.h.
 */
define_commit_slab(merge_desc_slab, struct merge_remote_desc *);
static struct merge_desc_slab merge_desc_slab = COMMIT_SLAB_INIT(1, merge_desc_slab);
1822 | | |
1823 | | struct merge_remote_desc *merge_remote_util(const struct commit *commit) |
1824 | 0 | { |
1825 | 0 | return *merge_desc_slab_at(&merge_desc_slab, commit); |
1826 | 0 | } |
1827 | | |
1828 | | void set_merge_remote_desc(struct commit *commit, |
1829 | | const char *name, struct object *obj) |
1830 | 0 | { |
1831 | 0 | struct merge_remote_desc *desc; |
1832 | 0 | FLEX_ALLOC_STR(desc, name, name); |
1833 | 0 | desc->obj = obj; |
1834 | 0 | *merge_desc_slab_at(&merge_desc_slab, commit) = desc; |
1835 | 0 | } |
1836 | | |
1837 | | struct commit *get_merge_parent(const char *name) |
1838 | 0 | { |
1839 | 0 | struct object *obj; |
1840 | 0 | struct commit *commit; |
1841 | 0 | struct object_id oid; |
1842 | 0 | if (repo_get_oid(the_repository, name, &oid)) |
1843 | 0 | return NULL; |
1844 | 0 | obj = parse_object(the_repository, &oid); |
1845 | 0 | commit = (struct commit *)repo_peel_to_type(the_repository, name, 0, |
1846 | 0 | obj, OBJ_COMMIT); |
1847 | 0 | if (commit && !merge_remote_util(commit)) |
1848 | 0 | set_merge_remote_desc(commit, name, obj); |
1849 | 0 | return commit; |
1850 | 0 | } |
1851 | | |
1852 | | /* |
1853 | | * Append a commit to the end of the commit_list. |
1854 | | * |
1855 | | * next starts by pointing to the variable that holds the head of an |
1856 | | * empty commit_list, and is updated to point to the "next" field of |
1857 | | * the last item on the list as new commits are appended. |
1858 | | * |
1859 | | * Usage example: |
1860 | | * |
1861 | | * struct commit_list *list; |
1862 | | * struct commit_list **next = &list; |
1863 | | * |
1864 | | * next = commit_list_append(c1, next); |
1865 | | * next = commit_list_append(c2, next); |
1866 | | * assert(commit_list_count(list) == 2); |
1867 | | * return list; |
1868 | | */ |
1869 | | struct commit_list **commit_list_append(struct commit *commit, |
1870 | | struct commit_list **next) |
1871 | 0 | { |
1872 | 0 | struct commit_list *new_commit = xmalloc(sizeof(struct commit_list)); |
1873 | 0 | new_commit->item = commit; |
1874 | 0 | *next = new_commit; |
1875 | 0 | new_commit->next = NULL; |
1876 | 0 | return &new_commit->next; |
1877 | 0 | } |
1878 | | |
/*
 * Find the first line of the form "<key> <value>" in "msg".
 *
 * Lines are examined in order, and the search gives up at the first empty
 * line or at the end of the NUL-terminated buffer.  A line matches only if
 * "key" is followed directly by a single space; a line consisting of just
 * "key" does not match.
 *
 * On a match, returns a pointer to the first byte of the value (it points
 * into "msg" and is not NUL-terminated at the end of the line) and stores
 * the value's length, excluding the newline, in "*out_len".  Returns NULL
 * without touching "*out_len" when there is no match or "msg" is NULL.
 */
const char *find_commit_header(const char *msg, const char *key, size_t *out_len)
{
	/* Keep lengths in size_t; strlen() does not return an int. */
	const size_t key_len = strlen(key);
	const char *line = msg;

	while (line) {
		const char *eol = strchrnul(line, '\n');
		const size_t line_len = eol - line;

		/* An empty line (or the end of the buffer) ends the search. */
		if (!line_len)
			return NULL;

		if (line_len > key_len &&
		    !strncmp(line, key, key_len) &&
		    line[key_len] == ' ') {
			*out_len = line_len - key_len - 1;
			return line + key_len + 1;
		}
		line = *eol ? eol + 1 : NULL;
	}
	return NULL;
}
1900 | | |
1901 | | /* |
1902 | | * Inspect the given string and determine the true "end" of the log message, in |
1903 | | * order to find where to put a new Signed-off-by trailer. Ignored are |
1904 | | * trailing comment lines and blank lines. To support "git commit -s |
1905 | | * --amend" on an existing commit, we also ignore "Conflicts:". To |
1906 | | * support "git commit -v", we truncate at cut lines. |
1907 | | * |
1908 | | * Returns the number of bytes from the tail to ignore, to be fed as |
1909 | | * the second parameter to append_signoff(). |
1910 | | */ |
1911 | | size_t ignored_log_message_bytes(const char *buf, size_t len) |
1912 | 0 | { |
1913 | 0 | size_t boc = 0; |
1914 | 0 | size_t bol = 0; |
1915 | 0 | int in_old_conflicts_block = 0; |
1916 | 0 | size_t cutoff = wt_status_locate_end(buf, len); |
1917 | |
|
1918 | 0 | while (bol < cutoff) { |
1919 | 0 | const char *next_line = memchr(buf + bol, '\n', len - bol); |
1920 | |
|
1921 | 0 | if (!next_line) |
1922 | 0 | next_line = buf + len; |
1923 | 0 | else |
1924 | 0 | next_line++; |
1925 | |
|
1926 | 0 | if (starts_with_mem(buf + bol, cutoff - bol, comment_line_str) || |
1927 | 0 | buf[bol] == '\n') { |
1928 | | /* is this the first of the run of comments? */ |
1929 | 0 | if (!boc) |
1930 | 0 | boc = bol; |
1931 | | /* otherwise, it is just continuing */ |
1932 | 0 | } else if (starts_with(buf + bol, "Conflicts:\n")) { |
1933 | 0 | in_old_conflicts_block = 1; |
1934 | 0 | if (!boc) |
1935 | 0 | boc = bol; |
1936 | 0 | } else if (in_old_conflicts_block && buf[bol] == '\t') { |
1937 | 0 | ; /* a pathname in the conflicts block */ |
1938 | 0 | } else if (boc) { |
1939 | | /* the previous was not trailing comment */ |
1940 | 0 | boc = 0; |
1941 | 0 | in_old_conflicts_block = 0; |
1942 | 0 | } |
1943 | 0 | bol = next_line - buf; |
1944 | 0 | } |
1945 | 0 | return boc ? len - boc : len - cutoff; |
1946 | 0 | } |
1947 | | |
1948 | | int run_commit_hook(int editor_is_used, const char *index_file, |
1949 | | int *invoked_hook, const char *name, ...) |
1950 | 0 | { |
1951 | 0 | struct run_hooks_opt opt = RUN_HOOKS_OPT_INIT; |
1952 | 0 | va_list args; |
1953 | 0 | const char *arg; |
1954 | |
|
1955 | 0 | strvec_pushf(&opt.env, "GIT_INDEX_FILE=%s", index_file); |
1956 | | |
1957 | | /* |
1958 | | * Let the hook know that no editor will be launched. |
1959 | | */ |
1960 | 0 | if (!editor_is_used) |
1961 | 0 | strvec_push(&opt.env, "GIT_EDITOR=:"); |
1962 | |
|
1963 | 0 | va_start(args, name); |
1964 | 0 | while ((arg = va_arg(args, const char *))) |
1965 | 0 | strvec_push(&opt.args, arg); |
1966 | 0 | va_end(args); |
1967 | |
|
1968 | 0 | opt.invoked_hook = invoked_hook; |
1969 | 0 | return run_hooks_opt(the_repository, name, &opt); |
1970 | 0 | } |