Coverage Report

Created: 2026-01-09 07:10

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/git/entry.c
Line
Count
Source
1
#define USE_THE_REPOSITORY_VARIABLE
2
3
#include "git-compat-util.h"
4
#include "odb.h"
5
#include "odb/streaming.h"
6
#include "dir.h"
7
#include "environment.h"
8
#include "gettext.h"
9
#include "hex.h"
10
#include "name-hash.h"
11
#include "sparse-index.h"
12
#include "submodule.h"
13
#include "symlinks.h"
14
#include "progress.h"
15
#include "fsmonitor.h"
16
#include "entry.h"
17
#include "parallel-checkout.h"
18
19
static void create_directories(const char *path, int path_len,
20
             const struct checkout *state)
21
0
{
22
0
  char *buf = xmallocz(path_len);
23
0
  int len = 0;
24
25
0
  while (len < path_len) {
26
0
    do {
27
0
      buf[len] = path[len];
28
0
      len++;
29
0
    } while (len < path_len && path[len] != '/');
30
0
    if (len >= path_len)
31
0
      break;
32
0
    buf[len] = 0;
33
34
    /*
35
     * For 'checkout-index --prefix=<dir>', <dir> is
36
     * allowed to be a symlink to an existing directory,
37
     * and we set 'state->base_dir_len' below, such that
38
     * we test the path components of the prefix with the
39
     * stat() function instead of the lstat() function.
40
     */
41
0
    if (has_dirs_only_path(buf, len, state->base_dir_len))
42
0
      continue; /* ok, it is already a directory. */
43
44
    /*
45
     * If this mkdir() would fail, it could be that there
46
     * is already a symlink or something else exists
47
     * there, therefore we then try to unlink it and try
48
     * one more time to create the directory.
49
     */
50
0
    if (mkdir(buf, 0777)) {
51
0
      if (errno == EEXIST && state->force &&
52
0
          !unlink_or_warn(buf) && !mkdir(buf, 0777))
53
0
        continue;
54
0
      die_errno("cannot create directory at '%s'", buf);
55
0
    }
56
0
  }
57
0
  free(buf);
58
0
}
59
60
static void remove_subtree(struct strbuf *path)
61
0
{
62
0
  DIR *dir = opendir(path->buf);
63
0
  struct dirent *de;
64
0
  int origlen = path->len;
65
66
0
  if (!dir)
67
0
    die_errno("cannot opendir '%s'", path->buf);
68
0
  while ((de = readdir_skip_dot_and_dotdot(dir)) != NULL) {
69
0
    struct stat st;
70
71
0
    strbuf_addch(path, '/');
72
0
    strbuf_addstr(path, de->d_name);
73
0
    if (lstat(path->buf, &st))
74
0
      die_errno("cannot lstat '%s'", path->buf);
75
0
    if (S_ISDIR(st.st_mode))
76
0
      remove_subtree(path);
77
0
    else if (unlink(path->buf))
78
0
      die_errno("cannot unlink '%s'", path->buf);
79
0
    strbuf_setlen(path, origlen);
80
0
  }
81
0
  closedir(dir);
82
0
  if (rmdir(path->buf))
83
0
    die_errno("cannot rmdir '%s'", path->buf);
84
0
}
85
86
/*
 * Exclusively create 'path' for writing and return the descriptor
 * from open(). Only the owner-execute bit of 'mode' matters: it
 * selects 0777 over 0666 as the creation mode.
 */
static int create_file(const char *path, unsigned int mode)
{
  unsigned int perm = 0666;

  if (mode & 0100)
    perm = 0777;
  return open(path, O_WRONLY | O_CREAT | O_EXCL, perm);
}
91
92
void *read_blob_entry(const struct cache_entry *ce, size_t *size)
93
0
{
94
0
  enum object_type type;
95
0
  unsigned long ul;
96
0
  void *blob_data = odb_read_object(the_repository->objects, &ce->oid,
97
0
            &type, &ul);
98
99
0
  *size = ul;
100
0
  if (blob_data) {
101
0
    if (type == OBJ_BLOB)
102
0
      return blob_data;
103
0
    free(blob_data);
104
0
  }
105
0
  return NULL;
106
0
}
107
108
static int open_output_fd(char *path, const struct cache_entry *ce, int to_tempfile)
109
0
{
110
0
  int symlink = (ce->ce_mode & S_IFMT) != S_IFREG;
111
0
  if (to_tempfile) {
112
0
    xsnprintf(path, TEMPORARY_FILENAME_LENGTH, "%s",
113
0
        symlink ? ".merge_link_XXXXXX" : ".merge_file_XXXXXX");
114
0
    return mkstemp(path);
115
0
  } else {
116
0
    return create_file(path, !symlink ? ce->ce_mode : 0666);
117
0
  }
118
0
}
119
120
int fstat_checkout_output(int fd, const struct checkout *state, struct stat *st)
121
0
{
122
  /* use fstat() only when path == ce->name */
123
0
  if (fstat_is_reliable() &&
124
0
      state->refresh_cache && !state->base_dir_len) {
125
0
    return !fstat(fd, st);
126
0
  }
127
0
  return 0;
128
0
}
129
130
static int streaming_write_entry(const struct cache_entry *ce, char *path,
131
         struct stream_filter *filter,
132
         const struct checkout *state, int to_tempfile,
133
         int *fstat_done, struct stat *statbuf)
134
0
{
135
0
  int result = 0;
136
0
  int fd;
137
138
0
  fd = open_output_fd(path, ce, to_tempfile);
139
0
  if (fd < 0)
140
0
    return -1;
141
142
0
  result |= odb_stream_blob_to_fd(the_repository->objects, fd, &ce->oid, filter, 1);
143
0
  *fstat_done = fstat_checkout_output(fd, state, statbuf);
144
0
  result |= close(fd);
145
146
0
  if (result)
147
0
    unlink(path);
148
0
  return result;
149
0
}
150
151
void enable_delayed_checkout(struct checkout *state)
152
0
{
153
0
  if (!state->delayed_checkout) {
154
0
    state->delayed_checkout = xmalloc(sizeof(*state->delayed_checkout));
155
0
    state->delayed_checkout->state = CE_CAN_DELAY;
156
0
    string_list_init_nodup(&state->delayed_checkout->filters);
157
0
    string_list_init_nodup(&state->delayed_checkout->paths);
158
0
  }
159
0
}
160
161
static int remove_available_paths(struct string_list_item *item, void *cb_data)
162
0
{
163
0
  struct string_list *available_paths = cb_data;
164
0
  struct string_list_item *available;
165
166
0
  available = string_list_lookup(available_paths, item->string);
167
0
  if (available)
168
0
    available->util = item->util;
169
0
  return !available;
170
0
}
171
172
/* filter_string_list() callback: 1 if the item's string is set, else 0. */
static int string_is_not_null(struct string_list_item *item, void *data UNUSED)
{
  return item->string != NULL;
}
176
177
int finish_delayed_checkout(struct checkout *state, int show_progress)
178
0
{
179
0
  int errs = 0;
180
0
  unsigned processed_paths = 0;
181
0
  off_t filtered_bytes = 0;
182
0
  struct string_list_item *filter, *path;
183
0
  struct progress *progress = NULL;
184
0
  struct delayed_checkout *dco = state->delayed_checkout;
185
186
0
  if (!state->delayed_checkout)
187
0
    return errs;
188
189
0
  dco->state = CE_RETRY;
190
0
  if (show_progress)
191
0
    progress = start_delayed_progress(the_repository,
192
0
              _("Filtering content"),
193
0
              dco->paths.nr);
194
0
  while (dco->filters.nr > 0) {
195
0
    for_each_string_list_item(filter, &dco->filters) {
196
0
      struct string_list available_paths = STRING_LIST_INIT_DUP;
197
198
0
      if (!async_query_available_blobs(filter->string, &available_paths)) {
199
        /* Filter reported an error */
200
0
        errs = 1;
201
0
        filter->string = NULL;
202
0
        continue;
203
0
      }
204
0
      if (available_paths.nr <= 0) {
205
        /*
206
         * Filter responded with no entries. That means
207
         * the filter is done and we can remove the
208
         * filter from the list (see
209
         * "string_list_remove_empty_items" call below).
210
         */
211
0
        filter->string = NULL;
212
0
        continue;
213
0
      }
214
215
      /*
216
       * In dco->paths we store a list of all delayed paths.
217
       * The filter just send us a list of available paths.
218
       * Remove them from the list.
219
       */
220
0
      filter_string_list(&dco->paths, 0,
221
0
        &remove_available_paths, &available_paths);
222
223
0
      for_each_string_list_item(path, &available_paths) {
224
0
        struct cache_entry* ce;
225
226
0
        if (!path->util) {
227
0
          error("external filter '%s' signaled that '%s' "
228
0
                "is now available although it has not been "
229
0
                "delayed earlier",
230
0
                filter->string, path->string);
231
0
          errs |= 1;
232
233
          /*
234
           * Do not ask the filter for available blobs,
235
           * again, as the filter is likely buggy.
236
           */
237
0
          filter->string = NULL;
238
0
          continue;
239
0
        }
240
0
        ce = index_file_exists(state->istate, path->string,
241
0
                   strlen(path->string), 0);
242
0
        if (ce) {
243
0
          display_progress(progress, ++processed_paths);
244
0
          errs |= checkout_entry(ce, state, NULL, path->util);
245
0
          filtered_bytes += ce->ce_stat_data.sd_size;
246
0
          display_throughput(progress, filtered_bytes);
247
0
        } else
248
0
          errs = 1;
249
0
      }
250
251
0
      string_list_clear(&available_paths, 0);
252
0
    }
253
254
0
    filter_string_list(&dco->filters, 0, string_is_not_null, NULL);
255
0
  }
256
0
  stop_progress(&progress);
257
0
  string_list_clear(&dco->filters, 0);
258
259
  /* At this point we should not have any delayed paths anymore. */
260
0
  errs |= dco->paths.nr;
261
0
  for_each_string_list_item(path, &dco->paths) {
262
0
    error("'%s' was not filtered properly", path->string);
263
0
  }
264
0
  string_list_clear(&dco->paths, 0);
265
266
0
  free(dco);
267
0
  state->delayed_checkout = NULL;
268
269
0
  return errs;
270
0
}
271
272
void update_ce_after_write(const struct checkout *state, struct cache_entry *ce,
273
         struct stat *st)
274
0
{
275
0
  if (state->refresh_cache) {
276
0
    assert(state->istate);
277
0
    fill_stat_cache_info(state->istate, ce, st);
278
0
    ce->ce_flags |= CE_UPDATE_IN_BASE;
279
0
    mark_fsmonitor_invalid(state->istate, ce);
280
0
    state->istate->cache_changed |= CE_ENTRY_CHANGED;
281
0
  }
282
0
}
283
284
/* Note: ca is used (and required) iff the entry refers to a regular file. */
285
static int write_entry(struct cache_entry *ce, char *path, struct conv_attrs *ca,
286
           const struct checkout *state, int to_tempfile,
287
           int *nr_checkouts)
288
0
{
289
0
  unsigned int ce_mode_s_ifmt = ce->ce_mode & S_IFMT;
290
0
  struct delayed_checkout *dco = state->delayed_checkout;
291
0
  int fd, ret, fstat_done = 0;
292
0
  char *new_blob;
293
0
  struct strbuf buf = STRBUF_INIT;
294
0
  size_t size;
295
0
  ssize_t wrote;
296
0
  size_t newsize = 0;
297
0
  struct stat st;
298
0
  const struct submodule *sub;
299
0
  struct checkout_metadata meta;
300
0
  static int scratch_nr_checkouts;
301
302
0
  clone_checkout_metadata(&meta, &state->meta, &ce->oid);
303
304
0
  if (ce_mode_s_ifmt == S_IFREG) {
305
0
    struct stream_filter *filter = get_stream_filter_ca(ca, &ce->oid);
306
0
    if (filter &&
307
0
        !streaming_write_entry(ce, path, filter,
308
0
             state, to_tempfile,
309
0
             &fstat_done, &st))
310
0
      goto finish;
311
0
  }
312
313
0
  switch (ce_mode_s_ifmt) {
314
0
  case S_IFLNK:
315
0
    new_blob = read_blob_entry(ce, &size);
316
0
    if (!new_blob)
317
0
      return error("unable to read sha1 file of %s (%s)",
318
0
             ce->name, oid_to_hex(&ce->oid));
319
320
    /*
321
     * We can't make a real symlink; write out a regular file entry
322
     * with the symlink destination as its contents.
323
     */
324
0
    if (!has_symlinks || to_tempfile)
325
0
      goto write_file_entry;
326
327
0
    ret = symlink(new_blob, path);
328
0
    free(new_blob);
329
0
    if (ret)
330
0
      return error_errno("unable to create symlink %s", path);
331
0
    break;
332
333
0
  case S_IFREG:
334
    /*
335
     * We do not send the blob in case of a retry, so do not
336
     * bother reading it at all.
337
     */
338
0
    if (dco && dco->state == CE_RETRY) {
339
0
      new_blob = NULL;
340
0
      size = 0;
341
0
    } else {
342
0
      new_blob = read_blob_entry(ce, &size);
343
0
      if (!new_blob)
344
0
        return error("unable to read sha1 file of %s (%s)",
345
0
               ce->name, oid_to_hex(&ce->oid));
346
0
    }
347
348
    /*
349
     * Convert from git internal format to working tree format
350
     */
351
0
    if (dco && dco->state != CE_NO_DELAY) {
352
0
      ret = async_convert_to_working_tree_ca(ca, ce->name,
353
0
                     new_blob, size,
354
0
                     &buf, &meta, dco);
355
0
      if (ret) {
356
0
        struct string_list_item *item =
357
0
          string_list_lookup(&dco->paths, ce->name);
358
0
        if (item) {
359
0
          item->util = nr_checkouts ? nr_checkouts
360
0
              : &scratch_nr_checkouts;
361
0
          free(new_blob);
362
0
          goto delayed;
363
0
        }
364
0
      }
365
0
    } else {
366
0
      ret = convert_to_working_tree_ca(ca, ce->name, new_blob,
367
0
               size, &buf, &meta);
368
0
    }
369
370
0
    if (ret) {
371
0
      free(new_blob);
372
0
      new_blob = strbuf_detach(&buf, &newsize);
373
0
      size = newsize;
374
0
    }
375
    /*
376
     * No "else" here as errors from convert are OK at this
377
     * point. If the error would have been fatal (e.g.
378
     * filter is required), then we would have died already.
379
     */
380
381
0
  write_file_entry:
382
0
    fd = open_output_fd(path, ce, to_tempfile);
383
0
    if (fd < 0) {
384
0
      free(new_blob);
385
0
      return error_errno("unable to create file %s", path);
386
0
    }
387
388
0
    wrote = write_in_full(fd, new_blob, size);
389
0
    if (!to_tempfile)
390
0
      fstat_done = fstat_checkout_output(fd, state, &st);
391
0
    close(fd);
392
0
    free(new_blob);
393
0
    if (wrote < 0)
394
0
      return error("unable to write file %s", path);
395
0
    break;
396
397
0
  case S_IFGITLINK:
398
0
    if (to_tempfile)
399
0
      return error("cannot create temporary submodule %s", ce->name);
400
0
    if (mkdir(path, 0777) < 0)
401
0
      return error("cannot create submodule directory %s", path);
402
0
    sub = submodule_from_ce(ce);
403
0
    if (sub)
404
0
      return submodule_move_head(ce->name, state->super_prefix,
405
0
        NULL, oid_to_hex(&ce->oid),
406
0
        state->force ? SUBMODULE_MOVE_HEAD_FORCE : 0);
407
0
    break;
408
409
0
  default:
410
0
    return error("unknown file mode for %s in index", ce->name);
411
0
  }
412
413
0
finish:
414
0
  if (state->refresh_cache) {
415
0
    if (!fstat_done && lstat(ce->name, &st) < 0)
416
0
      return error_errno("unable to stat just-written file %s",
417
0
             ce->name);
418
0
    update_ce_after_write(state, ce , &st);
419
0
  }
420
0
  if (nr_checkouts)
421
0
    (*nr_checkouts)++;
422
0
delayed:
423
0
  return 0;
424
0
}
425
426
/*
 * This is like 'lstat()', except it refuses to follow symlinks
 * in the path, after skipping "skiplen": if the leading part of
 * 'path' (everything before its last '/') does not pass
 * has_dirs_only_path(), fail with errno set to ENOENT.
 */
static int check_path(const char *path, int len, struct stat *st, int skiplen)
{
  int dir_len = len;

  /* Walk back to the last '/', or to the start if there is none. */
  while (dir_len > 0 && path[dir_len] != '/')
    dir_len--;

  if (has_dirs_only_path(path, dir_len, skiplen))
    return lstat(path, st);

  errno = ENOENT;
  return -1;
}
442
443
static void mark_colliding_entries(const struct checkout *state,
444
           struct cache_entry *ce, struct stat *st)
445
0
{
446
0
  int trust_ino = check_stat;
447
448
#if defined(GIT_WINDOWS_NATIVE) || defined(__CYGWIN__)
449
  trust_ino = 0;
450
#endif
451
452
0
  ce->ce_flags |= CE_MATCHED;
453
454
  /* TODO: audit for interaction with sparse-index. */
455
0
  ensure_full_index(state->istate);
456
0
  for (size_t i = 0; i < state->istate->cache_nr; i++) {
457
0
    struct cache_entry *dup = state->istate->cache[i];
458
459
0
    if (dup == ce) {
460
      /*
461
       * Parallel checkout doesn't create the files in index
462
       * order. So the other side of the collision may appear
463
       * after the given cache_entry in the array.
464
       */
465
0
      if (parallel_checkout_status() == PC_RUNNING)
466
0
        continue;
467
0
      else
468
0
        break;
469
0
    }
470
471
0
    if (dup->ce_flags & (CE_MATCHED | CE_VALID | CE_SKIP_WORKTREE))
472
0
      continue;
473
474
0
    if ((trust_ino && !match_stat_data(&dup->ce_stat_data, st)) ||
475
0
        paths_collide(ce->name, dup->name)) {
476
0
      dup->ce_flags |= CE_MATCHED;
477
0
      break;
478
0
    }
479
0
  }
480
0
}
481
482
int checkout_entry_ca(struct cache_entry *ce, struct conv_attrs *ca,
483
          const struct checkout *state, char *topath,
484
          int *nr_checkouts)
485
0
{
486
0
  static struct strbuf path = STRBUF_INIT;
487
0
  struct stat st;
488
0
  struct conv_attrs ca_buf;
489
490
0
  if (ce->ce_flags & CE_WT_REMOVE) {
491
0
    if (topath)
492
      /*
493
       * No content and thus no path to create, so we have
494
       * no pathname to return.
495
       */
496
0
      BUG("Can't remove entry to a path");
497
0
    unlink_entry(ce, state->super_prefix);
498
0
    return 0;
499
0
  }
500
501
0
  if (topath) {
502
0
    if (S_ISREG(ce->ce_mode) && !ca) {
503
0
      convert_attrs(state->istate, &ca_buf, ce->name);
504
0
      ca = &ca_buf;
505
0
    }
506
0
    return write_entry(ce, topath, ca, state, 1, nr_checkouts);
507
0
  }
508
509
0
  strbuf_reset(&path);
510
0
  strbuf_add(&path, state->base_dir, state->base_dir_len);
511
0
  strbuf_add(&path, ce->name, ce_namelen(ce));
512
513
0
  if (!check_path(path.buf, path.len, &st, state->base_dir_len)) {
514
0
    const struct submodule *sub;
515
0
    unsigned changed = ie_match_stat(state->istate, ce, &st,
516
0
             CE_MATCH_IGNORE_VALID | CE_MATCH_IGNORE_SKIP_WORKTREE);
517
    /*
518
     * Needs to be checked before !changed returns early,
519
     * as the possibly empty directory was not changed
520
     */
521
0
    sub = submodule_from_ce(ce);
522
0
    if (sub) {
523
0
      int err;
524
0
      if (!is_submodule_populated_gently(ce->name, &err)) {
525
0
        struct stat sb;
526
0
        if (lstat(ce->name, &sb))
527
0
          die(_("could not stat file '%s'"), ce->name);
528
0
        if (!(st.st_mode & S_IFDIR))
529
0
          unlink_or_warn(ce->name);
530
531
0
        return submodule_move_head(ce->name, state->super_prefix,
532
0
          NULL, oid_to_hex(&ce->oid), 0);
533
0
      } else
534
0
        return submodule_move_head(ce->name, state->super_prefix,
535
0
          "HEAD", oid_to_hex(&ce->oid),
536
0
          state->force ? SUBMODULE_MOVE_HEAD_FORCE : 0);
537
0
    }
538
539
0
    if (!changed)
540
0
      return 0;
541
0
    if (!state->force) {
542
0
      if (!state->quiet)
543
0
        fprintf(stderr,
544
0
          "%s already exists, no checkout\n",
545
0
          path.buf);
546
0
      return -1;
547
0
    }
548
549
0
    if (state->clone)
550
0
      mark_colliding_entries(state, ce, &st);
551
552
    /*
553
     * We unlink the old file, to get the new one with the
554
     * right permissions (including umask, which is nasty
555
     * to emulate by hand - much easier to let the system
556
     * just do the right thing)
557
     */
558
0
    if (S_ISDIR(st.st_mode)) {
559
      /* If it is a gitlink, leave it alone! */
560
0
      if (S_ISGITLINK(ce->ce_mode))
561
0
        return 0;
562
      /*
563
       * We must avoid replacing submodules' leading
564
       * directories with symbolic links, lest recursive
565
       * clones can write into arbitrary locations.
566
       *
567
       * Technically, this logic is not limited
568
       * to recursive clones, or for that matter to
569
       * submodules' paths colliding with symbolic links'
570
       * paths. Yet it strikes a balance in favor of
571
       * simplicity, and if paths are colliding, we might
572
       * just as well keep the directories during a clone.
573
       */
574
0
      if (state->clone && S_ISLNK(ce->ce_mode))
575
0
        return 0;
576
0
      remove_subtree(&path);
577
0
    } else if (unlink(path.buf))
578
0
      return error_errno("unable to unlink old '%s'", path.buf);
579
0
  } else if (state->not_new)
580
0
    return 0;
581
582
0
  create_directories(path.buf, path.len, state);
583
584
0
  if (S_ISREG(ce->ce_mode) && !ca) {
585
0
    convert_attrs(state->istate, &ca_buf, ce->name);
586
0
    ca = &ca_buf;
587
0
  }
588
589
0
  if (!enqueue_checkout(ce, ca, nr_checkouts))
590
0
    return 0;
591
592
0
  return write_entry(ce, path.buf, ca, state, 0, nr_checkouts);
593
0
}
594
595
void unlink_entry(const struct cache_entry *ce, const char *super_prefix)
596
0
{
597
0
  const struct submodule *sub = submodule_from_ce(ce);
598
0
  if (sub) {
599
    /* state.force is set at the caller. */
600
0
    submodule_move_head(ce->name, super_prefix, "HEAD", NULL,
601
0
            SUBMODULE_MOVE_HEAD_FORCE);
602
0
  }
603
0
  if (check_leading_path(ce->name, ce_namelen(ce), 1) >= 0)
604
0
    return;
605
0
  if (remove_or_warn(ce->ce_mode, ce->name))
606
0
    return;
607
0
  schedule_dir_for_removal(ce->name, ce_namelen(ce));
608
0
}
609
610
/*
 * Remove 'file' with rmdir_or_warn() when 'mode' denotes a gitlink,
 * and with unlink_or_warn() otherwise; returns that helper's result.
 */
int remove_or_warn(unsigned int mode, const char *file)
{
  if (S_ISGITLINK(mode))
    return rmdir_or_warn(file);
  return unlink_or_warn(file);
}