1 #define USE_THE_REPOSITORY_VARIABLE
3 #include "git-compat-util.h"
4 #include "object-store-ll.h"
6 #include "environment.h"
10 #include "sparse-index.h"
11 #include "streaming.h"
12 #include "submodule.h"
15 #include "fsmonitor.h"
17 #include "parallel-checkout.h"
19 static void create_directories(const char *path
, int path_len
,
20 const struct checkout
*state
)
22 char *buf
= xmallocz(path_len
);
25 while (len
< path_len
) {
29 } while (len
< path_len
&& path
[len
] != '/');
35 * For 'checkout-index --prefix=<dir>', <dir> is
36 * allowed to be a symlink to an existing directory,
37 * and we set 'state->base_dir_len' below, such that
38 * we test the path components of the prefix with the
39 * stat() function instead of the lstat() function.
41 if (has_dirs_only_path(buf
, len
, state
->base_dir_len
))
42 continue; /* ok, it is already a directory. */
45 * If this mkdir() would fail, it could be that there
46 * is already a symlink or something else exists
47 * there, therefore we then try to unlink it and try
48 * one more time to create the directory.
50 if (mkdir(buf
, 0777)) {
51 if (errno
== EEXIST
&& state
->force
&&
52 !unlink_or_warn(buf
) && !mkdir(buf
, 0777))
54 die_errno("cannot create directory at '%s'", buf
);
60 static void remove_subtree(struct strbuf
*path
)
62 DIR *dir
= opendir(path
->buf
);
64 int origlen
= path
->len
;
67 die_errno("cannot opendir '%s'", path
->buf
);
68 while ((de
= readdir_skip_dot_and_dotdot(dir
)) != NULL
) {
71 strbuf_addch(path
, '/');
72 strbuf_addstr(path
, de
->d_name
);
73 if (lstat(path
->buf
, &st
))
74 die_errno("cannot lstat '%s'", path
->buf
);
75 if (S_ISDIR(st
.st_mode
))
77 else if (unlink(path
->buf
))
78 die_errno("cannot unlink '%s'", path
->buf
);
79 strbuf_setlen(path
, origlen
);
83 die_errno("cannot rmdir '%s'", path
->buf
);
/*
 * Create "path" for writing and return the new file descriptor, or the
 * negative result of open() on failure.  O_EXCL makes the call fail if
 * the path already exists.
 *
 * Only the owner-execute bit (0100) of "mode" is looked at: the file is
 * requested with 0777 when it is set and with 0666 otherwise.
 */
static int create_file(const char *path, unsigned int mode)
{
	unsigned int perm = 0666;

	if (mode & 0100)
		perm = 0777;
	return open(path, O_WRONLY | O_CREAT | O_EXCL, perm);
}
92 void *read_blob_entry(const struct cache_entry
*ce
, size_t *size
)
94 enum object_type type
;
96 void *blob_data
= repo_read_object_file(the_repository
, &ce
->oid
,
101 if (type
== OBJ_BLOB
)
108 static int open_output_fd(char *path
, const struct cache_entry
*ce
, int to_tempfile
)
110 int symlink
= (ce
->ce_mode
& S_IFMT
) != S_IFREG
;
112 xsnprintf(path
, TEMPORARY_FILENAME_LENGTH
, "%s",
113 symlink
? ".merge_link_XXXXXX" : ".merge_file_XXXXXX");
114 return mkstemp(path
);
116 return create_file(path
, !symlink
? ce
->ce_mode
: 0666);
120 int fstat_checkout_output(int fd
, const struct checkout
*state
, struct stat
*st
)
122 /* use fstat() only when path == ce->name */
123 if (fstat_is_reliable() &&
124 state
->refresh_cache
&& !state
->base_dir_len
) {
125 return !fstat(fd
, st
);
130 static int streaming_write_entry(const struct cache_entry
*ce
, char *path
,
131 struct stream_filter
*filter
,
132 const struct checkout
*state
, int to_tempfile
,
133 int *fstat_done
, struct stat
*statbuf
)
138 fd
= open_output_fd(path
, ce
, to_tempfile
);
142 result
|= stream_blob_to_fd(fd
, &ce
->oid
, filter
, 1);
143 *fstat_done
= fstat_checkout_output(fd
, state
, statbuf
);
151 void enable_delayed_checkout(struct checkout
*state
)
153 if (!state
->delayed_checkout
) {
154 state
->delayed_checkout
= xmalloc(sizeof(*state
->delayed_checkout
));
155 state
->delayed_checkout
->state
= CE_CAN_DELAY
;
156 string_list_init_nodup(&state
->delayed_checkout
->filters
);
157 string_list_init_nodup(&state
->delayed_checkout
->paths
);
161 static int remove_available_paths(struct string_list_item
*item
, void *cb_data
)
163 struct string_list
*available_paths
= cb_data
;
164 struct string_list_item
*available
;
166 available
= string_list_lookup(available_paths
, item
->string
);
168 available
->util
= item
->util
;
172 static int string_is_not_null(struct string_list_item
*item
, void *data UNUSED
)
174 return !!item
->string
;
177 int finish_delayed_checkout(struct checkout
*state
, int show_progress
)
180 unsigned processed_paths
= 0;
181 off_t filtered_bytes
= 0;
182 struct string_list_item
*filter
, *path
;
183 struct progress
*progress
= NULL
;
184 struct delayed_checkout
*dco
= state
->delayed_checkout
;
186 if (!state
->delayed_checkout
)
189 dco
->state
= CE_RETRY
;
191 progress
= start_delayed_progress(_("Filtering content"), dco
->paths
.nr
);
192 while (dco
->filters
.nr
> 0) {
193 for_each_string_list_item(filter
, &dco
->filters
) {
194 struct string_list available_paths
= STRING_LIST_INIT_DUP
;
196 if (!async_query_available_blobs(filter
->string
, &available_paths
)) {
197 /* Filter reported an error */
199 filter
->string
= NULL
;
202 if (available_paths
.nr
<= 0) {
204 * Filter responded with no entries. That means
205 * the filter is done and we can remove the
206 * filter from the list (see
207 * "string_list_remove_empty_items" call below).
209 filter
->string
= NULL
;
214 * In dco->paths we store a list of all delayed paths.
215 * The filter just send us a list of available paths.
216 * Remove them from the list.
218 filter_string_list(&dco
->paths
, 0,
219 &remove_available_paths
, &available_paths
);
221 for_each_string_list_item(path
, &available_paths
) {
222 struct cache_entry
* ce
;
225 error("external filter '%s' signaled that '%s' "
226 "is now available although it has not been "
228 filter
->string
, path
->string
);
232 * Do not ask the filter for available blobs,
233 * again, as the filter is likely buggy.
235 filter
->string
= NULL
;
238 ce
= index_file_exists(state
->istate
, path
->string
,
239 strlen(path
->string
), 0);
241 display_progress(progress
, ++processed_paths
);
242 errs
|= checkout_entry(ce
, state
, NULL
, path
->util
);
243 filtered_bytes
+= ce
->ce_stat_data
.sd_size
;
244 display_throughput(progress
, filtered_bytes
);
249 string_list_clear(&available_paths
, 0);
252 filter_string_list(&dco
->filters
, 0, string_is_not_null
, NULL
);
254 stop_progress(&progress
);
255 string_list_clear(&dco
->filters
, 0);
257 /* At this point we should not have any delayed paths anymore. */
258 errs
|= dco
->paths
.nr
;
259 for_each_string_list_item(path
, &dco
->paths
) {
260 error("'%s' was not filtered properly", path
->string
);
262 string_list_clear(&dco
->paths
, 0);
265 state
->delayed_checkout
= NULL
;
270 void update_ce_after_write(const struct checkout
*state
, struct cache_entry
*ce
,
273 if (state
->refresh_cache
) {
274 assert(state
->istate
);
275 fill_stat_cache_info(state
->istate
, ce
, st
);
276 ce
->ce_flags
|= CE_UPDATE_IN_BASE
;
277 mark_fsmonitor_invalid(state
->istate
, ce
);
278 state
->istate
->cache_changed
|= CE_ENTRY_CHANGED
;
282 /* Note: ca is used (and required) iff the entry refers to a regular file. */
283 static int write_entry(struct cache_entry
*ce
, char *path
, struct conv_attrs
*ca
,
284 const struct checkout
*state
, int to_tempfile
,
287 unsigned int ce_mode_s_ifmt
= ce
->ce_mode
& S_IFMT
;
288 struct delayed_checkout
*dco
= state
->delayed_checkout
;
289 int fd
, ret
, fstat_done
= 0;
291 struct strbuf buf
= STRBUF_INIT
;
296 const struct submodule
*sub
;
297 struct checkout_metadata meta
;
298 static int scratch_nr_checkouts
;
300 clone_checkout_metadata(&meta
, &state
->meta
, &ce
->oid
);
302 if (ce_mode_s_ifmt
== S_IFREG
) {
303 struct stream_filter
*filter
= get_stream_filter_ca(ca
, &ce
->oid
);
305 !streaming_write_entry(ce
, path
, filter
,
311 switch (ce_mode_s_ifmt
) {
313 new_blob
= read_blob_entry(ce
, &size
);
315 return error("unable to read sha1 file of %s (%s)",
316 ce
->name
, oid_to_hex(&ce
->oid
));
319 * We can't make a real symlink; write out a regular file entry
320 * with the symlink destination as its contents.
322 if (!has_symlinks
|| to_tempfile
)
323 goto write_file_entry
;
325 ret
= symlink(new_blob
, path
);
328 return error_errno("unable to create symlink %s", path
);
333 * We do not send the blob in case of a retry, so do not
334 * bother reading it at all.
336 if (dco
&& dco
->state
== CE_RETRY
) {
340 new_blob
= read_blob_entry(ce
, &size
);
342 return error("unable to read sha1 file of %s (%s)",
343 ce
->name
, oid_to_hex(&ce
->oid
));
347 * Convert from git internal format to working tree format
349 if (dco
&& dco
->state
!= CE_NO_DELAY
) {
350 ret
= async_convert_to_working_tree_ca(ca
, ce
->name
,
354 struct string_list_item
*item
=
355 string_list_lookup(&dco
->paths
, ce
->name
);
357 item
->util
= nr_checkouts
? nr_checkouts
358 : &scratch_nr_checkouts
;
364 ret
= convert_to_working_tree_ca(ca
, ce
->name
, new_blob
,
370 new_blob
= strbuf_detach(&buf
, &newsize
);
374 * No "else" here as errors from convert are OK at this
375 * point. If the error would have been fatal (e.g.
376 * filter is required), then we would have died already.
380 fd
= open_output_fd(path
, ce
, to_tempfile
);
383 return error_errno("unable to create file %s", path
);
386 wrote
= write_in_full(fd
, new_blob
, size
);
388 fstat_done
= fstat_checkout_output(fd
, state
, &st
);
392 return error("unable to write file %s", path
);
397 return error("cannot create temporary submodule %s", ce
->name
);
398 if (mkdir(path
, 0777) < 0)
399 return error("cannot create submodule directory %s", path
);
400 sub
= submodule_from_ce(ce
);
402 return submodule_move_head(ce
->name
, state
->super_prefix
,
403 NULL
, oid_to_hex(&ce
->oid
),
404 state
->force
? SUBMODULE_MOVE_HEAD_FORCE
: 0);
408 return error("unknown file mode for %s in index", ce
->name
);
412 if (state
->refresh_cache
) {
413 if (!fstat_done
&& lstat(ce
->name
, &st
) < 0)
414 return error_errno("unable to stat just-written file %s",
416 update_ce_after_write(state
, ce
, &st
);
/*
 * This is like 'lstat()', except it refuses to follow symlinks
 * in the path, after skipping "skiplen".
 *
 * The part of "path" in front of its last '/' is checked with
 * has_dirs_only_path(); when that check fails, errno is set to
 * ENOENT and -1 is returned without calling lstat().
 */
static int check_path(const char *path, int len, struct stat *st, int skiplen)
{
	const char *end = path + len;

	/* Step back to the last '/', or to the start if there is none. */
	for (; path < end && *end != '/'; end--)
		; /* nothing */

	if (has_dirs_only_path(path, end - path, skiplen))
		return lstat(path, st);

	errno = ENOENT;
	return -1;
}
441 static void mark_colliding_entries(const struct checkout
*state
,
442 struct cache_entry
*ce
, struct stat
*st
)
444 int i
, trust_ino
= check_stat
;
446 #if defined(GIT_WINDOWS_NATIVE) || defined(__CYGWIN__)
450 ce
->ce_flags
|= CE_MATCHED
;
452 /* TODO: audit for interaction with sparse-index. */
453 ensure_full_index(state
->istate
);
454 for (i
= 0; i
< state
->istate
->cache_nr
; i
++) {
455 struct cache_entry
*dup
= state
->istate
->cache
[i
];
459 * Parallel checkout doesn't create the files in index
460 * order. So the other side of the collision may appear
461 * after the given cache_entry in the array.
463 if (parallel_checkout_status() == PC_RUNNING
)
469 if (dup
->ce_flags
& (CE_MATCHED
| CE_VALID
| CE_SKIP_WORKTREE
))
472 if ((trust_ino
&& !match_stat_data(&dup
->ce_stat_data
, st
)) ||
473 paths_collide(ce
->name
, dup
->name
)) {
474 dup
->ce_flags
|= CE_MATCHED
;
480 int checkout_entry_ca(struct cache_entry
*ce
, struct conv_attrs
*ca
,
481 const struct checkout
*state
, char *topath
,
484 static struct strbuf path
= STRBUF_INIT
;
486 struct conv_attrs ca_buf
;
488 if (ce
->ce_flags
& CE_WT_REMOVE
) {
491 * No content and thus no path to create, so we have
492 * no pathname to return.
494 BUG("Can't remove entry to a path");
495 unlink_entry(ce
, state
->super_prefix
);
500 if (S_ISREG(ce
->ce_mode
) && !ca
) {
501 convert_attrs(state
->istate
, &ca_buf
, ce
->name
);
504 return write_entry(ce
, topath
, ca
, state
, 1, nr_checkouts
);
508 strbuf_add(&path
, state
->base_dir
, state
->base_dir_len
);
509 strbuf_add(&path
, ce
->name
, ce_namelen(ce
));
511 if (!check_path(path
.buf
, path
.len
, &st
, state
->base_dir_len
)) {
512 const struct submodule
*sub
;
513 unsigned changed
= ie_match_stat(state
->istate
, ce
, &st
,
514 CE_MATCH_IGNORE_VALID
| CE_MATCH_IGNORE_SKIP_WORKTREE
);
516 * Needs to be checked before !changed returns early,
517 * as the possibly empty directory was not changed
519 sub
= submodule_from_ce(ce
);
522 if (!is_submodule_populated_gently(ce
->name
, &err
)) {
524 if (lstat(ce
->name
, &sb
))
525 die(_("could not stat file '%s'"), ce
->name
);
526 if (!(st
.st_mode
& S_IFDIR
))
527 unlink_or_warn(ce
->name
);
529 return submodule_move_head(ce
->name
, state
->super_prefix
,
530 NULL
, oid_to_hex(&ce
->oid
), 0);
532 return submodule_move_head(ce
->name
, state
->super_prefix
,
533 "HEAD", oid_to_hex(&ce
->oid
),
534 state
->force
? SUBMODULE_MOVE_HEAD_FORCE
: 0);
542 "%s already exists, no checkout\n",
548 mark_colliding_entries(state
, ce
, &st
);
551 * We unlink the old file, to get the new one with the
552 * right permissions (including umask, which is nasty
553 * to emulate by hand - much easier to let the system
554 * just do the right thing)
556 if (S_ISDIR(st
.st_mode
)) {
557 /* If it is a gitlink, leave it alone! */
558 if (S_ISGITLINK(ce
->ce_mode
))
561 * We must avoid replacing submodules' leading
562 * directories with symbolic links, lest recursive
563 * clones can write into arbitrary locations.
565 * Technically, this logic is not limited
566 * to recursive clones, or for that matter to
567 * submodules' paths colliding with symbolic links'
568 * paths. Yet it strikes a balance in favor of
569 * simplicity, and if paths are colliding, we might
570 * just as well keep the directories during a clone.
572 if (state
->clone
&& S_ISLNK(ce
->ce_mode
))
574 remove_subtree(&path
);
575 } else if (unlink(path
.buf
))
576 return error_errno("unable to unlink old '%s'", path
.buf
);
577 } else if (state
->not_new
)
580 create_directories(path
.buf
, path
.len
, state
);
582 if (S_ISREG(ce
->ce_mode
) && !ca
) {
583 convert_attrs(state
->istate
, &ca_buf
, ce
->name
);
587 if (!enqueue_checkout(ce
, ca
, nr_checkouts
))
590 return write_entry(ce
, path
.buf
, ca
, state
, 0, nr_checkouts
);
593 void unlink_entry(const struct cache_entry
*ce
, const char *super_prefix
)
595 const struct submodule
*sub
= submodule_from_ce(ce
);
597 /* state.force is set at the caller. */
598 submodule_move_head(ce
->name
, super_prefix
, "HEAD", NULL
,
599 SUBMODULE_MOVE_HEAD_FORCE
);
601 if (check_leading_path(ce
->name
, ce_namelen(ce
), 1) >= 0)
603 if (remove_or_warn(ce
->ce_mode
, ce
->name
))
605 schedule_dir_for_removal(ce
->name
, ce_namelen(ce
));
/*
 * Remove "file" according to the entry mode "mode": a gitlink is
 * removed with rmdir_or_warn(), anything else with unlink_or_warn().
 * Returns what the helper that was called returns.
 */
int remove_or_warn(unsigned int mode, const char *file)
{
	if (S_ISGITLINK(mode))
		return rmdir_or_warn(file);
	return unlink_or_warn(file);
}