1#include "cache.h"
2#include "blob.h"
3#include "dir.h"
4#include "streaming.h"
5#include "submodule.h"
6#include "progress.h"
7#include "fsmonitor.h"
8
9static void create_directories(const char *path, int path_len,
10 const struct checkout *state)
11{
12 char *buf = xmallocz(path_len);
13 int len = 0;
14
15 while (len < path_len) {
16 do {
17 buf[len] = path[len];
18 len++;
19 } while (len < path_len && path[len] != '/');
20 if (len >= path_len)
21 break;
22 buf[len] = 0;
23
24 /*
25 * For 'checkout-index --prefix=<dir>', <dir> is
26 * allowed to be a symlink to an existing directory,
27 * and we set 'state->base_dir_len' below, such that
28 * we test the path components of the prefix with the
29 * stat() function instead of the lstat() function.
30 */
31 if (has_dirs_only_path(buf, len, state->base_dir_len))
32 continue; /* ok, it is already a directory. */
33
34 /*
35 * If this mkdir() would fail, it could be that there
36 * is already a symlink or something else exists
37 * there, therefore we then try to unlink it and try
38 * one more time to create the directory.
39 */
40 if (mkdir(buf, 0777)) {
41 if (errno == EEXIST && state->force &&
42 !unlink_or_warn(buf) && !mkdir(buf, 0777))
43 continue;
44 die_errno("cannot create directory at '%s'", buf);
45 }
46 }
47 free(buf);
48}
49
50static void remove_subtree(struct strbuf *path)
51{
52 DIR *dir = opendir(path->buf);
53 struct dirent *de;
54 int origlen = path->len;
55
56 if (!dir)
57 die_errno("cannot opendir '%s'", path->buf);
58 while ((de = readdir(dir)) != NULL) {
59 struct stat st;
60
61 if (is_dot_or_dotdot(de->d_name))
62 continue;
63
64 strbuf_addch(path, '/');
65 strbuf_addstr(path, de->d_name);
66 if (lstat(path->buf, &st))
67 die_errno("cannot lstat '%s'", path->buf);
68 if (S_ISDIR(st.st_mode))
69 remove_subtree(path);
70 else if (unlink(path->buf))
71 die_errno("cannot unlink '%s'", path->buf);
72 strbuf_setlen(path, origlen);
73 }
74 closedir(dir);
75 if (rmdir(path->buf))
76 die_errno("cannot rmdir '%s'", path->buf);
77}
78
/*
 * Create a new file at 'path' for writing and return its descriptor
 * (or -1 on failure, as open() does). The file must not exist yet.
 *
 * Only the owner-execute bit of 'mode' is looked at: when set the
 * file is requested with 0777, otherwise with 0666.
 */
static int create_file(const char *path, unsigned int mode)
{
	unsigned int perm = 0666;

	if (mode & 0100)
		perm = 0777;
	return open(path, O_WRONLY | O_CREAT | O_EXCL, perm);
}
84
85static void *read_blob_entry(const struct cache_entry *ce, unsigned long *size)
86{
87 enum object_type type;
88 void *blob_data = read_object_file(&ce->oid, &type, size);
89
90 if (blob_data) {
91 if (type == OBJ_BLOB)
92 return blob_data;
93 free(blob_data);
94 }
95 return NULL;
96}
97
98static int open_output_fd(char *path, const struct cache_entry *ce, int to_tempfile)
99{
100 int symlink = (ce->ce_mode & S_IFMT) != S_IFREG;
101 if (to_tempfile) {
102 xsnprintf(path, TEMPORARY_FILENAME_LENGTH, "%s",
103 symlink ? ".merge_link_XXXXXX" : ".merge_file_XXXXXX");
104 return mkstemp(path);
105 } else {
106 return create_file(path, !symlink ? ce->ce_mode : 0666);
107 }
108}
109
110static int fstat_output(int fd, const struct checkout *state, struct stat *st)
111{
112 /* use fstat() only when path == ce->name */
113 if (fstat_is_reliable() &&
114 state->refresh_cache && !state->base_dir_len) {
115 fstat(fd, st);
116 return 1;
117 }
118 return 0;
119}
120
121static int streaming_write_entry(const struct cache_entry *ce, char *path,
122 struct stream_filter *filter,
123 const struct checkout *state, int to_tempfile,
124 int *fstat_done, struct stat *statbuf)
125{
126 int result = 0;
127 int fd;
128
129 fd = open_output_fd(path, ce, to_tempfile);
130 if (fd < 0)
131 return -1;
132
133 result |= stream_blob_to_fd(fd, &ce->oid, filter, 1);
134 *fstat_done = fstat_output(fd, state, statbuf);
135 result |= close(fd);
136
137 if (result)
138 unlink(path);
139 return result;
140}
141
142void enable_delayed_checkout(struct checkout *state)
143{
144 if (!state->delayed_checkout) {
145 state->delayed_checkout = xmalloc(sizeof(*state->delayed_checkout));
146 state->delayed_checkout->state = CE_CAN_DELAY;
147 string_list_init(&state->delayed_checkout->filters, 0);
148 string_list_init(&state->delayed_checkout->paths, 0);
149 }
150}
151
152static int remove_available_paths(struct string_list_item *item, void *cb_data)
153{
154 struct string_list *available_paths = cb_data;
155 struct string_list_item *available;
156
157 available = string_list_lookup(available_paths, item->string);
158 if (available)
159 available->util = (void *)item->string;
160 return !available;
161}
162
163int finish_delayed_checkout(struct checkout *state)
164{
165 int errs = 0;
166 unsigned delayed_object_count;
167 off_t filtered_bytes = 0;
168 struct string_list_item *filter, *path;
169 struct progress *progress;
170 struct delayed_checkout *dco = state->delayed_checkout;
171
172 if (!state->delayed_checkout)
173 return errs;
174
175 dco->state = CE_RETRY;
176 delayed_object_count = dco->paths.nr;
177 progress = start_delayed_progress(_("Filtering content"), delayed_object_count);
178 while (dco->filters.nr > 0) {
179 for_each_string_list_item(filter, &dco->filters) {
180 struct string_list available_paths = STRING_LIST_INIT_NODUP;
181 display_progress(progress, delayed_object_count - dco->paths.nr);
182
183 if (!async_query_available_blobs(filter->string, &available_paths)) {
184 /* Filter reported an error */
185 errs = 1;
186 filter->string = "";
187 continue;
188 }
189 if (available_paths.nr <= 0) {
190 /*
191 * Filter responded with no entries. That means
192 * the filter is done and we can remove the
193 * filter from the list (see
194 * "string_list_remove_empty_items" call below).
195 */
196 filter->string = "";
197 continue;
198 }
199
200 /*
201 * In dco->paths we store a list of all delayed paths.
202 * The filter just send us a list of available paths.
203 * Remove them from the list.
204 */
205 filter_string_list(&dco->paths, 0,
206 &remove_available_paths, &available_paths);
207
208 for_each_string_list_item(path, &available_paths) {
209 struct cache_entry* ce;
210
211 if (!path->util) {
212 error("external filter '%s' signaled that '%s' "
213 "is now available although it has not been "
214 "delayed earlier",
215 filter->string, path->string);
216 errs |= 1;
217
218 /*
219 * Do not ask the filter for available blobs,
220 * again, as the filter is likely buggy.
221 */
222 filter->string = "";
223 continue;
224 }
225 ce = index_file_exists(state->istate, path->string,
226 strlen(path->string), 0);
227 if (ce) {
228 errs |= checkout_entry(ce, state, NULL);
229 filtered_bytes += ce->ce_stat_data.sd_size;
230 display_throughput(progress, filtered_bytes);
231 } else
232 errs = 1;
233 }
234 }
235 string_list_remove_empty_items(&dco->filters, 0);
236 }
237 stop_progress(&progress);
238 string_list_clear(&dco->filters, 0);
239
240 /* At this point we should not have any delayed paths anymore. */
241 errs |= dco->paths.nr;
242 for_each_string_list_item(path, &dco->paths) {
243 error("'%s' was not filtered properly", path->string);
244 }
245 string_list_clear(&dco->paths, 0);
246
247 free(dco);
248 state->delayed_checkout = NULL;
249
250 return errs;
251}
252
253static int write_entry(struct cache_entry *ce,
254 char *path, const struct checkout *state, int to_tempfile)
255{
256 unsigned int ce_mode_s_ifmt = ce->ce_mode & S_IFMT;
257 struct delayed_checkout *dco = state->delayed_checkout;
258 int fd, ret, fstat_done = 0;
259 char *new_blob;
260 struct strbuf buf = STRBUF_INIT;
261 unsigned long size;
262 ssize_t wrote;
263 size_t newsize = 0;
264 struct stat st;
265 const struct submodule *sub;
266
267 if (ce_mode_s_ifmt == S_IFREG) {
268 struct stream_filter *filter = get_stream_filter(ce->name,
269 ce->oid.hash);
270 if (filter &&
271 !streaming_write_entry(ce, path, filter,
272 state, to_tempfile,
273 &fstat_done, &st))
274 goto finish;
275 }
276
277 switch (ce_mode_s_ifmt) {
278 case S_IFLNK:
279 new_blob = read_blob_entry(ce, &size);
280 if (!new_blob)
281 return error("unable to read sha1 file of %s (%s)",
282 path, oid_to_hex(&ce->oid));
283
284 /*
285 * We can't make a real symlink; write out a regular file entry
286 * with the symlink destination as its contents.
287 */
288 if (!has_symlinks || to_tempfile)
289 goto write_file_entry;
290
291 ret = symlink(new_blob, path);
292 free(new_blob);
293 if (ret)
294 return error_errno("unable to create symlink %s", path);
295 break;
296
297 case S_IFREG:
298 /*
299 * We do not send the blob in case of a retry, so do not
300 * bother reading it at all.
301 */
302 if (dco && dco->state == CE_RETRY) {
303 new_blob = NULL;
304 size = 0;
305 } else {
306 new_blob = read_blob_entry(ce, &size);
307 if (!new_blob)
308 return error("unable to read sha1 file of %s (%s)",
309 path, oid_to_hex(&ce->oid));
310 }
311
312 /*
313 * Convert from git internal format to working tree format
314 */
315 if (dco && dco->state != CE_NO_DELAY) {
316 ret = async_convert_to_working_tree(ce->name, new_blob,
317 size, &buf, dco);
318 if (ret && string_list_has_string(&dco->paths, ce->name)) {
319 free(new_blob);
320 goto delayed;
321 }
322 } else
323 ret = convert_to_working_tree(ce->name, new_blob, size, &buf);
324
325 if (ret) {
326 free(new_blob);
327 new_blob = strbuf_detach(&buf, &newsize);
328 size = newsize;
329 }
330 /*
331 * No "else" here as errors from convert are OK at this
332 * point. If the error would have been fatal (e.g.
333 * filter is required), then we would have died already.
334 */
335
336 write_file_entry:
337 fd = open_output_fd(path, ce, to_tempfile);
338 if (fd < 0) {
339 free(new_blob);
340 return error_errno("unable to create file %s", path);
341 }
342
343 wrote = write_in_full(fd, new_blob, size);
344 if (!to_tempfile)
345 fstat_done = fstat_output(fd, state, &st);
346 close(fd);
347 free(new_blob);
348 if (wrote < 0)
349 return error("unable to write file %s", path);
350 break;
351
352 case S_IFGITLINK:
353 if (to_tempfile)
354 return error("cannot create temporary submodule %s", path);
355 if (mkdir(path, 0777) < 0)
356 return error("cannot create submodule directory %s", path);
357 sub = submodule_from_ce(ce);
358 if (sub)
359 return submodule_move_head(ce->name,
360 NULL, oid_to_hex(&ce->oid),
361 state->force ? SUBMODULE_MOVE_HEAD_FORCE : 0);
362 break;
363
364 default:
365 return error("unknown file mode for %s in index", path);
366 }
367
368finish:
369 if (state->refresh_cache) {
370 assert(state->istate);
371 if (!fstat_done)
372 if (lstat(ce->name, &st) < 0)
373 return error_errno("unable to stat just-written file %s",
374 ce->name);
375 fill_stat_cache_info(ce, &st);
376 ce->ce_flags |= CE_UPDATE_IN_BASE;
377 mark_fsmonitor_invalid(state->istate, ce);
378 state->istate->cache_changed |= CE_ENTRY_CHANGED;
379 }
380delayed:
381 return 0;
382}
383
/*
 * Like lstat(), but fails with ENOENT instead of following a symlink
 * in any leading directory component of 'path'. The first 'skiplen'
 * bytes of 'path' are exempt from that restriction.
 */
static int check_path(const char *path, int len, struct stat *st, int skiplen)
{
	const char *dir_end = path + len;

	/* Back up to the last '/', i.e. the end of the directory part. */
	while (dir_end > path && *dir_end != '/')
		dir_end--;

	if (has_dirs_only_path(path, dir_end - path, skiplen))
		return lstat(path, st);

	errno = ENOENT;
	return -1;
}
400
401/*
402 * Write the contents from ce out to the working tree.
403 *
404 * When topath[] is not NULL, instead of writing to the working tree
405 * file named by ce, a temporary file is created by this function and
406 * its name is returned in topath[], which must be able to hold at
407 * least TEMPORARY_FILENAME_LENGTH bytes long.
408 */
409int checkout_entry(struct cache_entry *ce,
410 const struct checkout *state, char *topath)
411{
412 static struct strbuf path = STRBUF_INIT;
413 struct stat st;
414
415 if (topath)
416 return write_entry(ce, topath, state, 1);
417
418 strbuf_reset(&path);
419 strbuf_add(&path, state->base_dir, state->base_dir_len);
420 strbuf_add(&path, ce->name, ce_namelen(ce));
421
422 if (!check_path(path.buf, path.len, &st, state->base_dir_len)) {
423 const struct submodule *sub;
424 unsigned changed = ce_match_stat(ce, &st, CE_MATCH_IGNORE_VALID|CE_MATCH_IGNORE_SKIP_WORKTREE);
425 /*
426 * Needs to be checked before !changed returns early,
427 * as the possibly empty directory was not changed
428 */
429 sub = submodule_from_ce(ce);
430 if (sub) {
431 int err;
432 if (!is_submodule_populated_gently(ce->name, &err)) {
433 struct stat sb;
434 if (lstat(ce->name, &sb))
435 die(_("could not stat file '%s'"), ce->name);
436 if (!(st.st_mode & S_IFDIR))
437 unlink_or_warn(ce->name);
438
439 return submodule_move_head(ce->name,
440 NULL, oid_to_hex(&ce->oid), 0);
441 } else
442 return submodule_move_head(ce->name,
443 "HEAD", oid_to_hex(&ce->oid),
444 state->force ? SUBMODULE_MOVE_HEAD_FORCE : 0);
445 }
446
447 if (!changed)
448 return 0;
449 if (!state->force) {
450 if (!state->quiet)
451 fprintf(stderr,
452 "%s already exists, no checkout\n",
453 path.buf);
454 return -1;
455 }
456
457 /*
458 * We unlink the old file, to get the new one with the
459 * right permissions (including umask, which is nasty
460 * to emulate by hand - much easier to let the system
461 * just do the right thing)
462 */
463 if (S_ISDIR(st.st_mode)) {
464 /* If it is a gitlink, leave it alone! */
465 if (S_ISGITLINK(ce->ce_mode))
466 return 0;
467 if (!state->force)
468 return error("%s is a directory", path.buf);
469 remove_subtree(&path);
470 } else if (unlink(path.buf))
471 return error_errno("unable to unlink old '%s'", path.buf);
472 } else if (state->not_new)
473 return 0;
474
475 create_directories(path.buf, path.len, state);
476 return write_entry(ce, path.buf, state, 0);
477}