ls-files -i: pay attention to exclusion of leading paths
[git] / builtin / ls-files.c
1 /*
2  * This merges the file listing in the directory cache index
3  * with the actual working directory list, and shows different
4  * combinations of the two.
5  *
6  * Copyright (C) Linus Torvalds, 2005
7  */
8 #include "cache.h"
9 #include "quote.h"
10 #include "dir.h"
11 #include "builtin.h"
12 #include "tree.h"
13 #include "parse-options.h"
14 #include "resolve-undo.h"
15 #include "string-list.h"
16
/* Which categories of entries to list; set from the command line. */
static int show_cached;
static int show_deleted;
static int show_modified;
static int show_others;
static int show_killed;
static int show_stage;
static int show_unmerged;
static int show_resolve_undo;

/* Output formatting. */
static int abbrev;			/* handed to find_unique_abbrev() */
static int show_valid_bit;		/* -v: alter the tag of CE_VALID entries */
static int line_terminator = '\n';	/* -z switches this to NUL */
static int debug_mode;			/* --debug: dump stat data per entry */

/* Path limiting. */
static const char *prefix;		/* prefix passed to cmd_ls_files() */
static int prefix_len;			/* strlen(prefix); --full-name overrides it */
static int max_prefix_len;		/* length of the pathspecs' common prefix */
static const char **pathspec;
static int error_unmatch;
static char *ps_matched;		/* allocated only for --error-unmatch */
static const char *with_tree;
static int exc_given;			/* set once any exclude source is given */

/*
 * Per-category line tags.  They stay empty unless -t or -v is given,
 * in which case cmd_ls_files() installs the two-character forms.
 */
static const char *tag_cached = "";
static const char *tag_unmerged = "";
static const char *tag_removed = "";
static const char *tag_modified = "";
static const char *tag_other = "";
static const char *tag_killed = "";
static const char *tag_skip_worktree = "";
static const char *tag_resolve_undo = "";
47
48 static void write_name(const char* name, size_t len)
49 {
50         write_name_quoted_relative(name, len, prefix, prefix_len, stdout,
51                         line_terminator);
52 }
53
54 static void show_dir_entry(const char *tag, struct dir_entry *ent)
55 {
56         int len = max_prefix_len;
57
58         if (len >= ent->len)
59                 die("git ls-files: internal error - directory entry not superset of prefix");
60
61         if (!match_pathspec(pathspec, ent->name, ent->len, len, ps_matched))
62                 return;
63
64         fputs(tag, stdout);
65         write_name(ent->name, ent->len);
66 }
67
68 static void show_other_files(struct dir_struct *dir)
69 {
70         int i;
71
72         for (i = 0; i < dir->nr; i++) {
73                 struct dir_entry *ent = dir->entries[i];
74                 if (!cache_name_is_other(ent->name, ent->len))
75                         continue;
76                 show_dir_entry(tag_other, ent);
77         }
78 }
79
80 static void show_killed_files(struct dir_struct *dir)
81 {
82         int i;
83         for (i = 0; i < dir->nr; i++) {
84                 struct dir_entry *ent = dir->entries[i];
85                 char *cp, *sp;
86                 int pos, len, killed = 0;
87
88                 for (cp = ent->name; cp - ent->name < ent->len; cp = sp + 1) {
89                         sp = strchr(cp, '/');
90                         if (!sp) {
91                                 /* If ent->name is prefix of an entry in the
92                                  * cache, it will be killed.
93                                  */
94                                 pos = cache_name_pos(ent->name, ent->len);
95                                 if (0 <= pos)
96                                         die("bug in show-killed-files");
97                                 pos = -pos - 1;
98                                 while (pos < active_nr &&
99                                        ce_stage(active_cache[pos]))
100                                         pos++; /* skip unmerged */
101                                 if (active_nr <= pos)
102                                         break;
103                                 /* pos points at a name immediately after
104                                  * ent->name in the cache.  Does it expect
105                                  * ent->name to be a directory?
106                                  */
107                                 len = ce_namelen(active_cache[pos]);
108                                 if ((ent->len < len) &&
109                                     !strncmp(active_cache[pos]->name,
110                                              ent->name, ent->len) &&
111                                     active_cache[pos]->name[ent->len] == '/')
112                                         killed = 1;
113                                 break;
114                         }
115                         if (0 <= cache_name_pos(ent->name, sp - ent->name)) {
116                                 /* If any of the leading directories in
117                                  * ent->name is registered in the cache,
118                                  * ent->name will be killed.
119                                  */
120                                 killed = 1;
121                                 break;
122                         }
123                 }
124                 if (killed)
125                         show_dir_entry(tag_killed, dir->entries[i]);
126         }
127 }
128
129 static void show_ce_entry(const char *tag, struct cache_entry *ce)
130 {
131         int len = max_prefix_len;
132
133         if (len >= ce_namelen(ce))
134                 die("git ls-files: internal error - cache entry not superset of prefix");
135
136         if (!match_pathspec(pathspec, ce->name, ce_namelen(ce), len, ps_matched))
137                 return;
138
139         if (tag && *tag && show_valid_bit &&
140             (ce->ce_flags & CE_VALID)) {
141                 static char alttag[4];
142                 memcpy(alttag, tag, 3);
143                 if (isalpha(tag[0]))
144                         alttag[0] = tolower(tag[0]);
145                 else if (tag[0] == '?')
146                         alttag[0] = '!';
147                 else {
148                         alttag[0] = 'v';
149                         alttag[1] = tag[0];
150                         alttag[2] = ' ';
151                         alttag[3] = 0;
152                 }
153                 tag = alttag;
154         }
155
156         if (!show_stage) {
157                 fputs(tag, stdout);
158         } else {
159                 printf("%s%06o %s %d\t",
160                        tag,
161                        ce->ce_mode,
162                        find_unique_abbrev(ce->sha1,abbrev),
163                        ce_stage(ce));
164         }
165         write_name(ce->name, ce_namelen(ce));
166         if (debug_mode) {
167                 printf("  ctime: %d:%d\n", ce->ce_ctime.sec, ce->ce_ctime.nsec);
168                 printf("  mtime: %d:%d\n", ce->ce_mtime.sec, ce->ce_mtime.nsec);
169                 printf("  dev: %d\tino: %d\n", ce->ce_dev, ce->ce_ino);
170                 printf("  uid: %d\tgid: %d\n", ce->ce_uid, ce->ce_gid);
171                 printf("  size: %d\tflags: %x\n", ce->ce_size, ce->ce_flags);
172         }
173 }
174
175 static void show_ru_info(void)
176 {
177         struct string_list_item *item;
178
179         if (!the_index.resolve_undo)
180                 return;
181
182         for_each_string_list_item(item, the_index.resolve_undo) {
183                 const char *path = item->string;
184                 struct resolve_undo_info *ui = item->util;
185                 int i, len;
186
187                 len = strlen(path);
188                 if (len < max_prefix_len)
189                         continue; /* outside of the prefix */
190                 if (!match_pathspec(pathspec, path, len, max_prefix_len, ps_matched))
191                         continue; /* uninterested */
192                 for (i = 0; i < 3; i++) {
193                         if (!ui->mode[i])
194                                 continue;
195                         printf("%s%06o %s %d\t", tag_resolve_undo, ui->mode[i],
196                                find_unique_abbrev(ui->sha1[i], abbrev),
197                                i + 1);
198                         write_name(path, len);
199                 }
200         }
201 }
202
203 static void show_files(struct dir_struct *dir)
204 {
205         int i;
206         struct path_exclude_check check;
207
208         if ((dir->flags & DIR_SHOW_IGNORED))
209                 path_exclude_check_init(&check, dir);
210
211         /* For cached/deleted files we don't need to even do the readdir */
212         if (show_others || show_killed) {
213                 fill_directory(dir, pathspec);
214                 if (show_others)
215                         show_other_files(dir);
216                 if (show_killed)
217                         show_killed_files(dir);
218         }
219         if (show_cached | show_stage) {
220                 for (i = 0; i < active_nr; i++) {
221                         struct cache_entry *ce = active_cache[i];
222                         if ((dir->flags & DIR_SHOW_IGNORED) &&
223                             !path_excluded(&check, ce))
224                                 continue;
225                         if (show_unmerged && !ce_stage(ce))
226                                 continue;
227                         if (ce->ce_flags & CE_UPDATE)
228                                 continue;
229                         show_ce_entry(ce_stage(ce) ? tag_unmerged :
230                                 (ce_skip_worktree(ce) ? tag_skip_worktree : tag_cached), ce);
231                 }
232         }
233         if (show_deleted | show_modified) {
234                 for (i = 0; i < active_nr; i++) {
235                         struct cache_entry *ce = active_cache[i];
236                         struct stat st;
237                         int err;
238                         if ((dir->flags & DIR_SHOW_IGNORED) &&
239                             !path_excluded(&check, ce))
240                                 continue;
241                         if (ce->ce_flags & CE_UPDATE)
242                                 continue;
243                         if (ce_skip_worktree(ce))
244                                 continue;
245                         err = lstat(ce->name, &st);
246                         if (show_deleted && err)
247                                 show_ce_entry(tag_removed, ce);
248                         if (show_modified && ce_modified(ce, &st, 0))
249                                 show_ce_entry(tag_modified, ce);
250                 }
251         }
252
253         if ((dir->flags & DIR_SHOW_IGNORED))
254                 path_exclude_check_clear(&check);
255 }
256
257 /*
258  * Prune the index to only contain stuff starting with "prefix"
259  */
260 static void prune_cache(const char *prefix)
261 {
262         int pos = cache_name_pos(prefix, max_prefix_len);
263         unsigned int first, last;
264
265         if (pos < 0)
266                 pos = -pos-1;
267         memmove(active_cache, active_cache + pos,
268                 (active_nr - pos) * sizeof(struct cache_entry *));
269         active_nr -= pos;
270         first = 0;
271         last = active_nr;
272         while (last > first) {
273                 int next = (last + first) >> 1;
274                 struct cache_entry *ce = active_cache[next];
275                 if (!strncmp(ce->name, prefix, max_prefix_len)) {
276                         first = next+1;
277                         continue;
278                 }
279                 last = next;
280         }
281         active_nr = last;
282 }
283
284 static void strip_trailing_slash_from_submodules(void)
285 {
286         const char **p;
287
288         for (p = pathspec; *p != NULL; p++) {
289                 int len = strlen(*p), pos;
290
291                 if (len < 1 || (*p)[len - 1] != '/')
292                         continue;
293                 pos = cache_name_pos(*p, len - 1);
294                 if (pos >= 0 && S_ISGITLINK(active_cache[pos]->ce_mode))
295                         *p = xstrndup(*p, len - 1);
296         }
297 }
298
299 /*
300  * Read the tree specified with --with-tree option
301  * (typically, HEAD) into stage #1 and then
302  * squash them down to stage #0.  This is used for
303  * --error-unmatch to list and check the path patterns
304  * that were given from the command line.  We are not
305  * going to write this index out.
306  */
307 void overlay_tree_on_cache(const char *tree_name, const char *prefix)
308 {
309         struct tree *tree;
310         unsigned char sha1[20];
311         struct pathspec pathspec;
312         struct cache_entry *last_stage0 = NULL;
313         int i;
314
315         if (get_sha1(tree_name, sha1))
316                 die("tree-ish %s not found.", tree_name);
317         tree = parse_tree_indirect(sha1);
318         if (!tree)
319                 die("bad tree-ish %s", tree_name);
320
321         /* Hoist the unmerged entries up to stage #3 to make room */
322         for (i = 0; i < active_nr; i++) {
323                 struct cache_entry *ce = active_cache[i];
324                 if (!ce_stage(ce))
325                         continue;
326                 ce->ce_flags |= CE_STAGEMASK;
327         }
328
329         if (prefix) {
330                 static const char *(matchbuf[2]);
331                 matchbuf[0] = prefix;
332                 matchbuf[1] = NULL;
333                 init_pathspec(&pathspec, matchbuf);
334                 pathspec.items[0].use_wildcard = 0;
335         } else
336                 init_pathspec(&pathspec, NULL);
337         if (read_tree(tree, 1, &pathspec))
338                 die("unable to read tree entries %s", tree_name);
339
340         for (i = 0; i < active_nr; i++) {
341                 struct cache_entry *ce = active_cache[i];
342                 switch (ce_stage(ce)) {
343                 case 0:
344                         last_stage0 = ce;
345                         /* fallthru */
346                 default:
347                         continue;
348                 case 1:
349                         /*
350                          * If there is stage #0 entry for this, we do not
351                          * need to show it.  We use CE_UPDATE bit to mark
352                          * such an entry.
353                          */
354                         if (last_stage0 &&
355                             !strcmp(last_stage0->name, ce->name))
356                                 ce->ce_flags |= CE_UPDATE;
357                 }
358         }
359 }
360
361 int report_path_error(const char *ps_matched, const char **pathspec, const char *prefix)
362 {
363         /*
364          * Make sure all pathspec matched; otherwise it is an error.
365          */
366         struct strbuf sb = STRBUF_INIT;
367         const char *name;
368         int num, errors = 0;
369         for (num = 0; pathspec[num]; num++) {
370                 int other, found_dup;
371
372                 if (ps_matched[num])
373                         continue;
374                 /*
375                  * The caller might have fed identical pathspec
376                  * twice.  Do not barf on such a mistake.
377                  */
378                 for (found_dup = other = 0;
379                      !found_dup && pathspec[other];
380                      other++) {
381                         if (other == num || !ps_matched[other])
382                                 continue;
383                         if (!strcmp(pathspec[other], pathspec[num]))
384                                 /*
385                                  * Ok, we have a match already.
386                                  */
387                                 found_dup = 1;
388                 }
389                 if (found_dup)
390                         continue;
391
392                 name = quote_path_relative(pathspec[num], -1, &sb, prefix);
393                 error("pathspec '%s' did not match any file(s) known to git.",
394                       name);
395                 errors++;
396         }
397         strbuf_release(&sb);
398         return errors;
399 }
400
/* NULL-terminated usage synopsis handed to the option parser. */
static const char * const ls_files_usage[] = {
	"git ls-files [options] [<file>...]",
	NULL,
};
405
406 static int option_parse_z(const struct option *opt,
407                           const char *arg, int unset)
408 {
409         line_terminator = unset ? '\n' : '\0';
410
411         return 0;
412 }
413
414 static int option_parse_exclude(const struct option *opt,
415                                 const char *arg, int unset)
416 {
417         struct exclude_list *list = opt->value;
418
419         exc_given = 1;
420         add_exclude(arg, "", 0, list);
421
422         return 0;
423 }
424
425 static int option_parse_exclude_from(const struct option *opt,
426                                      const char *arg, int unset)
427 {
428         struct dir_struct *dir = opt->value;
429
430         exc_given = 1;
431         add_excludes_from_file(dir, arg);
432
433         return 0;
434 }
435
436 static int option_parse_exclude_standard(const struct option *opt,
437                                          const char *arg, int unset)
438 {
439         struct dir_struct *dir = opt->value;
440
441         exc_given = 1;
442         setup_standard_excludes(dir);
443
444         return 0;
445 }
446
447 int cmd_ls_files(int argc, const char **argv, const char *cmd_prefix)
448 {
449         int require_work_tree = 0, show_tag = 0;
450         const char *max_prefix;
451         struct dir_struct dir;
452         struct option builtin_ls_files_options[] = {
453                 { OPTION_CALLBACK, 'z', NULL, NULL, NULL,
454                         "paths are separated with NUL character",
455                         PARSE_OPT_NOARG, option_parse_z },
456                 OPT_BOOLEAN('t', NULL, &show_tag,
457                         "identify the file status with tags"),
458                 OPT_BOOLEAN('v', NULL, &show_valid_bit,
459                         "use lowercase letters for 'assume unchanged' files"),
460                 OPT_BOOLEAN('c', "cached", &show_cached,
461                         "show cached files in the output (default)"),
462                 OPT_BOOLEAN('d', "deleted", &show_deleted,
463                         "show deleted files in the output"),
464                 OPT_BOOLEAN('m', "modified", &show_modified,
465                         "show modified files in the output"),
466                 OPT_BOOLEAN('o', "others", &show_others,
467                         "show other files in the output"),
468                 OPT_BIT('i', "ignored", &dir.flags,
469                         "show ignored files in the output",
470                         DIR_SHOW_IGNORED),
471                 OPT_BOOLEAN('s', "stage", &show_stage,
472                         "show staged contents' object name in the output"),
473                 OPT_BOOLEAN('k', "killed", &show_killed,
474                         "show files on the filesystem that need to be removed"),
475                 OPT_BIT(0, "directory", &dir.flags,
476                         "show 'other' directories' name only",
477                         DIR_SHOW_OTHER_DIRECTORIES),
478                 OPT_NEGBIT(0, "empty-directory", &dir.flags,
479                         "don't show empty directories",
480                         DIR_HIDE_EMPTY_DIRECTORIES),
481                 OPT_BOOLEAN('u', "unmerged", &show_unmerged,
482                         "show unmerged files in the output"),
483                 OPT_BOOLEAN(0, "resolve-undo", &show_resolve_undo,
484                             "show resolve-undo information"),
485                 { OPTION_CALLBACK, 'x', "exclude", &dir.exclude_list[EXC_CMDL], "pattern",
486                         "skip files matching pattern",
487                         0, option_parse_exclude },
488                 { OPTION_CALLBACK, 'X', "exclude-from", &dir, "file",
489                         "exclude patterns are read from <file>",
490                         0, option_parse_exclude_from },
491                 OPT_STRING(0, "exclude-per-directory", &dir.exclude_per_dir, "file",
492                         "read additional per-directory exclude patterns in <file>"),
493                 { OPTION_CALLBACK, 0, "exclude-standard", &dir, NULL,
494                         "add the standard git exclusions",
495                         PARSE_OPT_NOARG, option_parse_exclude_standard },
496                 { OPTION_SET_INT, 0, "full-name", &prefix_len, NULL,
497                         "make the output relative to the project top directory",
498                         PARSE_OPT_NOARG | PARSE_OPT_NONEG, NULL },
499                 OPT_BOOLEAN(0, "error-unmatch", &error_unmatch,
500                         "if any <file> is not in the index, treat this as an error"),
501                 OPT_STRING(0, "with-tree", &with_tree, "tree-ish",
502                         "pretend that paths removed since <tree-ish> are still present"),
503                 OPT__ABBREV(&abbrev),
504                 OPT_BOOLEAN(0, "debug", &debug_mode, "show debugging data"),
505                 OPT_END()
506         };
507
508         if (argc == 2 && !strcmp(argv[1], "-h"))
509                 usage_with_options(ls_files_usage, builtin_ls_files_options);
510
511         memset(&dir, 0, sizeof(dir));
512         prefix = cmd_prefix;
513         if (prefix)
514                 prefix_len = strlen(prefix);
515         git_config(git_default_config, NULL);
516
517         if (read_cache() < 0)
518                 die("index file corrupt");
519
520         argc = parse_options(argc, argv, prefix, builtin_ls_files_options,
521                         ls_files_usage, 0);
522         if (show_tag || show_valid_bit) {
523                 tag_cached = "H ";
524                 tag_unmerged = "M ";
525                 tag_removed = "R ";
526                 tag_modified = "C ";
527                 tag_other = "? ";
528                 tag_killed = "K ";
529                 tag_skip_worktree = "S ";
530                 tag_resolve_undo = "U ";
531         }
532         if (show_modified || show_others || show_deleted || (dir.flags & DIR_SHOW_IGNORED) || show_killed)
533                 require_work_tree = 1;
534         if (show_unmerged)
535                 /*
536                  * There's no point in showing unmerged unless
537                  * you also show the stage information.
538                  */
539                 show_stage = 1;
540         if (dir.exclude_per_dir)
541                 exc_given = 1;
542
543         if (require_work_tree && !is_inside_work_tree())
544                 setup_work_tree();
545
546         pathspec = get_pathspec(prefix, argv);
547
548         /* be nice with submodule paths ending in a slash */
549         if (pathspec)
550                 strip_trailing_slash_from_submodules();
551
552         /* Find common prefix for all pathspec's */
553         max_prefix = common_prefix(pathspec);
554         max_prefix_len = max_prefix ? strlen(max_prefix) : 0;
555
556         /* Treat unmatching pathspec elements as errors */
557         if (pathspec && error_unmatch) {
558                 int num;
559                 for (num = 0; pathspec[num]; num++)
560                         ;
561                 ps_matched = xcalloc(1, num);
562         }
563
564         if ((dir.flags & DIR_SHOW_IGNORED) && !exc_given)
565                 die("ls-files --ignored needs some exclude pattern");
566
567         /* With no flags, we default to showing the cached files */
568         if (!(show_stage | show_deleted | show_others | show_unmerged |
569               show_killed | show_modified | show_resolve_undo))
570                 show_cached = 1;
571
572         if (max_prefix)
573                 prune_cache(max_prefix);
574         if (with_tree) {
575                 /*
576                  * Basic sanity check; show-stages and show-unmerged
577                  * would not make any sense with this option.
578                  */
579                 if (show_stage || show_unmerged)
580                         die("ls-files --with-tree is incompatible with -s or -u");
581                 overlay_tree_on_cache(with_tree, max_prefix);
582         }
583         show_files(&dir);
584         if (show_resolve_undo)
585                 show_ru_info();
586
587         if (ps_matched) {
588                 int bad;
589                 bad = report_path_error(ps_matched, pathspec, prefix);
590                 if (bad)
591                         fprintf(stderr, "Did you forget to 'git add'?\n");
592
593                 return bad ? 1 : 0;
594         }
595
596         return 0;
597 }