10 #include "parse-options.h"
16 #define QUOTE_PYTHON 4
19 typedef enum { FIELD_STR, FIELD_ULONG, FIELD_TIME } cmp_type;
23 unsigned long ul; /* used for sorting when not FIELD_STR */
27 struct ref_sort *next;
28 int atom; /* index into used_atom array */
34 unsigned char objectname[20];
35 struct atom_value *value;
44 { "objectsize", FIELD_ULONG },
48 { "numparent", FIELD_ULONG },
55 { "authordate", FIELD_TIME },
59 { "committerdate", FIELD_TIME },
63 { "taggerdate", FIELD_TIME },
65 { "creatordate", FIELD_TIME },
72 * An atom is a valid field atom listed above, possibly prefixed with
73 * a "*" to denote deref_tag().
75 * We parse the given format string and sort specifiers, and make a list
76 * of properties that we need to extract out of objects. The refinfo
77 * structure will hold an array of extracted values that can be
78 * indexed with the "atom number", which is an index into this
81 static const char **used_atom;
82 static cmp_type *used_atom_type;
83 static int used_atom_cnt, sort_atom_limit, need_tagged;
86 * Used to parse format string and sort specifiers
88 static int parse_atom(const char *atom, const char *ep)
94 if (*sp == '*' && sp < ep)
97 die("malformed field name: %.*s", (int)(ep-atom), atom);
99 /* Do we have the atom already used elsewhere? */
100 for (i = 0; i < used_atom_cnt; i++) {
101 int len = strlen(used_atom[i]);
102 if (len == ep - atom && !memcmp(used_atom[i], atom, len))
106 /* Is the atom a valid one? */
107 for (i = 0; i < ARRAY_SIZE(valid_atom); i++) {
108 int len = strlen(valid_atom[i].name);
110 * If the atom name has a colon, strip it and everything after
111 * it off - it specifies the format for this entry, and
112 * shouldn't be used for checking against the valid_atom
115 const char *formatp = strchr(sp, ':');
116 if (!formatp || ep < formatp)
118 if (len == formatp - sp && !memcmp(valid_atom[i].name, sp, len))
122 if (ARRAY_SIZE(valid_atom) <= i)
123 die("unknown field name: %.*s", (int)(ep-atom), atom);
125 /* Add it in, including the deref prefix */
128 used_atom = xrealloc(used_atom,
129 (sizeof *used_atom) * used_atom_cnt);
130 used_atom_type = xrealloc(used_atom_type,
131 (sizeof(*used_atom_type) * used_atom_cnt));
132 used_atom[at] = xmemdupz(atom, ep - atom);
133 used_atom_type[at] = valid_atom[i].cmp_type;
138 * In a format string, find the next occurrence of %(atom).
140 static const char *find_next(const char *cp)
144 /* %( is the start of an atom;
145 * %% is a quoted per-cent.
149 else if (cp[1] == '%')
150 cp++; /* skip over two % */
151 /* otherwise this is a singleton, literal % */
159 * Make sure the format string is well formed, and parse out
162 static int verify_format(const char *format)
165 for (cp = format; *cp && (sp = find_next(cp)); ) {
166 const char *ep = strchr(sp, ')');
168 return error("malformed format string %s", sp);
169 /* sp points at "%(" and ep points at the closing ")" */
170 parse_atom(sp + 2, ep);
177 * Given an object name, read the object data and size, and return a
178 * "struct object". If the object data we are returning is also borrowed
179 * by the "struct object" representation, set *eaten as well---it is a
180 * signal from parse_object_buffer to us not to free the buffer.
182 static void *get_obj(const unsigned char *sha1, struct object **obj, unsigned long *sz, int *eaten)
184 enum object_type type;
185 void *buf = read_sha1_file(sha1, &type, sz);
188 *obj = parse_object_buffer(sha1, type, *sz, buf, eaten);
194 /* See grab_values */
195 static void grab_common_values(struct atom_value *val, int deref, struct object *obj, void *buf, unsigned long sz)
199 for (i = 0; i < used_atom_cnt; i++) {
200 const char *name = used_atom[i];
201 struct atom_value *v = &val[i];
202 if (!!deref != (*name == '*'))
206 if (!strcmp(name, "objecttype"))
207 v->s = typename(obj->type);
208 else if (!strcmp(name, "objectsize")) {
209 char *s = xmalloc(40);
210 sprintf(s, "%lu", sz);
214 else if (!strcmp(name, "objectname")) {
215 char *s = xmalloc(41);
216 strcpy(s, sha1_to_hex(obj->sha1));
222 /* See grab_values */
223 static void grab_tag_values(struct atom_value *val, int deref, struct object *obj, void *buf, unsigned long sz)
226 struct tag *tag = (struct tag *) obj;
228 for (i = 0; i < used_atom_cnt; i++) {
229 const char *name = used_atom[i];
230 struct atom_value *v = &val[i];
231 if (!!deref != (*name == '*'))
235 if (!strcmp(name, "tag"))
237 else if (!strcmp(name, "type") && tag->tagged)
238 v->s = typename(tag->tagged->type);
239 else if (!strcmp(name, "object") && tag->tagged) {
240 char *s = xmalloc(41);
241 strcpy(s, sha1_to_hex(tag->tagged->sha1));
247 static int num_parents(struct commit *commit)
249 struct commit_list *parents;
252 for (i = 0, parents = commit->parents;
254 parents = parents->next)
259 /* See grab_values */
260 static void grab_commit_values(struct atom_value *val, int deref, struct object *obj, void *buf, unsigned long sz)
263 struct commit *commit = (struct commit *) obj;
265 for (i = 0; i < used_atom_cnt; i++) {
266 const char *name = used_atom[i];
267 struct atom_value *v = &val[i];
268 if (!!deref != (*name == '*'))
272 if (!strcmp(name, "tree")) {
273 char *s = xmalloc(41);
274 strcpy(s, sha1_to_hex(commit->tree->object.sha1));
277 if (!strcmp(name, "numparent")) {
278 char *s = xmalloc(40);
279 v->ul = num_parents(commit);
280 sprintf(s, "%lu", v->ul);
283 else if (!strcmp(name, "parent")) {
284 int num = num_parents(commit);
286 struct commit_list *parents;
287 char *s = xmalloc(41 * num + 1);
289 for (i = 0, parents = commit->parents;
291 parents = parents->next, i = i + 41) {
292 struct commit *parent = parents->item;
293 strcpy(s+i, sha1_to_hex(parent->object.sha1));
303 static const char *find_wholine(const char *who, int wholen, const char *buf, unsigned long sz)
307 if (!strncmp(buf, who, wholen) &&
309 return buf + wholen + 1;
310 eol = strchr(buf, '\n');
315 return ""; /* end of header */
321 static const char *copy_line(const char *buf)
323 const char *eol = strchrnul(buf, '\n');
324 return xmemdupz(buf, eol - buf);
327 static const char *copy_name(const char *buf)
330 for (cp = buf; *cp && *cp != '\n'; cp++) {
331 if (!strncmp(cp, " <", 2))
332 return xmemdupz(buf, cp - buf);
/*
 * Locate the first '<' in buf and the '>' that follows it, and return an
 * xmemdupz() copy of that span, both delimiters included.  What is
 * returned when either delimiter is missing is not visible in this
 * excerpt.
 *
 * NOTE(review): eoemail is initialized with strchr(email, '>') before
 * the !email test below has run, so a buf that contains no '<' hands a
 * NULL pointer to strchr().  The search for '>' should only be made once
 * email is known to be non-NULL.
 */
337 static const char *copy_email(const char *buf)
339 const char *email = strchr(buf, '<');
/* NOTE(review): email may be NULL here; it is only checked on the next line. */
340 const char *eoemail = strchr(email, '>');
341 if (!email || !eoemail)
343 return xmemdupz(email, eoemail + 1 - email);
/*
 * Find the "> " marker in buf, parse the number that follows it with
 * strtoul() as the timestamp and the text after that with strtol() as the
 * zone, then store an xstrdup() copy of show_date(timestamp, tz,
 * date_mode) in v->s.  date_mode starts as DATE_NORMAL; when atomname
 * contains a ':' the mode comes from parse_date_format() instead.
 *
 * NOTE(review): the timestamp test compares against ULONG_MAX without
 * consulting errno, whereas the tz test additionally requires
 * errno == ERANGE.  Whether errno is cleared before these conversions, and
 * whether eoemail is checked for NULL before eoemail + 2 is used, cannot
 * be seen in this excerpt -- confirm against the full function.
 */
346 static void grab_date(const char *buf, struct atom_value *v, const char *atomname)
348 const char *eoemail = strstr(buf, "> ");
350 unsigned long timestamp;
352 enum date_mode date_mode = DATE_NORMAL;
356 * We got here because atomname ends in "date" or "date<something>";
357 * it's not possible that <something> is not ":<format>" because
358 * parse_atom() wouldn't have allowed it, so we can assume that no
359 * ":" means no format is specified, and use the default.
361 formatp = strchr(atomname, ':');
362 if (formatp != NULL) {
364 date_mode = parse_date_format(formatp);
369 timestamp = strtoul(eoemail + 2, &zone, 10);
370 if (timestamp == ULONG_MAX)
372 tz = strtol(zone, NULL, 10);
373 if ((tz == LONG_MIN || tz == LONG_MAX) && errno == ERANGE)
375 v->s = xstrdup(show_date(timestamp, tz, date_mode));
383 /* See grab_values */
384 static void grab_person(const char *who, struct atom_value *val, int deref, struct object *obj, void *buf, unsigned long sz)
387 int wholen = strlen(who);
388 const char *wholine = NULL;
390 for (i = 0; i < used_atom_cnt; i++) {
391 const char *name = used_atom[i];
392 struct atom_value *v = &val[i];
393 if (!!deref != (*name == '*'))
397 if (strncmp(who, name, wholen))
399 if (name[wholen] != 0 &&
400 strcmp(name + wholen, "name") &&
401 strcmp(name + wholen, "email") &&
402 prefixcmp(name + wholen, "date"))
405 wholine = find_wholine(who, wholen, buf, sz);
407 return; /* no point looking for it */
408 if (name[wholen] == 0)
409 v->s = copy_line(wholine);
410 else if (!strcmp(name + wholen, "name"))
411 v->s = copy_name(wholine);
412 else if (!strcmp(name + wholen, "email"))
413 v->s = copy_email(wholine);
414 else if (!prefixcmp(name + wholen, "date"))
415 grab_date(wholine, v, name);
418 /* For a tag or a commit object, if "creator" or "creatordate" is
419 * requested, do something special.
421 if (strcmp(who, "tagger") && strcmp(who, "committer"))
422 return; /* "author" for commit object is not wanted */
424 wholine = find_wholine(who, wholen, buf, sz);
427 for (i = 0; i < used_atom_cnt; i++) {
428 const char *name = used_atom[i];
429 struct atom_value *v = &val[i];
430 if (!!deref != (*name == '*'))
435 if (!prefixcmp(name, "creatordate"))
436 grab_date(wholine, v, name);
437 else if (!strcmp(name, "creator"))
438 v->s = copy_line(wholine);
442 static void find_subpos(const char *buf, unsigned long sz, const char **sub, const char **body)
445 const char *eol = strchr(buf, '\n');
448 if (eol[1] == '\n') {
450 break; /* found end of header */
458 *sub = buf; /* first non-empty line */
459 buf = strchr(buf, '\n');
462 return; /* no body */
465 buf++; /* skip blank between subject and body */
469 /* See grab_values */
470 static void grab_sub_body_contents(struct atom_value *val, int deref, struct object *obj, void *buf, unsigned long sz)
473 const char *subpos = NULL, *bodypos = NULL;
475 for (i = 0; i < used_atom_cnt; i++) {
476 const char *name = used_atom[i];
477 struct atom_value *v = &val[i];
478 if (!!deref != (*name == '*'))
482 if (strcmp(name, "subject") &&
483 strcmp(name, "body") &&
484 strcmp(name, "contents"))
487 find_subpos(buf, sz, &subpos, &bodypos);
491 if (!strcmp(name, "subject"))
492 v->s = copy_line(subpos);
493 else if (!strcmp(name, "body"))
494 v->s = xstrdup(bodypos);
495 else if (!strcmp(name, "contents"))
496 v->s = xstrdup(subpos);
500 /* We want to have empty print-string for field requests
501 * that do not apply (e.g. "authordate" for a tag object)
503 static void fill_missing_values(struct atom_value *val)
506 for (i = 0; i < used_atom_cnt; i++) {
507 struct atom_value *v = &val[i];
514 * val is a list of atom_value to hold returned values. Extract
515 * the values for atoms in used_atom array out of (obj, buf, sz).
516 * When deref is false, (obj, buf, sz) is the object that is
517 * pointed at by the ref itself; otherwise it is the object the
518 * ref (which is a tag) refers to.
520 static void grab_values(struct atom_value *val, int deref, struct object *obj, void *buf, unsigned long sz)
522 grab_common_values(val, deref, obj, buf, sz);
525 grab_tag_values(val, deref, obj, buf, sz);
526 grab_sub_body_contents(val, deref, obj, buf, sz);
527 grab_person("tagger", val, deref, obj, buf, sz);
530 grab_commit_values(val, deref, obj, buf, sz);
531 grab_sub_body_contents(val, deref, obj, buf, sz);
532 grab_person("author", val, deref, obj, buf, sz);
533 grab_person("committer", val, deref, obj, buf, sz);
536 // grab_tree_values(val, deref, obj, buf, sz);
539 // grab_blob_values(val, deref, obj, buf, sz);
542 die("Eh? Object of type %d?", obj->type);
547 * Generate a format suitable for scanf from a ref_rev_parse_rules
548 * rule; that is, replace the "%.*s" spec with a "%s" spec.
550 static void gen_scanf_fmt(char *scanf_fmt, const char *rule)
554 spec = strstr(rule, "%.*s");
555 if (!spec || strstr(spec + 4, "%.*s"))
556 die("invalid rule in ref_rev_parse_rules: %s", rule);
558 /* copy all until spec */
559 strncpy(scanf_fmt, rule, spec - rule);
560 scanf_fmt[spec - rule] = '\0';
562 strcat(scanf_fmt, "%s");
563 /* copy remaining rule */
564 strcat(scanf_fmt, spec + 4);
570 * Shorten the refname to a non-ambiguous form
572 static char *get_short_ref(struct refinfo *ref)
575 static char **scanf_fmts;
579 /* pre-generate scanf formats from ref_rev_parse_rules[] */
581 size_t total_len = 0;
583 /* the rule list is NULL terminated, count them first */
584 for (; ref_rev_parse_rules[nr_rules]; nr_rules++)
585 /* no +1 because strlen("%s") < strlen("%.*s") */
586 total_len += strlen(ref_rev_parse_rules[nr_rules]);
588 scanf_fmts = xmalloc(nr_rules * sizeof(char *) + total_len);
591 for (i = 0; i < nr_rules; i++) {
592 scanf_fmts[i] = (char *)&scanf_fmts[nr_rules]
594 gen_scanf_fmt(scanf_fmts[i], ref_rev_parse_rules[i]);
595 total_len += strlen(ref_rev_parse_rules[i]);
599 /* bail out if there are no rules */
603 /* buffer for scanf result, at most ref->refname must fit */
604 short_name = xstrdup(ref->refname);
606 /* skip first rule, it will always match */
607 for (i = nr_rules - 1; i > 0 ; --i) {
611 if (1 != sscanf(ref->refname, scanf_fmts[i], short_name))
614 short_name_len = strlen(short_name);
617 * check if the short name resolves to a valid ref,
618 * but use only rules prior to the matched one
620 for (j = 0; j < i; j++) {
621 const char *rule = ref_rev_parse_rules[j];
622 unsigned char short_objectname[20];
623 char refname[PATH_MAX];
626 * the short name is ambiguous, if it resolves
627 * (with this previous rule) to a valid ref
628 * read_ref() returns 0 on success
630 mksnpath(refname, sizeof(refname),
631 rule, short_name_len, short_name);
632 if (!read_ref(refname, short_objectname))
637 * short name is non-ambiguous if all previous rules
638 * haven't resolved to a valid ref
650 * Parse the object referred to by ref, and grab the needed values.
652 static void populate_value(struct refinfo *ref)
658 const unsigned char *tagged;
660 ref->value = xcalloc(sizeof(struct atom_value), used_atom_cnt);
662 buf = get_obj(ref->objectname, &obj, &size, &eaten);
664 die("missing object %s for %s",
665 sha1_to_hex(ref->objectname), ref->refname);
667 die("parse_object_buffer failed on %s for %s",
668 sha1_to_hex(ref->objectname), ref->refname);
670 /* Fill in specials first */
671 for (i = 0; i < used_atom_cnt; i++) {
672 const char *name = used_atom[i];
673 struct atom_value *v = &ref->value[i];
679 if (!prefixcmp(name, "refname")) {
680 const char *formatp = strchr(name, ':');
681 const char *refname = ref->refname;
683 /* look for "short" refname format */
686 if (!strcmp(formatp, "short"))
687 refname = get_short_ref(ref);
689 die("unknown refname format %s",
696 int len = strlen(refname);
697 char *s = xmalloc(len + 4);
698 sprintf(s, "%s^{}", refname);
704 grab_values(ref->value, 0, obj, buf, size);
708 /* If there is no atom that wants to know about tagged
709 * object, we are done.
711 if (!need_tagged || (obj->type != OBJ_TAG))
714 /* If it is a tag object, see if we use a value that derefs
715 * the object, and if we do, grab the object it refers to.
717 tagged = ((struct tag *)obj)->tagged->sha1;
719 /* NEEDSWORK: This derefs tag only once, which
720 * is good to deal with chains of trust, but
721 * is not consistent with what deref_tag() does
722 * which peels the onion to the core.
724 buf = get_obj(tagged, &obj, &size, &eaten);
726 die("missing object %s for %s",
727 sha1_to_hex(tagged), ref->refname);
729 die("parse_object_buffer failed on %s for %s",
730 sha1_to_hex(tagged), ref->refname);
731 grab_values(ref->value, 1, obj, buf, size);
737 * Given a ref, return the value for the atom. This lazily gets the value
738 * out of the object by calling populate_value().
740 static void get_value(struct refinfo *ref, int atom, struct atom_value **v)
744 fill_missing_values(ref->value);
746 *v = &ref->value[atom];
749 struct grab_ref_cbdata {
750 struct refinfo **grab_array;
751 const char **grab_pattern;
756 * A call-back given to for_each_ref(). It is unfortunate that we
757 * need to use global variables to pass extra information to this
760 static int grab_single_ref(const char *refname, const unsigned char *sha1, int flag, void *cb_data)
762 struct grab_ref_cbdata *cb = cb_data;
766 if (*cb->grab_pattern) {
767 const char **pattern;
768 int namelen = strlen(refname);
769 for (pattern = cb->grab_pattern; *pattern; pattern++) {
770 const char *p = *pattern;
771 int plen = strlen(p);
773 if ((plen <= namelen) &&
774 !strncmp(refname, p, plen) &&
775 (refname[plen] == '\0' ||
776 refname[plen] == '/' ||
779 if (!fnmatch(p, refname, FNM_PATHNAME))
786 /* We do not open the object yet; sort may only need refname
787 * to do its job and the resulting list may yet be pruned
790 ref = xcalloc(1, sizeof(*ref));
791 ref->refname = xstrdup(refname);
792 hashcpy(ref->objectname, sha1);
795 cb->grab_array = xrealloc(cb->grab_array,
796 sizeof(*cb->grab_array) * (cnt + 1));
797 cb->grab_array[cnt++] = ref;
802 static int cmp_ref_sort(struct ref_sort *s, struct refinfo *a, struct refinfo *b)
804 struct atom_value *va, *vb;
806 cmp_type cmp_type = used_atom_type[s->atom];
808 get_value(a, s->atom, &va);
809 get_value(b, s->atom, &vb);
812 cmp = strcmp(va->s, vb->s);
817 else if (va->ul == vb->ul)
823 return (s->reverse) ? -cmp : cmp;
826 static struct ref_sort *ref_sort;
827 static int compare_refs(const void *a_, const void *b_)
829 struct refinfo *a = *((struct refinfo **)a_);
830 struct refinfo *b = *((struct refinfo **)b_);
833 for (s = ref_sort; s; s = s->next) {
834 int cmp = cmp_ref_sort(s, a, b);
841 static void sort_refs(struct ref_sort *sort, struct refinfo **refs, int num_refs)
844 qsort(refs, num_refs, sizeof(struct refinfo *), compare_refs);
847 static void print_value(struct refinfo *ref, int atom, int quote_style)
849 struct atom_value *v;
850 get_value(ref, atom, &v);
851 switch (quote_style) {
856 sq_quote_print(stdout, v->s);
859 perl_quote_print(stdout, v->s);
862 python_quote_print(stdout, v->s);
865 tcl_quote_print(stdout, v->s);
870 static int hex1(char ch)
872 if ('0' <= ch && ch <= '9')
874 else if ('a' <= ch && ch <= 'f')
875 return ch - 'a' + 10;
876 else if ('A' <= ch && ch <= 'F')
877 return ch - 'A' + 10;
880 static int hex2(const char *cp)
883 return (hex1(cp[0]) << 4) | hex1(cp[1]);
888 static void emit(const char *cp, const char *ep)
890 while (*cp && (!ep || cp < ep)) {
895 int ch = hex2(cp + 1);
908 static void show_ref(struct refinfo *info, const char *format, int quote_style)
910 const char *cp, *sp, *ep;
912 for (cp = format; *cp && (sp = find_next(cp)); cp = ep + 1) {
913 ep = strchr(sp, ')');
916 print_value(info, parse_atom(sp + 2, ep), quote_style);
919 sp = cp + strlen(cp);
925 static struct ref_sort *default_sort(void)
927 static const char cstr_name[] = "refname";
929 struct ref_sort *sort = xcalloc(1, sizeof(*sort));
932 sort->atom = parse_atom(cstr_name, cstr_name + strlen(cstr_name));
936 static int opt_parse_sort(const struct option *opt, const char *arg, int unset)
938 struct ref_sort **sort_tail = opt->value;
942 if (!arg) /* should --no-sort void the list ? */
945 *sort_tail = s = xcalloc(1, sizeof(*s));
946 sort_tail = &s->next;
953 s->atom = parse_atom(arg, arg+len);
957 static char const * const for_each_ref_usage[] = {
958 "git for-each-ref [options] [<pattern>]",
962 int cmd_for_each_ref(int argc, const char **argv, const char *prefix)
965 const char *format = "%(objectname) %(objecttype)\t%(refname)";
966 struct ref_sort *sort = NULL, **sort_tail = &sort;
967 int maxcount = 0, quote_style = 0;
968 struct refinfo **refs;
969 struct grab_ref_cbdata cbdata;
971 struct option opts[] = {
972 OPT_BIT('s', "shell", "e_style,
973 "quote placeholders suitably for shells", QUOTE_SHELL),
974 OPT_BIT('p', "perl", "e_style,
975 "quote placeholders suitably for perl", QUOTE_PERL),
976 OPT_BIT(0 , "python", "e_style,
977 "quote placeholders suitably for python", QUOTE_PYTHON),
978 OPT_BIT(0 , "tcl", "e_style,
979 "quote placeholders suitably for tcl", QUOTE_TCL),
982 OPT_INTEGER( 0 , "count", &maxcount, "show only <n> matched refs"),
983 OPT_STRING( 0 , "format", &format, "format", "format to use for the output"),
984 OPT_CALLBACK(0 , "sort", sort_tail, "key",
985 "field name to sort on", &opt_parse_sort),
989 parse_options(argc, argv, opts, for_each_ref_usage, 0);
991 error("invalid --count argument: `%d'", maxcount);
992 usage_with_options(for_each_ref_usage, opts);
994 if (HAS_MULTI_BITS(quote_style)) {
995 error("more than one quoting style?");
996 usage_with_options(for_each_ref_usage, opts);
998 if (verify_format(format))
999 usage_with_options(for_each_ref_usage, opts);
1002 sort = default_sort();
1003 sort_atom_limit = used_atom_cnt;
1005 memset(&cbdata, 0, sizeof(cbdata));
1006 cbdata.grab_pattern = argv;
1007 for_each_ref(grab_single_ref, &cbdata);
1008 refs = cbdata.grab_array;
1009 num_refs = cbdata.grab_cnt;
1011 for (i = 0; i < used_atom_cnt; i++) {
1012 if (used_atom[i][0] == '*') {
1018 sort_refs(sort, refs, num_refs);
1020 if (!maxcount || num_refs < maxcount)
1021 maxcount = num_refs;
1022 for (i = 0; i < maxcount; i++)
1023 show_ref(refs[i], format, quote_style);