git.oblomov.eu Git - git/blob - pretty.c

   1 #include "cache.h"
   2 #include "commit.h"
   3 #include "utf8.h"
   4 #include "diff.h"
   5 #include "revision.h"
   6 #include "string-list.h"
   7 #include "mailmap.h"
   8 #include "log-tree.h"
   9 #include "notes.h"
  10 #include "color.h"
  11 #include "reflog-walk.h"
  12
  13 static char *user_format;
  14 static struct cmt_fmt_map {
  15         const char *name;
  16         enum cmit_fmt format;
  17         int is_tformat;
  18         int is_alias;
  19         const char *user_format;
  20 } *commit_formats;
  21 static size_t builtin_formats_len;
  22 static size_t commit_formats_len;
  23 static size_t commit_formats_alloc;
  24 static struct cmt_fmt_map *find_commit_format(const char *sought);
  25
  26 static void save_user_format(struct rev_info *rev, const char *cp, int is_tformat)
  27 {
  28         free(user_format);
  29         user_format = xstrdup(cp);
  30         if (is_tformat)
  31                 rev->use_terminator = 1;
  32         rev->commit_format = CMIT_FMT_USERFORMAT;
  33 }
  34
  35 static int git_pretty_formats_config(const char *var, const char *value, void *cb)
  36 {
  37         struct cmt_fmt_map *commit_format = NULL;
  38         const char *name;
  39         const char *fmt;
  40         int i;
  41
  42         if (prefixcmp(var, "pretty."))
  43                 return 0;
  44
  45         name = var + strlen("pretty.");
  46         for (i = 0; i < builtin_formats_len; i++) {
  47                 if (!strcmp(commit_formats[i].name, name))
  48                         return 0;
  49         }
  50
  51         for (i = builtin_formats_len; i < commit_formats_len; i++) {
  52                 if (!strcmp(commit_formats[i].name, name)) {
  53                         commit_format = &commit_formats[i];
  54                         break;
  55                 }
  56         }
  57
  58         if (!commit_format) {
  59                 ALLOC_GROW(commit_formats, commit_formats_len+1,
  60                            commit_formats_alloc);
  61                 commit_format = &commit_formats[commit_formats_len];
  62                 memset(commit_format, 0, sizeof(*commit_format));
  63                 commit_formats_len++;
  64         }
  65
  66         commit_format->name = xstrdup(name);
  67         commit_format->format = CMIT_FMT_USERFORMAT;
  68         git_config_string(&fmt, var, value);
  69         if (!prefixcmp(fmt, "format:") || !prefixcmp(fmt, "tformat:")) {
  70                 commit_format->is_tformat = fmt[0] == 't';
  71                 fmt = strchr(fmt, ':') + 1;
  72         } else if (strchr(fmt, '%'))
  73                 commit_format->is_tformat = 1;
  74         else
  75                 commit_format->is_alias = 1;
  76         commit_format->user_format = fmt;
  77
  78         return 0;
  79 }
  80
  81 static void setup_commit_formats(void)
  82 {
  83         struct cmt_fmt_map builtin_formats[] = {
  84                 { "raw",        CMIT_FMT_RAW,           0 },
  85                 { "medium",     CMIT_FMT_MEDIUM,        0 },
  86                 { "short",      CMIT_FMT_SHORT,         0 },
  87                 { "email",      CMIT_FMT_EMAIL,         0 },
  88                 { "fuller",     CMIT_FMT_FULLER,        0 },
  89                 { "full",       CMIT_FMT_FULL,          0 },
  90                 { "oneline",    CMIT_FMT_ONELINE,       1 }
  91         };
  92         commit_formats_len = ARRAY_SIZE(builtin_formats);
  93         builtin_formats_len = commit_formats_len;
  94         ALLOC_GROW(commit_formats, commit_formats_len, commit_formats_alloc);
  95         memcpy(commit_formats, builtin_formats,
  96                sizeof(*builtin_formats)*ARRAY_SIZE(builtin_formats));
  97
  98         git_config(git_pretty_formats_config, NULL);
  99 }
 100
 101 static struct cmt_fmt_map *find_commit_format_recursive(const char *sought,
 102                                                         const char *original,
 103                                                         int num_redirections)
 104 {
 105         struct cmt_fmt_map *found = NULL;
 106         size_t found_match_len = 0;
 107         int i;
 108
 109         if (num_redirections >= commit_formats_len)
 110                 die("invalid --pretty format: "
 111                     "'%s' references an alias which points to itself",
 112                     original);
 113
 114         for (i = 0; i < commit_formats_len; i++) {
 115                 size_t match_len;
 116
 117                 if (prefixcmp(commit_formats[i].name, sought))
 118                         continue;
 119
 120                 match_len = strlen(commit_formats[i].name);
 121                 if (found == NULL || found_match_len > match_len) {
 122                         found = &commit_formats[i];
 123                         found_match_len = match_len;
 124                 }
 125         }
 126
 127         if (found && found->is_alias) {
 128                 found = find_commit_format_recursive(found->user_format,
 129                                                      original,
 130                                                      num_redirections+1);
 131         }
 132
 133         return found;
 134 }
 135
 136 static struct cmt_fmt_map *find_commit_format(const char *sought)
 137 {
 138         if (!commit_formats)
 139                 setup_commit_formats();
 140
 141         return find_commit_format_recursive(sought, sought, 0);
 142 }
 143
 144 void get_commit_format(const char *arg, struct rev_info *rev)
 145 {
 146         struct cmt_fmt_map *commit_format;
 147
 148         rev->use_terminator = 0;
 149         if (!arg || !*arg) {
 150                 rev->commit_format = CMIT_FMT_DEFAULT;
 151                 return;
 152         }
 153         if (!prefixcmp(arg, "format:") || !prefixcmp(arg, "tformat:")) {
 154                 save_user_format(rev, strchr(arg, ':') + 1, arg[0] == 't');
 155                 return;
 156         }
 157
 158         if (strchr(arg, '%')) {
 159                 save_user_format(rev, arg, 1);
 160                 return;
 161         }
 162
 163         commit_format = find_commit_format(arg);
 164         if (!commit_format)
 165                 die("invalid --pretty format: %s", arg);
 166
 167         rev->commit_format = commit_format->format;
 168         rev->use_terminator = commit_format->is_tformat;
 169         if (commit_format->format == CMIT_FMT_USERFORMAT) {
 170                 save_user_format(rev, commit_format->user_format,
 171                                  commit_format->is_tformat);
 172         }
 173 }
 174
 175 /*
 176  * Generic support for pretty-printing the header
 177  */
 178 static int get_one_line(const char *msg)
 179 {
 180         int ret = 0;
 181
 182         for (;;) {
 183                 char c = *msg++;
 184                 if (!c)
 185                         break;
 186                 ret++;
 187                 if (c == '\n')
 188                         break;
 189         }
 190         return ret;
 191 }
 192
 193 /* High bit set, or ISO-2022-INT */
 194 static int non_ascii(int ch)
 195 {
 196         return !isascii(ch) || ch == '\033';
 197 }
 198
 199 int has_non_ascii(const char *s)
 200 {
 201         int ch;
 202         if (!s)
 203                 return 0;
 204         while ((ch = *s++) != '\0') {
 205                 if (non_ascii(ch))
 206                         return 1;
 207         }
 208         return 0;
 209 }
 210
 211 static int is_rfc2047_special(char ch)
 212 {
 213         return (non_ascii(ch) || (ch == '=') || (ch == '?') || (ch == '_'));
 214 }
 215
 216 static void add_rfc2047(struct strbuf *sb, const char *line, int len,
 217                        const char *encoding)
 218 {
 219         int i, last;
 220
 221         for (i = 0; i < len; i++) {
 222                 int ch = line[i];
 223                 if (non_ascii(ch))
 224                         goto needquote;
 225                 if ((i + 1 < len) && (ch == '=' && line[i+1] == '?'))
 226                         goto needquote;
 227         }
 228         strbuf_add(sb, line, len);
 229         return;
 230
 231 needquote:
 232         strbuf_grow(sb, len * 3 + strlen(encoding) + 100);
 233         strbuf_addf(sb, "=?%s?q?", encoding);
 234         for (i = last = 0; i < len; i++) {
 235                 unsigned ch = line[i] & 0xFF;
 236                 /*
 237                  * We encode ' ' using '=20' even though rfc2047
 238                  * allows using '_' for readability.  Unfortunately,
 239                  * many programs do not understand this and just
 240                  * leave the underscore in place.
 241                  */
 242                 if (is_rfc2047_special(ch) || ch == ' ') {
 243                         strbuf_add(sb, line + last, i - last);
 244                         strbuf_addf(sb, "=%02X", ch);
 245                         last = i + 1;
 246                 }
 247         }
 248         strbuf_add(sb, line + last, len - last);
 249         strbuf_addstr(sb, "?=");
 250 }
 251
 252 void pp_user_info(const char *what, enum cmit_fmt fmt, struct strbuf *sb,
 253                   const char *line, enum date_mode dmode,
 254                   const char *encoding)
 255 {
 256         char *date;
 257         int namelen;
 258         unsigned long time;
 259         int tz;
 260
 261         if (fmt == CMIT_FMT_ONELINE)
 262                 return;
 263         date = strchr(line, '>');
 264         if (!date)
 265                 return;
 266         namelen = ++date - line;
 267         time = strtoul(date, &date, 10);
 268         tz = strtol(date, NULL, 10);
 269
 270         if (fmt == CMIT_FMT_EMAIL) {
 271                 char *name_tail = strchr(line, '<');
 272                 int display_name_length;
 273                 if (!name_tail)
 274                         return;
 275                 while (line < name_tail && isspace(name_tail[-1]))
 276                         name_tail--;
 277                 display_name_length = name_tail - line;
 278                 strbuf_addstr(sb, "From: ");
 279                 add_rfc2047(sb, line, display_name_length, encoding);
 280                 strbuf_add(sb, name_tail, namelen - display_name_length);
 281                 strbuf_addch(sb, '\n');
 282         } else {
 283                 strbuf_addf(sb, "%s: %.*s%.*s\n", what,
 284                               (fmt == CMIT_FMT_FULLER) ? 4 : 0,
 285                               "    ", namelen, line);
 286         }
 287         switch (fmt) {
 288         case CMIT_FMT_MEDIUM:
 289                 strbuf_addf(sb, "Date:   %s\n", show_date(time, tz, dmode));
 290                 break;
 291         case CMIT_FMT_EMAIL:
 292                 strbuf_addf(sb, "Date: %s\n", show_date(time, tz, DATE_RFC2822));
 293                 break;
 294         case CMIT_FMT_FULLER:
 295                 strbuf_addf(sb, "%sDate: %s\n", what, show_date(time, tz, dmode));
 296                 break;
 297         default:
 298                 /* notin' */
 299                 break;
 300         }
 301 }
 302
 303 static int is_empty_line(const char *line, int *len_p)
 304 {
 305         int len = *len_p;
 306         while (len && isspace(line[len-1]))
 307                 len--;
 308         *len_p = len;
 309         return !len;
 310 }
 311
 312 static const char *skip_empty_lines(const char *msg)
 313 {
 314         for (;;) {
 315                 int linelen = get_one_line(msg);
 316                 int ll = linelen;
 317                 if (!linelen)
 318                         break;
 319                 if (!is_empty_line(msg, &ll))
 320                         break;
 321                 msg += linelen;
 322         }
 323         return msg;
 324 }
 325
 326 static void add_merge_info(enum cmit_fmt fmt, struct strbuf *sb,
 327                         const struct commit *commit, int abbrev)
 328 {
 329         struct commit_list *parent = commit->parents;
 330
 331         if ((fmt == CMIT_FMT_ONELINE) || (fmt == CMIT_FMT_EMAIL) ||
 332             !parent || !parent->next)
 333                 return;
 334
 335         strbuf_addstr(sb, "Merge:");
 336
 337         while (parent) {
 338                 struct commit *p = parent->item;
 339                 const char *hex = NULL;
 340                 if (abbrev)
 341                         hex = find_unique_abbrev(p->object.sha1, abbrev);
 342                 if (!hex)
 343                         hex = sha1_to_hex(p->object.sha1);
 344                 parent = parent->next;
 345
 346                 strbuf_addf(sb, " %s", hex);
 347         }
 348         strbuf_addch(sb, '\n');
 349 }
 350
 351 static char *get_header(const struct commit *commit, const char *key)
 352 {
 353         int key_len = strlen(key);
 354         const char *line = commit->buffer;
 355
 356         for (;;) {
 357                 const char *eol = strchr(line, '\n'), *next;
 358
 359                 if (line == eol)
 360                         return NULL;
 361                 if (!eol) {
 362                         eol = line + strlen(line);
 363                         next = NULL;
 364                 } else
 365                         next = eol + 1;
 366                 if (eol - line > key_len &&
 367                     !strncmp(line, key, key_len) &&
 368                     line[key_len] == ' ') {
 369                         return xmemdupz(line + key_len + 1, eol - line - key_len - 1);
 370                 }
 371                 line = next;
 372         }
 373 }
 374
 375 static char *replace_encoding_header(char *buf, const char *encoding)
 376 {
 377         struct strbuf tmp = STRBUF_INIT;
 378         size_t start, len;
 379         char *cp = buf;
 380
 381         /* guess if there is an encoding header before a \n\n */
 382         while (strncmp(cp, "encoding ", strlen("encoding "))) {
 383                 cp = strchr(cp, '\n');
 384                 if (!cp || *++cp == '\n')
 385                         return buf;
 386         }
 387         start = cp - buf;
 388         cp = strchr(cp, '\n');
 389         if (!cp)
 390                 return buf; /* should not happen but be defensive */
 391         len = cp + 1 - (buf + start);
 392
 393         strbuf_attach(&tmp, buf, strlen(buf), strlen(buf) + 1);
 394         if (is_encoding_utf8(encoding)) {
 395                 /* we have re-coded to UTF-8; drop the header */
 396                 strbuf_remove(&tmp, start, len);
 397         } else {
 398                 /* just replaces XXXX in 'encoding XXXX\n' */
 399                 strbuf_splice(&tmp, start + strlen("encoding "),
 400                                           len - strlen("encoding \n"),
 401                                           encoding, strlen(encoding));
 402         }
 403         return strbuf_detach(&tmp, NULL);
 404 }
 405
 406 char *logmsg_reencode(const struct commit *commit,
 407                       const char *output_encoding)
 408 {
 409         static const char *utf8 = "UTF-8";
 410         const char *use_encoding;
 411         char *encoding;
 412         char *out;
 413
 414         if (!*output_encoding)
 415                 return NULL;
 416         encoding = get_header(commit, "encoding");
 417         use_encoding = encoding ? encoding : utf8;
 418         if (!strcmp(use_encoding, output_encoding))
 419                 if (encoding) /* we'll strip encoding header later */
 420                         out = xstrdup(commit->buffer);
 421                 else
 422                         return NULL; /* nothing to do */
 423         else
 424                 out = reencode_string(commit->buffer,
 425                                       output_encoding, use_encoding);
 426         if (out)
 427                 out = replace_encoding_header(out, output_encoding);
 428
 429         free(encoding);
 430         return out;
 431 }
 432
 433 static int mailmap_name(char *email, int email_len, char *name, int name_len)
 434 {
 435         static struct string_list *mail_map;
 436         if (!mail_map) {
 437                 mail_map = xcalloc(1, sizeof(*mail_map));
 438                 read_mailmap(mail_map, NULL);
 439         }
 440         return mail_map->nr && map_user(mail_map, email, email_len, name, name_len);
 441 }
 442
 443 static size_t format_person_part(struct strbuf *sb, char part,
 444                                  const char *msg, int len, enum date_mode dmode)
 445 {
 446         /* currently all placeholders have same length */
 447         const int placeholder_len = 2;
 448         int start, end, tz = 0;
 449         unsigned long date = 0;
 450         char *ep;
 451         const char *name_start, *name_end, *mail_start, *mail_end, *msg_end = msg+len;
 452         char person_name[1024];
 453         char person_mail[1024];
 454
 455         /* advance 'end' to point to email start delimiter */
 456         for (end = 0; end < len && msg[end] != '<'; end++)
 457                 ; /* do nothing */
 458
 459         /*
 460          * When end points at the '<' that we found, it should have
 461          * matching '>' later, which means 'end' must be strictly
 462          * below len - 1.
 463          */
 464         if (end >= len - 2)
 465                 goto skip;
 466
 467         /* Seek for both name and email part */
 468         name_start = msg;
 469         name_end = msg+end;
 470         while (name_end > name_start && isspace(*(name_end-1)))
 471                 name_end--;
 472         mail_start = msg+end+1;
 473         mail_end = mail_start;
 474         while (mail_end < msg_end && *mail_end != '>')
 475                 mail_end++;
 476         if (mail_end == msg_end)
 477                 goto skip;
 478         end = mail_end-msg;
 479
 480         if (part == 'N' || part == 'E') { /* mailmap lookup */
 481                 strlcpy(person_name, name_start, name_end-name_start+1);
 482                 strlcpy(person_mail, mail_start, mail_end-mail_start+1);
 483                 mailmap_name(person_mail, sizeof(person_mail), person_name, sizeof(person_name));
 484                 name_start = person_name;
 485                 name_end = name_start + strlen(person_name);
 486                 mail_start = person_mail;
 487                 mail_end = mail_start +  strlen(person_mail);
 488         }
 489         if (part == 'n' || part == 'N') {       /* name */
 490                 strbuf_add(sb, name_start, name_end-name_start);
 491                 return placeholder_len;
 492         }
 493         if (part == 'e' || part == 'E') {       /* email */
 494                 strbuf_add(sb, mail_start, mail_end-mail_start);
 495                 return placeholder_len;
 496         }
 497
 498         /* advance 'start' to point to date start delimiter */
 499         for (start = end + 1; start < len && isspace(msg[start]); start++)
 500                 ; /* do nothing */
 501         if (start >= len)
 502                 goto skip;
 503         date = strtoul(msg + start, &ep, 10);
 504         if (msg + start == ep)
 505                 goto skip;
 506
 507         if (part == 't') {      /* date, UNIX timestamp */
 508                 strbuf_add(sb, msg + start, ep - (msg + start));
 509                 return placeholder_len;
 510         }
 511
 512         /* parse tz */
 513         for (start = ep - msg + 1; start < len && isspace(msg[start]); start++)
 514                 ; /* do nothing */
 515         if (start + 1 < len) {
 516                 tz = strtoul(msg + start + 1, NULL, 10);
 517                 if (msg[start] == '-')
 518                         tz = -tz;
 519         }
 520
 521         switch (part) {
 522         case 'd':       /* date */
 523                 strbuf_addstr(sb, show_date(date, tz, dmode));
 524                 return placeholder_len;
 525         case 'D':       /* date, RFC2822 style */
 526                 strbuf_addstr(sb, show_date(date, tz, DATE_RFC2822));
 527                 return placeholder_len;
 528         case 'r':       /* date, relative */
 529                 strbuf_addstr(sb, show_date(date, tz, DATE_RELATIVE));
 530                 return placeholder_len;
 531         case 'i':       /* date, ISO 8601 */
 532                 strbuf_addstr(sb, show_date(date, tz, DATE_ISO8601));
 533                 return placeholder_len;
 534         }
 535
 536 skip:
 537         /*
 538          * bogus commit, 'sb' cannot be updated, but we still need to
 539          * compute a valid return value.
 540          */
 541         if (part == 'n' || part == 'e' || part == 't' || part == 'd'
 542             || part == 'D' || part == 'r' || part == 'i')
 543                 return placeholder_len;
 544
 545         return 0; /* unknown placeholder */
 546 }
 547
 548 struct chunk {
 549         size_t off;
 550         size_t len;
 551 };
 552
 553 struct format_commit_context {
 554         const struct commit *commit;
 555         const struct pretty_print_context *pretty_ctx;
 556         unsigned commit_header_parsed:1;
 557         unsigned commit_message_parsed:1;
 558         char *message;
 559         size_t width, indent1, indent2;
 560
 561         /* These offsets are relative to the start of the commit message. */
 562         struct chunk author;
 563         struct chunk committer;
 564         struct chunk encoding;
 565         size_t message_off;
 566         size_t subject_off;
 567         size_t body_off;
 568
 569         /* The following ones are relative to the result struct strbuf. */
 570         struct chunk abbrev_commit_hash;
 571         struct chunk abbrev_tree_hash;
 572         struct chunk abbrev_parent_hashes;
 573         size_t wrap_start;
 574 };
 575
 576 static int add_again(struct strbuf *sb, struct chunk *chunk)
 577 {
 578         if (chunk->len) {
 579                 strbuf_adddup(sb, chunk->off, chunk->len);
 580                 return 1;
 581         }
 582
 583         /*
 584          * We haven't seen this chunk before.  Our caller is surely
 585          * going to add it the hard way now.  Remember the most likely
 586          * start of the to-be-added chunk: the current end of the
 587          * struct strbuf.
 588          */
 589         chunk->off = sb->len;
 590         return 0;
 591 }
 592
 593 static void parse_commit_header(struct format_commit_context *context)
 594 {
 595         const char *msg = context->message;
 596         int i;
 597
 598         for (i = 0; msg[i]; i++) {
 599                 int eol;
 600                 for (eol = i; msg[eol] && msg[eol] != '\n'; eol++)
 601                         ; /* do nothing */
 602
 603                 if (i == eol) {
 604                         break;
 605                 } else if (!prefixcmp(msg + i, "author ")) {
 606                         context->author.off = i + 7;
 607                         context->author.len = eol - i - 7;
 608                 } else if (!prefixcmp(msg + i, "committer ")) {
 609                         context->committer.off = i + 10;
 610                         context->committer.len = eol - i - 10;
 611                 } else if (!prefixcmp(msg + i, "encoding ")) {
 612                         context->encoding.off = i + 9;
 613                         context->encoding.len = eol - i - 9;
 614                 }
 615                 i = eol;
 616         }
 617         context->message_off = i;
 618         context->commit_header_parsed = 1;
 619 }
 620
 621 static int istitlechar(char c)
 622 {
 623         return (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z') ||
 624                 (c >= '0' && c <= '9') || c == '.' || c == '_';
 625 }
 626
 627 static void format_sanitized_subject(struct strbuf *sb, const char *msg)
 628 {
 629         size_t trimlen;
 630         size_t start_len = sb->len;
 631         int space = 2;
 632
 633         for (; *msg && *msg != '\n'; msg++) {
 634                 if (istitlechar(*msg)) {
 635                         if (space == 1)
 636                                 strbuf_addch(sb, '-');
 637                         space = 0;
 638                         strbuf_addch(sb, *msg);
 639                         if (*msg == '.')
 640                                 while (*(msg+1) == '.')
 641                                         msg++;
 642                 } else
 643                         space |= 1;
 644         }
 645
 646         /* trim any trailing '.' or '-' characters */
 647         trimlen = 0;
 648         while (sb->len - trimlen > start_len &&
 649                 (sb->buf[sb->len - 1 - trimlen] == '.'
 650                 || sb->buf[sb->len - 1 - trimlen] == '-'))
 651                 trimlen++;
 652         strbuf_remove(sb, sb->len - trimlen, trimlen);
 653 }
 654
 655 const char *format_subject(struct strbuf *sb, const char *msg,
 656                            const char *line_separator)
 657 {
 658         int first = 1;
 659
 660         for (;;) {
 661                 const char *line = msg;
 662                 int linelen = get_one_line(line);
 663
 664                 msg += linelen;
 665                 if (!linelen || is_empty_line(line, &linelen))
 666                         break;
 667
 668                 if (!sb)
 669                         continue;
 670                 strbuf_grow(sb, linelen + 2);
 671                 if (!first)
 672                         strbuf_addstr(sb, line_separator);
 673                 strbuf_add(sb, line, linelen);
 674                 first = 0;
 675         }
 676         return msg;
 677 }
 678
 679 static void parse_commit_message(struct format_commit_context *c)
 680 {
 681         const char *msg = c->message + c->message_off;
 682         const char *start = c->message;
 683
 684         msg = skip_empty_lines(msg);
 685         c->subject_off = msg - start;
 686
 687         msg = format_subject(NULL, msg, NULL);
 688         msg = skip_empty_lines(msg);
 689         c->body_off = msg - start;
 690
 691         c->commit_message_parsed = 1;
 692 }
 693
 694 static void format_decoration(struct strbuf *sb, const struct commit *commit)
 695 {
 696         struct name_decoration *d;
 697         const char *prefix = " (";
 698
 699         load_ref_decorations(DECORATE_SHORT_REFS);
 700         d = lookup_decoration(&name_decoration, &commit->object);
 701         while (d) {
 702                 strbuf_addstr(sb, prefix);
 703                 prefix = ", ";
 704                 strbuf_addstr(sb, d->name);
 705                 d = d->next;
 706         }
 707         if (prefix[0] == ',')
 708                 strbuf_addch(sb, ')');
 709 }
 710
 711 static void strbuf_wrap(struct strbuf *sb, size_t pos,
 712                         size_t width, size_t indent1, size_t indent2)
 713 {
 714         struct strbuf tmp = STRBUF_INIT;
 715
 716         if (pos)
 717                 strbuf_add(&tmp, sb->buf, pos);
 718         strbuf_add_wrapped_text(&tmp, sb->buf + pos,
 719                                 (int) indent1, (int) indent2, (int) width);
 720         strbuf_swap(&tmp, sb);
 721         strbuf_release(&tmp);
 722 }
 723
 724 static void rewrap_message_tail(struct strbuf *sb,
 725                                 struct format_commit_context *c,
 726                                 size_t new_width, size_t new_indent1,
 727                                 size_t new_indent2)
 728 {
 729         if (c->width == new_width && c->indent1 == new_indent1 &&
 730             c->indent2 == new_indent2)
 731                 return;
 732         if (c->wrap_start < sb->len)
 733                 strbuf_wrap(sb, c->wrap_start, c->width, c->indent1, c->indent2);
 734         c->wrap_start = sb->len;
 735         c->width = new_width;
 736         c->indent1 = new_indent1;
 737         c->indent2 = new_indent2;
 738 }
 739
 740 static size_t format_commit_one(struct strbuf *sb, const char *placeholder,
 741                                 void *context)
 742 {
 743         struct format_commit_context *c = context;
 744         const struct commit *commit = c->commit;
 745         const char *msg = c->message;
 746         struct commit_list *p;
 747         int h1, h2;
 748
 749         /* these are independent of the commit */
 750         switch (placeholder[0]) {
 751         case 'C':
 752                 if (placeholder[1] == '(') {
 753                         const char *end = strchr(placeholder + 2, ')');
 754                         char color[COLOR_MAXLEN];
 755                         if (!end)
 756                                 return 0;
 757                         color_parse_mem(placeholder + 2,
 758                                         end - (placeholder + 2),
 759                                         "--pretty format", color);
 760                         strbuf_addstr(sb, color);
 761                         return end - placeholder + 1;
 762                 }
 763                 if (!prefixcmp(placeholder + 1, "red")) {
 764                         strbuf_addstr(sb, GIT_COLOR_RED);
 765                         return 4;
 766                 } else if (!prefixcmp(placeholder + 1, "green")) {
 767                         strbuf_addstr(sb, GIT_COLOR_GREEN);
 768                         return 6;
 769                 } else if (!prefixcmp(placeholder + 1, "blue")) {
 770                         strbuf_addstr(sb, GIT_COLOR_BLUE);
 771                         return 5;
 772                 } else if (!prefixcmp(placeholder + 1, "reset")) {
 773                         strbuf_addstr(sb, GIT_COLOR_RESET);
 774                         return 6;
 775                 } else
 776                         return 0;
 777         case 'n':               /* newline */
 778                 strbuf_addch(sb, '\n');
 779                 return 1;
 780         case 'x':
 781                 /* %x00 == NUL, %x0a == LF, etc. */
 782                 if (0 <= (h1 = hexval_table[0xff & placeholder[1]]) &&
 783                     h1 <= 16 &&
 784                     0 <= (h2 = hexval_table[0xff & placeholder[2]]) &&
 785                     h2 <= 16) {
 786                         strbuf_addch(sb, (h1<<4)|h2);
 787                         return 3;
 788                 } else
 789                         return 0;
 790         case 'w':
 791                 if (placeholder[1] == '(') {
 792                         unsigned long width = 0, indent1 = 0, indent2 = 0;
 793                         char *next;
 794                         const char *start = placeholder + 2;
 795                         const char *end = strchr(start, ')');
 796                         if (!end)
 797                                 return 0;
 798                         if (end > start) {
 799                                 width = strtoul(start, &next, 10);
 800                                 if (*next == ',') {
 801                                         indent1 = strtoul(next + 1, &next, 10);
 802                                         if (*next == ',') {
 803                                                 indent2 = strtoul(next + 1,
 804                                                                  &next, 10);
 805                                         }
 806                                 }
 807                                 if (*next != ')')
 808                                         return 0;
 809                         }
 810                         rewrap_message_tail(sb, c, width, indent1, indent2);
 811                         return end - placeholder + 1;
 812                 } else
 813                         return 0;
 814         }
 815
 816         /* these depend on the commit */
 817         if (!commit->object.parsed)
 818                 parse_object(commit->object.sha1);
 819
 820         switch (placeholder[0]) {
 821         case 'H':               /* commit hash */
 822                 strbuf_addstr(sb, sha1_to_hex(commit->object.sha1));
 823                 return 1;
 824         case 'h':               /* abbreviated commit hash */
 825                 if (add_again(sb, &c->abbrev_commit_hash))
 826                         return 1;
 827                 strbuf_addstr(sb, find_unique_abbrev(commit->object.sha1,
 828                                                      c->pretty_ctx->abbrev));
 829                 c->abbrev_commit_hash.len = sb->len - c->abbrev_commit_hash.off;
 830                 return 1;
 831         case 'T':               /* tree hash */
 832                 strbuf_addstr(sb, sha1_to_hex(commit->tree->object.sha1));
 833                 return 1;
 834         case 't':               /* abbreviated tree hash */
 835                 if (add_again(sb, &c->abbrev_tree_hash))
 836                         return 1;
 837                 strbuf_addstr(sb, find_unique_abbrev(commit->tree->object.sha1,
 838                                                      c->pretty_ctx->abbrev));
 839                 c->abbrev_tree_hash.len = sb->len - c->abbrev_tree_hash.off;
 840                 return 1;
 841         case 'P':               /* parent hashes */
 842                 for (p = commit->parents; p; p = p->next) {
 843                         if (p != commit->parents)
 844                                 strbuf_addch(sb, ' ');
 845                         strbuf_addstr(sb, sha1_to_hex(p->item->object.sha1));
 846                 }
 847                 return 1;
 848         case 'p':               /* abbreviated parent hashes */
 849                 if (add_again(sb, &c->abbrev_parent_hashes))
 850                         return 1;
 851                 for (p = commit->parents; p; p = p->next) {
 852                         if (p != commit->parents)
 853                                 strbuf_addch(sb, ' ');
 854                         strbuf_addstr(sb, find_unique_abbrev(
 855                                         p->item->object.sha1,
 856                                         c->pretty_ctx->abbrev));
 857                 }
 858                 c->abbrev_parent_hashes.len = sb->len -
 859                                               c->abbrev_parent_hashes.off;
 860                 return 1;
 861         case 'm':               /* left/right/bottom */
 862                 strbuf_addstr(sb, get_revision_mark(NULL, commit));
 863                 return 1;
 864         case 'd':
 865                 format_decoration(sb, commit);
 866                 return 1;
 867         case 'g':               /* reflog info */
 868                 switch(placeholder[1]) {
 869                 case 'd':       /* reflog selector */
 870                 case 'D':
 871                         if (c->pretty_ctx->reflog_info)
 872                                 get_reflog_selector(sb,
 873                                                     c->pretty_ctx->reflog_info,
 874                                                     c->pretty_ctx->date_mode,
 875                                                     (placeholder[1] == 'd'));
 876                         return 2;
 877                 case 's':       /* reflog message */
 878                         if (c->pretty_ctx->reflog_info)
 879                                 get_reflog_message(sb, c->pretty_ctx->reflog_info);
 880                         return 2;
 881                 }
 882                 return 0;       /* unknown %g placeholder */
 883         case 'N':
 884                 if (c->pretty_ctx->show_notes) {
 885                         format_display_notes(commit->object.sha1, sb,
 886                                     get_log_output_encoding(), 0);
 887                         return 1;
 888                 }
 889                 return 0;
 890         }
 891
 892         /* For the rest we have to parse the commit header. */
 893         if (!c->commit_header_parsed)
 894                 parse_commit_header(c);
 895
 896         switch (placeholder[0]) {
 897         case 'a':       /* author ... */
 898                 return format_person_part(sb, placeholder[1],
 899                                    msg + c->author.off, c->author.len,
 900                                    c->pretty_ctx->date_mode);
 901         case 'c':       /* committer ... */
 902                 return format_person_part(sb, placeholder[1],
 903                                    msg + c->committer.off, c->committer.len,
 904                                    c->pretty_ctx->date_mode);
 905         case 'e':       /* encoding */
 906                 strbuf_add(sb, msg + c->encoding.off, c->encoding.len);
 907                 return 1;
 908         case 'B':       /* raw body */
 909                 /* message_off is always left at the initial newline */
 910                 strbuf_addstr(sb, msg + c->message_off + 1);
 911                 return 1;
 912         }
 913
 914         /* Now we need to parse the commit message. */
 915         if (!c->commit_message_parsed)
 916                 parse_commit_message(c);
 917
 918         switch (placeholder[0]) {
 919         case 's':       /* subject */
 920                 format_subject(sb, msg + c->subject_off, " ");
 921                 return 1;
 922         case 'f':       /* sanitized subject */
 923                 format_sanitized_subject(sb, msg + c->subject_off);
 924                 return 1;
 925         case 'b':       /* body */
 926                 strbuf_addstr(sb, msg + c->body_off);
 927                 return 1;
 928         }
 929         return 0;       /* unknown placeholder */
 930 }
 931
 932 static size_t format_commit_item(struct strbuf *sb, const char *placeholder,
 933                                  void *context)
 934 {
 935         int consumed;
 936         size_t orig_len;
 937         enum {
 938                 NO_MAGIC,
 939                 ADD_LF_BEFORE_NON_EMPTY,
 940                 DEL_LF_BEFORE_EMPTY,
 941                 ADD_SP_BEFORE_NON_EMPTY
 942         } magic = NO_MAGIC;
 943
 944         switch (placeholder[0]) {
 945         case '-':
 946                 magic = DEL_LF_BEFORE_EMPTY;
 947                 break;
 948         case '+':
 949                 magic = ADD_LF_BEFORE_NON_EMPTY;
 950                 break;
 951         case ' ':
 952                 magic = ADD_SP_BEFORE_NON_EMPTY;
 953                 break;
 954         default:
 955                 break;
 956         }
 957         if (magic != NO_MAGIC)
 958                 placeholder++;
 959
 960         orig_len = sb->len;
 961         consumed = format_commit_one(sb, placeholder, context);
 962         if (magic == NO_MAGIC)
 963                 return consumed;
 964
 965         if ((orig_len == sb->len) && magic == DEL_LF_BEFORE_EMPTY) {
 966                 while (sb->len && sb->buf[sb->len - 1] == '\n')
 967                         strbuf_setlen(sb, sb->len - 1);
 968         } else if (orig_len != sb->len) {
 969                 if (magic == ADD_LF_BEFORE_NON_EMPTY)
 970                         strbuf_insert(sb, orig_len, "\n", 1);
 971                 else if (magic == ADD_SP_BEFORE_NON_EMPTY)
 972                         strbuf_insert(sb, orig_len, " ", 1);
 973         }
 974         return consumed + 1;
 975 }
 976
 977 static size_t userformat_want_item(struct strbuf *sb, const char *placeholder,
 978                                    void *context)
 979 {
 980         struct userformat_want *w = context;
 981
 982         if (*placeholder == '+' || *placeholder == '-' || *placeholder == ' ')
 983                 placeholder++;
 984
 985         switch (*placeholder) {
 986         case 'N':
 987                 w->notes = 1;
 988                 break;
 989         }
 990         return 0;
 991 }
 992
 993 void userformat_find_requirements(const char *fmt, struct userformat_want *w)
 994 {
 995         struct strbuf dummy = STRBUF_INIT;
 996
 997         if (!fmt) {
 998                 if (!user_format)
 999                         return;
1000                 fmt = user_format;
1001         }
1002         strbuf_expand(&dummy, user_format, userformat_want_item, w);
1003         strbuf_release(&dummy);
1004 }
1005
1006 void format_commit_message(const struct commit *commit,
1007                            const char *format, struct strbuf *sb,
1008                            const struct pretty_print_context *pretty_ctx)
1009 {
1010         struct format_commit_context context;
1011         static const char utf8[] = "UTF-8";
1012         const char *enc;
1013         const char *output_enc = pretty_ctx->output_encoding;
1014
1015         memset(&context, 0, sizeof(context));
1016         context.commit = commit;
1017         context.pretty_ctx = pretty_ctx;
1018         context.wrap_start = sb->len;
1019         context.message = commit->buffer;
1020         if (output_enc) {
1021                 enc = get_header(commit, "encoding");
1022                 enc = enc ? enc : utf8;
1023                 if (strcmp(enc, output_enc))
1024                         context.message = logmsg_reencode(commit, output_enc);
1025         }
1026
1027         strbuf_expand(sb, format, format_commit_item, &context);
1028         rewrap_message_tail(sb, &context, 0, 0, 0);
1029
1030         if (context.message != commit->buffer)
1031                 free(context.message);
1032 }
1033
1034 static void pp_header(enum cmit_fmt fmt,
1035                       int abbrev,
1036                       enum date_mode dmode,
1037                       const char *encoding,
1038                       const struct commit *commit,
1039                       const char **msg_p,
1040                       struct strbuf *sb)
1041 {
1042         int parents_shown = 0;
1043
1044         for (;;) {
1045                 const char *line = *msg_p;
1046                 int linelen = get_one_line(*msg_p);
1047
1048                 if (!linelen)
1049                         return;
1050                 *msg_p += linelen;
1051
1052                 if (linelen == 1)
1053                         /* End of header */
1054                         return;
1055
1056                 if (fmt == CMIT_FMT_RAW) {
1057                         strbuf_add(sb, line, linelen);
1058                         continue;
1059                 }
1060
1061                 if (!memcmp(line, "parent ", 7)) {
1062                         if (linelen != 48)
1063                                 die("bad parent line in commit");
1064                         continue;
1065                 }
1066
1067                 if (!parents_shown) {
1068                         struct commit_list *parent;
1069                         int num;
1070                         for (parent = commit->parents, num = 0;
1071                              parent;
1072                              parent = parent->next, num++)
1073                                 ;
1074                         /* with enough slop */
1075                         strbuf_grow(sb, num * 50 + 20);
1076                         add_merge_info(fmt, sb, commit, abbrev);
1077                         parents_shown = 1;
1078                 }
1079
1080                 /*
1081                  * MEDIUM == DEFAULT shows only author with dates.
1082                  * FULL shows both authors but not dates.
1083                  * FULLER shows both authors and dates.
1084                  */
1085                 if (!memcmp(line, "author ", 7)) {
1086                         strbuf_grow(sb, linelen + 80);
1087                         pp_user_info("Author", fmt, sb, line + 7, dmode, encoding);
1088                 }
1089                 if (!memcmp(line, "committer ", 10) &&
1090                     (fmt == CMIT_FMT_FULL || fmt == CMIT_FMT_FULLER)) {
1091                         strbuf_grow(sb, linelen + 80);
1092                         pp_user_info("Commit", fmt, sb, line + 10, dmode, encoding);
1093                 }
1094         }
1095 }
1096
1097 void pp_title_line(enum cmit_fmt fmt,
1098                    const char **msg_p,
1099                    struct strbuf *sb,
1100                    const char *subject,
1101                    const char *after_subject,
1102                    const char *encoding,
1103                    int need_8bit_cte)
1104 {
1105         const char *line_separator = (fmt == CMIT_FMT_EMAIL) ? "\n " : " ";
1106         struct strbuf title;
1107
1108         strbuf_init(&title, 80);
1109         *msg_p = format_subject(&title, *msg_p, line_separator);
1110
1111         strbuf_grow(sb, title.len + 1024);
1112         if (subject) {
1113                 strbuf_addstr(sb, subject);
1114                 add_rfc2047(sb, title.buf, title.len, encoding);
1115         } else {
1116                 strbuf_addbuf(sb, &title);
1117         }
1118         strbuf_addch(sb, '\n');
1119
1120         if (need_8bit_cte > 0) {
1121                 const char *header_fmt =
1122                         "MIME-Version: 1.0\n"
1123                         "Content-Type: text/plain; charset=%s\n"
1124                         "Content-Transfer-Encoding: 8bit\n";
1125                 strbuf_addf(sb, header_fmt, encoding);
1126         }
1127         if (after_subject) {
1128                 strbuf_addstr(sb, after_subject);
1129         }
1130         if (fmt == CMIT_FMT_EMAIL) {
1131                 strbuf_addch(sb, '\n');
1132         }
1133         strbuf_release(&title);
1134 }
1135
1136 void pp_remainder(enum cmit_fmt fmt,
1137                   const char **msg_p,
1138                   struct strbuf *sb,
1139                   int indent)
1140 {
1141         int first = 1;
1142         for (;;) {
1143                 const char *line = *msg_p;
1144                 int linelen = get_one_line(line);
1145                 *msg_p += linelen;
1146
1147                 if (!linelen)
1148                         break;
1149
1150                 if (is_empty_line(line, &linelen)) {
1151                         if (first)
1152                                 continue;
1153                         if (fmt == CMIT_FMT_SHORT)
1154                                 break;
1155                 }
1156                 first = 0;
1157
1158                 strbuf_grow(sb, linelen + indent + 20);
1159                 if (indent) {
1160                         memset(sb->buf + sb->len, ' ', indent);
1161                         strbuf_setlen(sb, sb->len + indent);
1162                 }
1163                 strbuf_add(sb, line, linelen);
1164                 strbuf_addch(sb, '\n');
1165         }
1166 }
1167
/*
 * Re-encode the message of `commit` into the log output encoding.
 *
 * If `encoding_p` is non-NULL, the encoding obtained from
 * get_log_output_encoding() is stored through it.  The return value is
 * whatever logmsg_reencode() returns for that encoding.
 */
char *reencode_commit_message(const struct commit *commit, const char **encoding_p)
{
        const char *output_encoding = get_log_output_encoding();

        if (encoding_p != NULL)
                *encoding_p = output_encoding;

        return logmsg_reencode(commit, output_encoding);
}
1177
1178 void pretty_print_commit(enum cmit_fmt fmt, const struct commit *commit,
1179                          struct strbuf *sb,
1180                          const struct pretty_print_context *context)
1181 {
1182         unsigned long beginning_of_body;
1183         int indent = 4;
1184         const char *msg = commit->buffer;
1185         char *reencoded;
1186         const char *encoding;
1187         int need_8bit_cte = context->need_8bit_cte;
1188
1189         if (fmt == CMIT_FMT_USERFORMAT) {
1190                 format_commit_message(commit, user_format, sb, context);
1191                 return;
1192         }
1193
1194         reencoded = reencode_commit_message(commit, &encoding);
1195         if (reencoded) {
1196                 msg = reencoded;
1197         }
1198
1199         if (fmt == CMIT_FMT_ONELINE || fmt == CMIT_FMT_EMAIL)
1200                 indent = 0;
1201
1202         /*
1203          * We need to check and emit Content-type: to mark it
1204          * as 8-bit if we haven't done so.
1205          */
1206         if (fmt == CMIT_FMT_EMAIL && need_8bit_cte == 0) {
1207                 int i, ch, in_body;
1208
1209                 for (in_body = i = 0; (ch = msg[i]); i++) {
1210                         if (!in_body) {
1211                                 /* author could be non 7-bit ASCII but
1212                                  * the log may be so; skip over the
1213                                  * header part first.
1214                                  */
1215                                 if (ch == '\n' && msg[i+1] == '\n')
1216                                         in_body = 1;
1217                         }
1218                         else if (non_ascii(ch)) {
1219                                 need_8bit_cte = 1;
1220                                 break;
1221                         }
1222                 }
1223         }
1224
1225         pp_header(fmt, context->abbrev, context->date_mode, encoding,
1226                   commit, &msg, sb);
1227         if (fmt != CMIT_FMT_ONELINE && !context->subject) {
1228                 strbuf_addch(sb, '\n');
1229         }
1230
1231         /* Skip excess blank lines at the beginning of body, if any... */
1232         msg = skip_empty_lines(msg);
1233
1234         /* These formats treat the title line specially. */
1235         if (fmt == CMIT_FMT_ONELINE || fmt == CMIT_FMT_EMAIL)
1236                 pp_title_line(fmt, &msg, sb, context->subject,
1237                               context->after_subject, encoding, need_8bit_cte);
1238
1239         beginning_of_body = sb->len;
1240         if (fmt != CMIT_FMT_ONELINE)
1241                 pp_remainder(fmt, &msg, sb, indent);
1242         strbuf_rtrim(sb);
1243
1244         /* Make sure there is an EOLN for the non-oneline case */
1245         if (fmt != CMIT_FMT_ONELINE)
1246                 strbuf_addch(sb, '\n');
1247
1248         /*
1249          * The caller may append additional body text in e-mail
1250          * format.  Make sure we did not strip the blank line
1251          * between the header and the body.
1252          */
1253         if (fmt == CMIT_FMT_EMAIL && sb->len <= beginning_of_body)
1254                 strbuf_addch(sb, '\n');
1255
1256         if (context->show_notes)
1257                 format_display_notes(commit->object.sha1, sb, encoding,
1258                                      NOTES_SHOW_HEADER | NOTES_INDENT);
1259
1260         free(reencoded);
1261 }