pretty.c

   1 #define USE_THE_REPOSITORY_VARIABLE
   2
   3 #include "git-compat-util.h"
   4 #include "config.h"
   5 #include "commit.h"
   6 #include "environment.h"
   7 #include "gettext.h"
   8 #include "hash.h"
   9 #include "hex.h"
  10 #include "utf8.h"
  11 #include "diff.h"
  12 #include "pager.h"
  13 #include "revision.h"
  14 #include "string-list.h"
  15 #include "mailmap.h"
  16 #include "log-tree.h"
  17 #include "notes.h"
  18 #include "color.h"
  19 #include "reflog-walk.h"
  20 #include "gpg-interface.h"
  21 #include "trailer.h"
  22 #include "run-command.h"
  23 #include "object-name.h"
  24
  25 /*
  26  * The limit for formatting directives, which enable the caller to append
  27  * arbitrarily many bytes to the formatted buffer. This includes padding
  28  * and wrapping formatters.
  29  */
  30 #define FORMATTING_LIMIT (16 * 1024)
  31
  32 static char *user_format;
  33 static struct cmt_fmt_map {
  34         const char *name;
  35         enum cmit_fmt format;
  36         int is_tformat;
  37         int expand_tabs_in_log;
  38         int is_alias;
  39         enum date_mode_type default_date_mode_type;
  40         const char *user_format;
  41 } *commit_formats;
  42 static size_t builtin_formats_len;
  43 static size_t commit_formats_len;
  44 static size_t commit_formats_alloc;
  45 static struct cmt_fmt_map *find_commit_format(const char *sought);
  46
  47 int commit_format_is_empty(enum cmit_fmt fmt)
  48 {
  49         return fmt == CMIT_FMT_USERFORMAT && !*user_format;
  50 }
  51
  52 static void save_user_format(struct rev_info *rev, const char *cp, int is_tformat)
  53 {
  54         free(user_format);
  55         user_format = xstrdup(cp);
  56         if (is_tformat)
  57                 rev->use_terminator = 1;
  58         rev->commit_format = CMIT_FMT_USERFORMAT;
  59 }
  60
  61 static int git_pretty_formats_config(const char *var, const char *value,
  62                                      const struct config_context *ctx UNUSED,
  63                                      void *cb UNUSED)
  64 {
  65         struct cmt_fmt_map *commit_format = NULL;
  66         const char *name;
  67         char *fmt;
  68         int i;
  69
  70         if (!skip_prefix(var, "pretty.", &name))
  71                 return 0;
  72
  73         for (i = 0; i < builtin_formats_len; i++) {
  74                 if (!strcmp(commit_formats[i].name, name))
  75                         return 0;
  76         }
  77
  78         for (i = builtin_formats_len; i < commit_formats_len; i++) {
  79                 if (!strcmp(commit_formats[i].name, name)) {
  80                         commit_format = &commit_formats[i];
  81                         break;
  82                 }
  83         }
  84
  85         if (!commit_format) {
  86                 ALLOC_GROW(commit_formats, commit_formats_len+1,
  87                            commit_formats_alloc);
  88                 commit_format = &commit_formats[commit_formats_len];
  89                 memset(commit_format, 0, sizeof(*commit_format));
  90                 commit_formats_len++;
  91         }
  92
  93         commit_format->name = xstrdup(name);
  94         commit_format->format = CMIT_FMT_USERFORMAT;
  95         if (git_config_string(&fmt, var, value))
  96                 return -1;
  97
  98         if (skip_prefix(fmt, "format:", &commit_format->user_format)) {
  99                 commit_format->is_tformat = 0;
 100         } else if (skip_prefix(fmt, "tformat:", &commit_format->user_format)) {
 101                 commit_format->is_tformat = 1;
 102         } else if (strchr(fmt, '%')) {
 103                 commit_format->is_tformat = 1;
 104                 commit_format->user_format = fmt;
 105         } else {
 106                 commit_format->is_alias = 1;
 107                 commit_format->user_format = fmt;
 108         }
 109
 110         return 0;
 111 }
 112
 113 static void setup_commit_formats(void)
 114 {
 115         struct cmt_fmt_map builtin_formats[] = {
 116                 { "raw",        CMIT_FMT_RAW,           0,      0 },
 117                 { "medium",     CMIT_FMT_MEDIUM,        0,      8 },
 118                 { "short",      CMIT_FMT_SHORT,         0,      0 },
 119                 { "email",      CMIT_FMT_EMAIL,         0,      0 },
 120                 { "mboxrd",     CMIT_FMT_MBOXRD,        0,      0 },
 121                 { "fuller",     CMIT_FMT_FULLER,        0,      8 },
 122                 { "full",       CMIT_FMT_FULL,          0,      8 },
 123                 { "oneline",    CMIT_FMT_ONELINE,       1,      0 },
 124                 { "reference",  CMIT_FMT_USERFORMAT,    1,      0,
 125                         0, DATE_SHORT, "%C(auto)%h (%s, %ad)" },
 126                 /*
 127                  * Please update $__git_log_pretty_formats in
 128                  * git-completion.bash when you add new formats.
 129                  */
 130         };
 131         commit_formats_len = ARRAY_SIZE(builtin_formats);
 132         builtin_formats_len = commit_formats_len;
 133         ALLOC_GROW(commit_formats, commit_formats_len, commit_formats_alloc);
 134         COPY_ARRAY(commit_formats, builtin_formats,
 135                    ARRAY_SIZE(builtin_formats));
 136
 137         git_config(git_pretty_formats_config, NULL);
 138 }
 139
 140 static struct cmt_fmt_map *find_commit_format_recursive(const char *sought,
 141                                                         const char *original,
 142                                                         int num_redirections)
 143 {
 144         struct cmt_fmt_map *found = NULL;
 145         size_t found_match_len = 0;
 146         int i;
 147
 148         if (num_redirections >= commit_formats_len)
 149                 die("invalid --pretty format: "
 150                     "'%s' references an alias which points to itself",
 151                     original);
 152
 153         for (i = 0; i < commit_formats_len; i++) {
 154                 size_t match_len;
 155
 156                 if (!istarts_with(commit_formats[i].name, sought))
 157                         continue;
 158
 159                 match_len = strlen(commit_formats[i].name);
 160                 if (found == NULL || found_match_len > match_len) {
 161                         found = &commit_formats[i];
 162                         found_match_len = match_len;
 163                 }
 164         }
 165
 166         if (found && found->is_alias) {
 167                 found = find_commit_format_recursive(found->user_format,
 168                                                      original,
 169                                                      num_redirections+1);
 170         }
 171
 172         return found;
 173 }
 174
 175 static struct cmt_fmt_map *find_commit_format(const char *sought)
 176 {
 177         if (!commit_formats)
 178                 setup_commit_formats();
 179
 180         return find_commit_format_recursive(sought, sought, 0);
 181 }
 182
 183 void get_commit_format(const char *arg, struct rev_info *rev)
 184 {
 185         struct cmt_fmt_map *commit_format;
 186
 187         rev->use_terminator = 0;
 188         if (!arg) {
 189                 rev->commit_format = CMIT_FMT_DEFAULT;
 190                 return;
 191         }
 192         if (skip_prefix(arg, "format:", &arg)) {
 193                 save_user_format(rev, arg, 0);
 194                 return;
 195         }
 196
 197         if (!*arg || skip_prefix(arg, "tformat:", &arg) || strchr(arg, '%')) {
 198                 save_user_format(rev, arg, 1);
 199                 return;
 200         }
 201
 202         commit_format = find_commit_format(arg);
 203         if (!commit_format)
 204                 die("invalid --pretty format: %s", arg);
 205
 206         rev->commit_format = commit_format->format;
 207         rev->use_terminator = commit_format->is_tformat;
 208         rev->expand_tabs_in_log_default = commit_format->expand_tabs_in_log;
 209         if (!rev->date_mode_explicit && commit_format->default_date_mode_type)
 210                 rev->date_mode.type = commit_format->default_date_mode_type;
 211         if (commit_format->format == CMIT_FMT_USERFORMAT) {
 212                 save_user_format(rev, commit_format->user_format,
 213                                  commit_format->is_tformat);
 214         }
 215 }
 216
 217 /*
 218  * Generic support for pretty-printing the header
 219  */
 220 static int get_one_line(const char *msg)
 221 {
 222         int ret = 0;
 223
 224         for (;;) {
 225                 char c = *msg++;
 226                 if (!c)
 227                         break;
 228                 ret++;
 229                 if (c == '\n')
 230                         break;
 231         }
 232         return ret;
 233 }
 234
 235 /* High bit set, or ISO-2022-INT */
 236 static int non_ascii(int ch)
 237 {
 238         return !isascii(ch) || ch == '\033';
 239 }
 240
 241 int has_non_ascii(const char *s)
 242 {
 243         int ch;
 244         if (!s)
 245                 return 0;
 246         while ((ch = *s++) != '\0') {
 247                 if (non_ascii(ch))
 248                         return 1;
 249         }
 250         return 0;
 251 }
 252
 253 static int is_rfc822_special(char ch)
 254 {
 255         switch (ch) {
 256         case '(':
 257         case ')':
 258         case '<':
 259         case '>':
 260         case '[':
 261         case ']':
 262         case ':':
 263         case ';':
 264         case '@':
 265         case ',':
 266         case '.':
 267         case '"':
 268         case '\\':
 269                 return 1;
 270         default:
 271                 return 0;
 272         }
 273 }
 274
 275 static int needs_rfc822_quoting(const char *s, int len)
 276 {
 277         int i;
 278         for (i = 0; i < len; i++)
 279                 if (is_rfc822_special(s[i]))
 280                         return 1;
 281         return 0;
 282 }
 283
 284 static int last_line_length(struct strbuf *sb)
 285 {
 286         int i;
 287
 288         /* How many bytes are already used on the last line? */
 289         for (i = sb->len - 1; i >= 0; i--)
 290                 if (sb->buf[i] == '\n')
 291                         break;
 292         return sb->len - (i + 1);
 293 }
 294
 295 static void add_rfc822_quoted(struct strbuf *out, const char *s, int len)
 296 {
 297         int i;
 298
 299         /* just a guess, we may have to also backslash-quote */
 300         strbuf_grow(out, len + 2);
 301
 302         strbuf_addch(out, '"');
 303         for (i = 0; i < len; i++) {
 304                 switch (s[i]) {
 305                 case '"':
 306                 case '\\':
 307                         strbuf_addch(out, '\\');
 308                         /* fall through */
 309                 default:
 310                         strbuf_addch(out, s[i]);
 311                 }
 312         }
 313         strbuf_addch(out, '"');
 314 }
 315
 316 enum rfc2047_type {
 317         RFC2047_SUBJECT,
 318         RFC2047_ADDRESS
 319 };
 320
 321 static int is_rfc2047_special(char ch, enum rfc2047_type type)
 322 {
 323         /*
 324          * rfc2047, section 4.2:
 325          *
 326          *    8-bit values which correspond to printable ASCII characters other
 327          *    than "=", "?", and "_" (underscore), MAY be represented as those
 328          *    characters.  (But see section 5 for restrictions.)  In
 329          *    particular, SPACE and TAB MUST NOT be represented as themselves
 330          *    within encoded words.
 331          */
 332
 333         /*
 334          * rule out non-ASCII characters and non-printable characters (the
 335          * non-ASCII check should be redundant as isprint() is not localized
 336          * and only knows about ASCII, but be defensive about that)
 337          */
 338         if (non_ascii(ch) || !isprint(ch))
 339                 return 1;
 340
 341         /*
 342          * rule out special printable characters (' ' should be the only
 343          * whitespace character considered printable, but be defensive and use
 344          * isspace())
 345          */
 346         if (isspace(ch) || ch == '=' || ch == '?' || ch == '_')
 347                 return 1;
 348
 349         /*
 350          * rfc2047, section 5.3:
 351          *
 352          *    As a replacement for a 'word' entity within a 'phrase', for example,
 353          *    one that precedes an address in a From, To, or Cc header.  The ABNF
 354          *    definition for 'phrase' from RFC 822 thus becomes:
 355          *
 356          *    phrase = 1*( encoded-word / word )
 357          *
 358          *    In this case the set of characters that may be used in a "Q"-encoded
 359          *    'encoded-word' is restricted to: <upper and lower case ASCII
 360          *    letters, decimal digits, "!", "*", "+", "-", "/", "=", and "_"
 361          *    (underscore, ASCII 95.)>.  An 'encoded-word' that appears within a
 362          *    'phrase' MUST be separated from any adjacent 'word', 'text' or
 363          *    'special' by 'linear-white-space'.
 364          */
 365
 366         if (type != RFC2047_ADDRESS)
 367                 return 0;
 368
 369         /* '=' and '_' are special cases and have been checked above */
 370         return !(isalnum(ch) || ch == '!' || ch == '*' || ch == '+' || ch == '-' || ch == '/');
 371 }
 372
 373 static int needs_rfc2047_encoding(const char *line, int len)
 374 {
 375         int i;
 376
 377         for (i = 0; i < len; i++) {
 378                 int ch = line[i];
 379                 if (non_ascii(ch) || ch == '\n')
 380                         return 1;
 381                 if ((i + 1 < len) && (ch == '=' && line[i+1] == '?'))
 382                         return 1;
 383         }
 384
 385         return 0;
 386 }
 387
 388 static void add_rfc2047(struct strbuf *sb, const char *line, size_t len,
 389                        const char *encoding, enum rfc2047_type type)
 390 {
 391         static const int max_encoded_length = 76; /* per rfc2047 */
 392         int i;
 393         int line_len = last_line_length(sb);
 394
 395         strbuf_grow(sb, len * 3 + strlen(encoding) + 100);
 396         strbuf_addf(sb, "=?%s?q?", encoding);
 397         line_len += strlen(encoding) + 5; /* 5 for =??q? */
 398
 399         while (len) {
 400                 /*
 401                  * RFC 2047, section 5 (3):
 402                  *
 403                  * Each 'encoded-word' MUST represent an integral number of
 404                  * characters.  A multi-octet character may not be split across
 405                  * adjacent 'encoded- word's.
 406                  */
 407                 const unsigned char *p = (const unsigned char *)line;
 408                 int chrlen = mbs_chrlen(&line, &len, encoding);
 409                 int is_special = (chrlen > 1) || is_rfc2047_special(*p, type);
 410
 411                 /* "=%02X" * chrlen, or the byte itself */
 412                 const char *encoded_fmt = is_special ? "=%02X"    : "%c";
 413                 int         encoded_len = is_special ? 3 * chrlen : 1;
 414
 415                 /*
 416                  * According to RFC 2047, we could encode the special character
 417                  * ' ' (space) with '_' (underscore) for readability. But many
 418                  * programs do not understand this and just leave the
 419                  * underscore in place. Thus, we do nothing special here, which
 420                  * causes ' ' to be encoded as '=20', avoiding this problem.
 421                  */
 422
 423                 if (line_len + encoded_len + 2 > max_encoded_length) {
 424                         /* It won't fit with trailing "?=" --- break the line */
 425                         strbuf_addf(sb, "?=\n =?%s?q?", encoding);
 426                         line_len = strlen(encoding) + 5 + 1; /* =??q? plus SP */
 427                 }
 428
 429                 for (i = 0; i < chrlen; i++)
 430                         strbuf_addf(sb, encoded_fmt, p[i]);
 431                 line_len += encoded_len;
 432         }
 433         strbuf_addstr(sb, "?=");
 434 }
 435
 436 const char *show_ident_date(const struct ident_split *ident,
 437                             struct date_mode mode)
 438 {
 439         timestamp_t date = 0;
 440         long tz = 0;
 441
 442         if (ident->date_begin && ident->date_end)
 443                 date = parse_timestamp(ident->date_begin, NULL, 10);
 444         if (date_overflows(date))
 445                 date = 0;
 446         else {
 447                 if (ident->tz_begin && ident->tz_end)
 448                         tz = strtol(ident->tz_begin, NULL, 10);
 449                 if (tz >= INT_MAX || tz <= INT_MIN)
 450                         tz = 0;
 451         }
 452         return show_date(date, tz, mode);
 453 }
 454
 455 static inline void strbuf_add_with_color(struct strbuf *sb, const char *color,
 456                                          const char *buf, size_t buflen)
 457 {
 458         strbuf_addstr(sb, color);
 459         strbuf_add(sb, buf, buflen);
 460         if (*color)
 461                 strbuf_addstr(sb, GIT_COLOR_RESET);
 462 }
 463
 464 static void append_line_with_color(struct strbuf *sb, struct grep_opt *opt,
 465                                    const char *line, size_t linelen,
 466                                    int color, enum grep_context ctx,
 467                                    enum grep_header_field field)
 468 {
 469         const char *buf, *eol, *line_color, *match_color;
 470         regmatch_t match;
 471         int eflags = 0;
 472
 473         buf = line;
 474         eol = buf + linelen;
 475
 476         if (!opt || !want_color(color) || opt->invert)
 477                 goto end;
 478
 479         line_color = opt->colors[GREP_COLOR_SELECTED];
 480         match_color = opt->colors[GREP_COLOR_MATCH_SELECTED];
 481
 482         while (grep_next_match(opt, buf, eol, ctx, &match, field, eflags)) {
 483                 if (match.rm_so == match.rm_eo)
 484                         break;
 485
 486                 strbuf_add_with_color(sb, line_color, buf, match.rm_so);
 487                 strbuf_add_with_color(sb, match_color, buf + match.rm_so,
 488                                       match.rm_eo - match.rm_so);
 489                 buf += match.rm_eo;
 490                 eflags = REG_NOTBOL;
 491         }
 492
 493         if (eflags)
 494                 strbuf_add_with_color(sb, line_color, buf, eol - buf);
 495         else {
 496 end:
 497                 strbuf_add(sb, buf, eol - buf);
 498         }
 499 }
 500
 501 static int use_in_body_from(const struct pretty_print_context *pp,
 502                             const struct ident_split *ident)
 503 {
 504         if (pp->rev && pp->rev->force_in_body_from)
 505                 return 1;
 506         if (ident_cmp(pp->from_ident, ident))
 507                 return 1;
 508         return 0;
 509 }
 510
 511 void pp_user_info(struct pretty_print_context *pp,
 512                   const char *what, struct strbuf *sb,
 513                   const char *line, const char *encoding)
 514 {
 515         struct ident_split ident;
 516         char *line_end;
 517         const char *mailbuf, *namebuf;
 518         size_t namelen, maillen;
 519         int max_length = 78; /* per rfc2822 */
 520
 521         if (pp->fmt == CMIT_FMT_ONELINE)
 522                 return;
 523
 524         line_end = strchrnul(line, '\n');
 525         if (split_ident_line(&ident, line, line_end - line))
 526                 return;
 527
 528         mailbuf = ident.mail_begin;
 529         maillen = ident.mail_end - ident.mail_begin;
 530         namebuf = ident.name_begin;
 531         namelen = ident.name_end - ident.name_begin;
 532
 533         if (pp->mailmap)
 534                 map_user(pp->mailmap, &mailbuf, &maillen, &namebuf, &namelen);
 535
 536         if (cmit_fmt_is_mail(pp->fmt)) {
 537                 if (pp->from_ident && use_in_body_from(pp, &ident)) {
 538                         struct strbuf buf = STRBUF_INIT;
 539
 540                         strbuf_addstr(&buf, "From: ");
 541                         strbuf_add(&buf, namebuf, namelen);
 542                         strbuf_addstr(&buf, " <");
 543                         strbuf_add(&buf, mailbuf, maillen);
 544                         strbuf_addstr(&buf, ">\n");
 545                         string_list_append(&pp->in_body_headers,
 546                                            strbuf_detach(&buf, NULL));
 547
 548                         mailbuf = pp->from_ident->mail_begin;
 549                         maillen = pp->from_ident->mail_end - mailbuf;
 550                         namebuf = pp->from_ident->name_begin;
 551                         namelen = pp->from_ident->name_end - namebuf;
 552                 }
 553
 554                 strbuf_addstr(sb, "From: ");
 555                 if (pp->encode_email_headers &&
 556                     needs_rfc2047_encoding(namebuf, namelen)) {
 557                         add_rfc2047(sb, namebuf, namelen,
 558                                     encoding, RFC2047_ADDRESS);
 559                         max_length = 76; /* per rfc2047 */
 560                 } else if (needs_rfc822_quoting(namebuf, namelen)) {
 561                         struct strbuf quoted = STRBUF_INIT;
 562                         add_rfc822_quoted(&quoted, namebuf, namelen);
 563                         strbuf_add_wrapped_bytes(sb, quoted.buf, quoted.len,
 564                                                         -6, 1, max_length);
 565                         strbuf_release(&quoted);
 566                 } else {
 567                         strbuf_add_wrapped_bytes(sb, namebuf, namelen,
 568                                                  -6, 1, max_length);
 569                 }
 570
 571                 if (max_length <
 572                     last_line_length(sb) + strlen(" <") + maillen + strlen(">"))
 573                         strbuf_addch(sb, '\n');
 574                 strbuf_addf(sb, " <%.*s>\n", (int)maillen, mailbuf);
 575         } else {
 576                 struct strbuf id = STRBUF_INIT;
 577                 enum grep_header_field field = GREP_HEADER_FIELD_MAX;
 578                 struct grep_opt *opt = pp->rev ? &pp->rev->grep_filter : NULL;
 579
 580                 if (!strcmp(what, "Author"))
 581                         field = GREP_HEADER_AUTHOR;
 582                 else if (!strcmp(what, "Commit"))
 583                         field = GREP_HEADER_COMMITTER;
 584
 585                 strbuf_addf(sb, "%s: ", what);
 586                 if (pp->fmt == CMIT_FMT_FULLER)
 587                         strbuf_addchars(sb, ' ', 4);
 588
 589                 strbuf_addf(&id, "%.*s <%.*s>", (int)namelen, namebuf,
 590                             (int)maillen, mailbuf);
 591
 592                 append_line_with_color(sb, opt, id.buf, id.len, pp->color,
 593                                        GREP_CONTEXT_HEAD, field);
 594                 strbuf_addch(sb, '\n');
 595                 strbuf_release(&id);
 596         }
 597
 598         switch (pp->fmt) {
 599         case CMIT_FMT_MEDIUM:
 600                 strbuf_addf(sb, "Date:   %s\n",
 601                             show_ident_date(&ident, pp->date_mode));
 602                 break;
 603         case CMIT_FMT_EMAIL:
 604         case CMIT_FMT_MBOXRD:
 605                 strbuf_addf(sb, "Date: %s\n",
 606                             show_ident_date(&ident, DATE_MODE(RFC2822)));
 607                 break;
 608         case CMIT_FMT_FULLER:
 609                 strbuf_addf(sb, "%sDate: %s\n", what,
 610                             show_ident_date(&ident, pp->date_mode));
 611                 break;
 612         default:
 613                 /* notin' */
 614                 break;
 615         }
 616 }
 617
 618 static int is_blank_line(const char *line, int *len_p)
 619 {
 620         int len = *len_p;
 621         while (len && isspace(line[len - 1]))
 622                 len--;
 623         *len_p = len;
 624         return !len;
 625 }
 626
 627 const char *skip_blank_lines(const char *msg)
 628 {
 629         for (;;) {
 630                 int linelen = get_one_line(msg);
 631                 int ll = linelen;
 632                 if (!linelen)
 633                         break;
 634                 if (!is_blank_line(msg, &ll))
 635                         break;
 636                 msg += linelen;
 637         }
 638         return msg;
 639 }
 640
 641 static void add_merge_info(const struct pretty_print_context *pp,
 642                            struct strbuf *sb, const struct commit *commit)
 643 {
 644         struct commit_list *parent = commit->parents;
 645
 646         if ((pp->fmt == CMIT_FMT_ONELINE) || (cmit_fmt_is_mail(pp->fmt)) ||
 647             !parent || !parent->next)
 648                 return;
 649
 650         strbuf_addstr(sb, "Merge:");
 651
 652         while (parent) {
 653                 struct object_id *oidp = &parent->item->object.oid;
 654                 strbuf_addch(sb, ' ');
 655                 if (pp->abbrev)
 656                         strbuf_add_unique_abbrev(sb, oidp, pp->abbrev);
 657                 else
 658                         strbuf_addstr(sb, oid_to_hex(oidp));
 659                 parent = parent->next;
 660         }
 661         strbuf_addch(sb, '\n');
 662 }
 663
 664 static char *get_header(const char *msg, const char *key)
 665 {
 666         size_t len;
 667         const char *v = find_commit_header(msg, key, &len);
 668         return v ? xmemdupz(v, len) : NULL;
 669 }
 670
 671 static char *replace_encoding_header(char *buf, const char *encoding)
 672 {
 673         struct strbuf tmp = STRBUF_INIT;
 674         size_t start, len;
 675         char *cp = buf;
 676
 677         /* guess if there is an encoding header before a \n\n */
 678         while (!starts_with(cp, "encoding ")) {
 679                 cp = strchr(cp, '\n');
 680                 if (!cp || *++cp == '\n')
 681                         return buf;
 682         }
 683         start = cp - buf;
 684         cp = strchr(cp, '\n');
 685         if (!cp)
 686                 return buf; /* should not happen but be defensive */
 687         len = cp + 1 - (buf + start);
 688
 689         strbuf_attach(&tmp, buf, strlen(buf), strlen(buf) + 1);
 690         if (is_encoding_utf8(encoding)) {
 691                 /* we have re-coded to UTF-8; drop the header */
 692                 strbuf_remove(&tmp, start, len);
 693         } else {
 694                 /* just replaces XXXX in 'encoding XXXX\n' */
 695                 strbuf_splice(&tmp, start + strlen("encoding "),
 696                                           len - strlen("encoding \n"),
 697                                           encoding, strlen(encoding));
 698         }
 699         return strbuf_detach(&tmp, NULL);
 700 }
 701
 702 const char *repo_logmsg_reencode(struct repository *r,
 703                                  const struct commit *commit,
 704                                  char **commit_encoding,
 705                                  const char *output_encoding)
 706 {
 707         static const char *utf8 = "UTF-8";
 708         const char *use_encoding;
 709         char *encoding;
 710         const char *msg = repo_get_commit_buffer(r, commit, NULL);
 711         char *out;
 712
 713         if (!output_encoding || !*output_encoding) {
 714                 if (commit_encoding)
 715                         *commit_encoding = get_header(msg, "encoding");
 716                 return msg;
 717         }
 718         encoding = get_header(msg, "encoding");
 719         if (commit_encoding)
 720                 *commit_encoding = encoding;
 721         use_encoding = encoding ? encoding : utf8;
 722         if (same_encoding(use_encoding, output_encoding)) {
 723                 /*
 724                  * No encoding work to be done. If we have no encoding header
 725                  * at all, then there's nothing to do, and we can return the
 726                  * message verbatim (whether newly allocated or not).
 727                  */
 728                 if (!encoding)
 729                         return msg;
 730
 731                 /*
 732                  * Otherwise, we still want to munge the encoding header in the
 733                  * result, which will be done by modifying the buffer. If we
 734                  * are using a fresh copy, we can reuse it. But if we are using
 735                  * the cached copy from repo_get_commit_buffer, we need to duplicate it
 736                  * to avoid munging the cached copy.
 737                  */
 738                 if (msg == get_cached_commit_buffer(r, commit, NULL))
 739                         out = xstrdup(msg);
 740                 else
 741                         out = (char *)msg;
 742         }
 743         else {
 744                 /*
 745                  * There's actual encoding work to do. Do the reencoding, which
 746                  * still leaves the header to be replaced in the next step. At
 747                  * this point, we are done with msg. If we allocated a fresh
 748                  * copy, we can free it.
 749                  */
 750                 out = reencode_string(msg, output_encoding, use_encoding);
 751                 if (out)
 752                         repo_unuse_commit_buffer(r, commit, msg);
 753         }
 754
 755         /*
 756          * This replacement actually consumes the buffer we hand it, so we do
 757          * not have to worry about freeing the old "out" here.
 758          */
 759         if (out)
 760                 out = replace_encoding_header(out, output_encoding);
 761
 762         if (!commit_encoding)
 763                 free(encoding);
 764         /*
 765          * If the re-encoding failed, out might be NULL here; in that
 766          * case we just return the commit message verbatim.
 767          */
 768         return out ? out : msg;
 769 }
 770
 771 static int mailmap_name(const char **email, size_t *email_len,
 772                         const char **name, size_t *name_len)
 773 {
 774         static struct string_list *mail_map;
 775         if (!mail_map) {
 776                 CALLOC_ARRAY(mail_map, 1);
 777                 read_mailmap(mail_map);
 778         }
 779         return mail_map->nr && map_user(mail_map, email, email_len, name, name_len);
 780 }
 781
 782 static size_t format_person_part(struct strbuf *sb, char part,
 783                                  const char *msg, int len,
 784                                  struct date_mode dmode)
 785 {
 786         /* currently all placeholders have same length */
 787         const int placeholder_len = 2;
 788         struct ident_split s;
 789         const char *name, *mail;
 790         size_t maillen, namelen;
 791
 792         if (split_ident_line(&s, msg, len) < 0)
 793                 goto skip;
 794
 795         name = s.name_begin;
 796         namelen = s.name_end - s.name_begin;
 797         mail = s.mail_begin;
 798         maillen = s.mail_end - s.mail_begin;
 799
 800         if (part == 'N' || part == 'E' || part == 'L') /* mailmap lookup */
 801                 mailmap_name(&mail, &maillen, &name, &namelen);
 802         if (part == 'n' || part == 'N') {       /* name */
 803                 strbuf_add(sb, name, namelen);
 804                 return placeholder_len;
 805         }
 806         if (part == 'e' || part == 'E') {       /* email */
 807                 strbuf_add(sb, mail, maillen);
 808                 return placeholder_len;
 809         }
 810         if (part == 'l' || part == 'L') {       /* local-part */
 811                 const char *at = memchr(mail, '@', maillen);
 812                 if (at)
 813                         maillen = at - mail;
 814                 strbuf_add(sb, mail, maillen);
 815                 return placeholder_len;
 816         }
 817
 818         if (!s.date_begin)
 819                 goto skip;
 820
 821         if (part == 't') {      /* date, UNIX timestamp */
 822                 strbuf_add(sb, s.date_begin, s.date_end - s.date_begin);
 823                 return placeholder_len;
 824         }
 825
 826         switch (part) {
 827         case 'd':       /* date */
 828                 strbuf_addstr(sb, show_ident_date(&s, dmode));
 829                 return placeholder_len;
 830         case 'D':       /* date, RFC2822 style */
 831                 strbuf_addstr(sb, show_ident_date(&s, DATE_MODE(RFC2822)));
 832                 return placeholder_len;
 833         case 'r':       /* date, relative */
 834                 strbuf_addstr(sb, show_ident_date(&s, DATE_MODE(RELATIVE)));
 835                 return placeholder_len;
 836         case 'i':       /* date, ISO 8601-like */
 837                 strbuf_addstr(sb, show_ident_date(&s, DATE_MODE(ISO8601)));
 838                 return placeholder_len;
 839         case 'I':       /* date, ISO 8601 strict */
 840                 strbuf_addstr(sb, show_ident_date(&s, DATE_MODE(ISO8601_STRICT)));
 841                 return placeholder_len;
 842         case 'h':       /* date, human */
 843                 strbuf_addstr(sb, show_ident_date(&s, DATE_MODE(HUMAN)));
 844                 return placeholder_len;
 845         case 's':
 846                 strbuf_addstr(sb, show_ident_date(&s, DATE_MODE(SHORT)));
 847                 return placeholder_len;
 848         }
 849
 850 skip:
 851         /*
 852          * reading from either a bogus commit, or a reflog entry with
 853          * %gn, %ge, etc.; 'sb' cannot be updated, but we still need
 854          * to compute a valid return value.
 855          */
 856         if (part == 'n' || part == 'e' || part == 't' || part == 'd'
 857             || part == 'D' || part == 'r' || part == 'i')
 858                 return placeholder_len;
 859
 860         return 0; /* unknown placeholder */
 861 }
 862
 863 struct chunk {
 864         size_t off;
 865         size_t len;
 866 };
 867
 868 enum flush_type {
 869         no_flush,
 870         flush_right,
 871         flush_left,
 872         flush_left_and_steal,
 873         flush_both
 874 };
 875
 876 enum trunc_type {
 877         trunc_none,
 878         trunc_left,
 879         trunc_middle,
 880         trunc_right
 881 };
 882
 883 struct format_commit_context {
 884         struct repository *repository;
 885         const struct commit *commit;
 886         const struct pretty_print_context *pretty_ctx;
 887         unsigned commit_header_parsed:1;
 888         unsigned commit_message_parsed:1;
 889         struct signature_check signature_check;
 890         enum flush_type flush_type;
 891         enum trunc_type truncate;
 892         const char *message;
 893         char *commit_encoding;
 894         size_t width, indent1, indent2;
 895         int auto_color;
 896         int padding;
 897
 898         /* These offsets are relative to the start of the commit message. */
 899         struct chunk author;
 900         struct chunk committer;
 901         size_t message_off;
 902         size_t subject_off;
 903         size_t body_off;
 904
 905         /* The following ones are relative to the result struct strbuf. */
 906         size_t wrap_start;
 907 };
 908
 909 static void parse_commit_header(struct format_commit_context *context)
 910 {
 911         const char *msg = context->message;
 912         int i;
 913
 914         for (i = 0; msg[i]; i++) {
 915                 const char *name;
 916                 int eol;
 917                 for (eol = i; msg[eol] && msg[eol] != '\n'; eol++)
 918                         ; /* do nothing */
 919
 920                 if (i == eol) {
 921                         break;
 922                 } else if (skip_prefix(msg + i, "author ", &name)) {
 923                         context->author.off = name - msg;
 924                         context->author.len = msg + eol - name;
 925                 } else if (skip_prefix(msg + i, "committer ", &name)) {
 926                         context->committer.off = name - msg;
 927                         context->committer.len = msg + eol - name;
 928                 }
 929                 i = eol;
 930         }
 931         context->message_off = i;
 932         context->commit_header_parsed = 1;
 933 }
 934
 935 static int istitlechar(char c)
 936 {
 937         return (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z') ||
 938                 (c >= '0' && c <= '9') || c == '.' || c == '_';
 939 }
 940
 941 void format_sanitized_subject(struct strbuf *sb, const char *msg, size_t len)
 942 {
 943         size_t trimlen;
 944         size_t start_len = sb->len;
 945         int space = 2;
 946         int i;
 947
 948         for (i = 0; i < len; i++) {
 949                 if (istitlechar(msg[i])) {
 950                         if (space == 1)
 951                                 strbuf_addch(sb, '-');
 952                         space = 0;
 953                         strbuf_addch(sb, msg[i]);
 954                         if (msg[i] == '.')
 955                                 while (msg[i+1] == '.')
 956                                         i++;
 957                 } else
 958                         space |= 1;
 959         }
 960
 961         /* trim any trailing '.' or '-' characters */
 962         trimlen = 0;
 963         while (sb->len - trimlen > start_len &&
 964                 (sb->buf[sb->len - 1 - trimlen] == '.'
 965                 || sb->buf[sb->len - 1 - trimlen] == '-'))
 966                 trimlen++;
 967         strbuf_remove(sb, sb->len - trimlen, trimlen);
 968 }
 969
 970 const char *format_subject(struct strbuf *sb, const char *msg,
 971                            const char *line_separator)
 972 {
 973         int first = 1;
 974
 975         for (;;) {
 976                 const char *line = msg;
 977                 int linelen = get_one_line(line);
 978
 979                 msg += linelen;
 980                 if (!linelen || is_blank_line(line, &linelen))
 981                         break;
 982
 983                 if (!sb)
 984                         continue;
 985                 strbuf_grow(sb, linelen + 2);
 986                 if (!first)
 987                         strbuf_addstr(sb, line_separator);
 988                 strbuf_add(sb, line, linelen);
 989                 first = 0;
 990         }
 991         return msg;
 992 }
 993
 994 static void parse_commit_message(struct format_commit_context *c)
 995 {
 996         const char *msg = c->message + c->message_off;
 997         const char *start = c->message;
 998
 999         msg = skip_blank_lines(msg);
1000         c->subject_off = msg - start;
1001
1002         msg = format_subject(NULL, msg, NULL);
1003         msg = skip_blank_lines(msg);
1004         c->body_off = msg - start;
1005
1006         c->commit_message_parsed = 1;
1007 }
1008
1009 static void strbuf_wrap(struct strbuf *sb, size_t pos,
1010                         size_t width, size_t indent1, size_t indent2)
1011 {
1012         struct strbuf tmp = STRBUF_INIT;
1013
1014         if (pos)
1015                 strbuf_add(&tmp, sb->buf, pos);
1016         strbuf_add_wrapped_text(&tmp, sb->buf + pos,
1017                                 cast_size_t_to_int(indent1),
1018                                 cast_size_t_to_int(indent2),
1019                                 cast_size_t_to_int(width));
1020         strbuf_swap(&tmp, sb);
1021         strbuf_release(&tmp);
1022 }
1023
1024 static void rewrap_message_tail(struct strbuf *sb,
1025                                 struct format_commit_context *c,
1026                                 size_t new_width, size_t new_indent1,
1027                                 size_t new_indent2)
1028 {
1029         if (c->width == new_width && c->indent1 == new_indent1 &&
1030             c->indent2 == new_indent2)
1031                 return;
1032         if (c->wrap_start < sb->len)
1033                 strbuf_wrap(sb, c->wrap_start, c->width, c->indent1, c->indent2);
1034         c->wrap_start = sb->len;
1035         c->width = new_width;
1036         c->indent1 = new_indent1;
1037         c->indent2 = new_indent2;
1038 }
1039
1040 static int format_reflog_person(struct strbuf *sb,
1041                                 char part,
1042                                 struct reflog_walk_info *log,
1043                                 struct date_mode dmode)
1044 {
1045         const char *ident;
1046
1047         if (!log)
1048                 return 2;
1049
1050         ident = get_reflog_ident(log);
1051         if (!ident)
1052                 return 2;
1053
1054         return format_person_part(sb, part, ident, strlen(ident), dmode);
1055 }
1056
1057 static size_t parse_color(struct strbuf *sb, /* in UTF-8 */
1058                           const char *placeholder,
1059                           struct format_commit_context *c)
1060 {
1061         const char *rest = placeholder;
1062         const char *basic_color = NULL;
1063
1064         if (placeholder[1] == '(') {
1065                 const char *begin = placeholder + 2;
1066                 const char *end = strchr(begin, ')');
1067                 char color[COLOR_MAXLEN];
1068
1069                 if (!end)
1070                         return 0;
1071
1072                 if (skip_prefix(begin, "auto,", &begin)) {
1073                         if (!want_color(c->pretty_ctx->color))
1074                                 return end - placeholder + 1;
1075                 } else if (skip_prefix(begin, "always,", &begin)) {
1076                         /* nothing to do; we do not respect want_color at all */
1077                 } else {
1078                         /* the default is the same as "auto" */
1079                         if (!want_color(c->pretty_ctx->color))
1080                                 return end - placeholder + 1;
1081                 }
1082
1083                 if (color_parse_mem(begin, end - begin, color) < 0)
1084                         die(_("unable to parse --pretty format"));
1085                 strbuf_addstr(sb, color);
1086                 return end - placeholder + 1;
1087         }
1088
1089         /*
1090          * We handle things like "%C(red)" above; for historical reasons, there
1091          * are a few colors that can be specified without parentheses (and
1092          * they cannot support things like "auto" or "always" at all).
1093          */
1094         if (skip_prefix(placeholder + 1, "red", &rest))
1095                 basic_color = GIT_COLOR_RED;
1096         else if (skip_prefix(placeholder + 1, "green", &rest))
1097                 basic_color = GIT_COLOR_GREEN;
1098         else if (skip_prefix(placeholder + 1, "blue", &rest))
1099                 basic_color = GIT_COLOR_BLUE;
1100         else if (skip_prefix(placeholder + 1, "reset", &rest))
1101                 basic_color = GIT_COLOR_RESET;
1102
1103         if (basic_color && want_color(c->pretty_ctx->color))
1104                 strbuf_addstr(sb, basic_color);
1105
1106         return rest - placeholder;
1107 }
1108
1109 static size_t parse_padding_placeholder(const char *placeholder,
1110                                         struct format_commit_context *c)
1111 {
1112         const char *ch = placeholder;
1113         enum flush_type flush_type;
1114         int to_column = 0;
1115
1116         switch (*ch++) {
1117         case '<':
1118                 flush_type = flush_right;
1119                 break;
1120         case '>':
1121                 if (*ch == '<') {
1122                         flush_type = flush_both;
1123                         ch++;
1124                 } else if (*ch == '>') {
1125                         flush_type = flush_left_and_steal;
1126                         ch++;
1127                 } else
1128                         flush_type = flush_left;
1129                 break;
1130         default:
1131                 return 0;
1132         }
1133
1134         /* the next value means "wide enough to that column" */
1135         if (*ch == '|') {
1136                 to_column = 1;
1137                 ch++;
1138         }
1139
1140         if (*ch == '(') {
1141                 const char *start = ch + 1;
1142                 const char *end = start + strcspn(start, ",)");
1143                 char *next;
1144                 int width;
1145                 if (!*end || end == start)
1146                         return 0;
1147                 width = strtol(start, &next, 10);
1148
1149                 /*
1150                  * We need to limit the amount of padding, or otherwise this
1151                  * would allow the user to pad the buffer by arbitrarily many
1152                  * bytes and thus cause resource exhaustion.
1153                  */
1154                 if (width < -FORMATTING_LIMIT || width > FORMATTING_LIMIT)
1155                         return 0;
1156
1157                 if (next == start || width == 0)
1158                         return 0;
1159                 if (width < 0) {
1160                         if (to_column)
1161                                 width += term_columns();
1162                         if (width < 0)
1163                                 return 0;
1164                 }
1165                 c->padding = to_column ? -width : width;
1166                 c->flush_type = flush_type;
1167
1168                 if (*end == ',') {
1169                         start = end + 1;
1170                         end = strchr(start, ')');
1171                         if (!end || end == start)
1172                                 return 0;
1173                         if (starts_with(start, "trunc)"))
1174                                 c->truncate = trunc_right;
1175                         else if (starts_with(start, "ltrunc)"))
1176                                 c->truncate = trunc_left;
1177                         else if (starts_with(start, "mtrunc)"))
1178                                 c->truncate = trunc_middle;
1179                         else
1180                                 return 0;
1181                 } else
1182                         c->truncate = trunc_none;
1183
1184                 return end - placeholder + 1;
1185         }
1186         return 0;
1187 }
1188
1189 static int match_placeholder_arg_value(const char *to_parse, const char *candidate,
1190                                        const char **end, const char **valuestart,
1191                                        size_t *valuelen)
1192 {
1193         const char *p;
1194
1195         if (!(skip_prefix(to_parse, candidate, &p)))
1196                 return 0;
1197         if (valuestart) {
1198                 if (*p == '=') {
1199                         *valuestart = p + 1;
1200                         *valuelen = strcspn(*valuestart, ",)");
1201                         p = *valuestart + *valuelen;
1202                 } else {
1203                         if (*p != ',' && *p != ')')
1204                                 return 0;
1205                         *valuestart = NULL;
1206                         *valuelen = 0;
1207                 }
1208         }
1209         if (*p == ',') {
1210                 *end = p + 1;
1211                 return 1;
1212         }
1213         if (*p == ')') {
1214                 *end = p;
1215                 return 1;
1216         }
1217         return 0;
1218 }
1219
1220 static int match_placeholder_bool_arg(const char *to_parse, const char *candidate,
1221                                       const char **end, int *val)
1222 {
1223         const char *argval;
1224         char *strval;
1225         size_t arglen;
1226         int v;
1227
1228         if (!match_placeholder_arg_value(to_parse, candidate, end, &argval, &arglen))
1229                 return 0;
1230
1231         if (!argval) {
1232                 *val = 1;
1233                 return 1;
1234         }
1235
1236         strval = xstrndup(argval, arglen);
1237         v = git_parse_maybe_bool(strval);
1238         free(strval);
1239
1240         if (v == -1)
1241                 return 0;
1242
1243         *val = v;
1244
1245         return 1;
1246 }
1247
1248 static int format_trailer_match_cb(const struct strbuf *key, void *ud)
1249 {
1250         const struct string_list *list = ud;
1251         const struct string_list_item *item;
1252
1253         for_each_string_list_item (item, list) {
1254                 if (key->len == (uintptr_t)item->util &&
1255                     !strncasecmp(item->string, key->buf, key->len))
1256                         return 1;
1257         }
1258         return 0;
1259 }
1260
1261 static struct strbuf *expand_string_arg(struct strbuf *sb,
1262                                         const char *argval, size_t arglen)
1263 {
1264         char *fmt = xstrndup(argval, arglen);
1265         const char *format = fmt;
1266
1267         strbuf_reset(sb);
1268         while (strbuf_expand_step(sb, &format)) {
1269                 size_t len;
1270
1271                 if (skip_prefix(format, "%", &format))
1272                         strbuf_addch(sb, '%');
1273                 else if ((len = strbuf_expand_literal(sb, format)))
1274                         format += len;
1275                 else
1276                         strbuf_addch(sb, '%');
1277         }
1278         free(fmt);
1279         return sb;
1280 }
1281
1282 int format_set_trailers_options(struct process_trailer_options *opts,
1283                                 struct string_list *filter_list,
1284                                 struct strbuf *sepbuf,
1285                                 struct strbuf *kvsepbuf,
1286                                 const char **arg,
1287                                 char **invalid_arg)
1288 {
1289         for (;;) {
1290                 const char *argval;
1291                 size_t arglen;
1292
1293                 if (**arg == ')')
1294                         break;
1295
1296                 if (match_placeholder_arg_value(*arg, "key", arg, &argval, &arglen)) {
1297                         uintptr_t len = arglen;
1298
1299                         if (!argval)
1300                                 return -1;
1301
1302                         if (len && argval[len - 1] == ':')
1303                                 len--;
1304                         string_list_append(filter_list, argval)->util = (char *)len;
1305
1306                         opts->filter = format_trailer_match_cb;
1307                         opts->filter_data = filter_list;
1308                         opts->only_trailers = 1;
1309                 } else if (match_placeholder_arg_value(*arg, "separator", arg, &argval, &arglen)) {
1310                         opts->separator = expand_string_arg(sepbuf, argval, arglen);
1311                 } else if (match_placeholder_arg_value(*arg, "key_value_separator", arg, &argval, &arglen)) {
1312                         opts->key_value_separator = expand_string_arg(kvsepbuf, argval, arglen);
1313                 } else if (!match_placeholder_bool_arg(*arg, "only", arg, &opts->only_trailers) &&
1314                            !match_placeholder_bool_arg(*arg, "unfold", arg, &opts->unfold) &&
1315                            !match_placeholder_bool_arg(*arg, "keyonly", arg, &opts->key_only) &&
1316                            !match_placeholder_bool_arg(*arg, "valueonly", arg, &opts->value_only)) {
1317                         if (invalid_arg) {
1318                                 size_t len = strcspn(*arg, ",)");
1319                                 *invalid_arg = xstrndup(*arg, len);
1320                         }
1321                         return -1;
1322                 }
1323         }
1324         return 0;
1325 }
1326
1327 static size_t parse_describe_args(const char *start, struct strvec *args)
1328 {
1329         struct {
1330                 const char *name;
1331                 enum {
1332                         DESCRIBE_ARG_BOOL,
1333                         DESCRIBE_ARG_INTEGER,
1334                         DESCRIBE_ARG_STRING,
1335                 } type;
1336         }  option[] = {
1337                 { "tags", DESCRIBE_ARG_BOOL},
1338                 { "abbrev", DESCRIBE_ARG_INTEGER },
1339                 { "exclude", DESCRIBE_ARG_STRING },
1340                 { "match", DESCRIBE_ARG_STRING },
1341         };
1342         const char *arg = start;
1343
1344         for (;;) {
1345                 int found = 0;
1346                 const char *argval;
1347                 size_t arglen = 0;
1348                 int optval = 0;
1349                 int i;
1350
1351                 for (i = 0; !found && i < ARRAY_SIZE(option); i++) {
1352                         switch (option[i].type) {
1353                         case DESCRIBE_ARG_BOOL:
1354                                 if (match_placeholder_bool_arg(arg, option[i].name, &arg, &optval)) {
1355                                         if (optval)
1356                                                 strvec_pushf(args, "--%s", option[i].name);
1357                                         else
1358                                                 strvec_pushf(args, "--no-%s", option[i].name);
1359                                         found = 1;
1360                                 }
1361                                 break;
1362                         case DESCRIBE_ARG_INTEGER:
1363                                 if (match_placeholder_arg_value(arg, option[i].name, &arg,
1364                                                                 &argval, &arglen)) {
1365                                         char *endptr;
1366                                         if (!arglen)
1367                                                 return 0;
1368                                         strtol(argval, &endptr, 10);
1369                                         if (endptr - argval != arglen)
1370                                                 return 0;
1371                                         strvec_pushf(args, "--%s=%.*s", option[i].name, (int)arglen, argval);
1372                                         found = 1;
1373                                 }
1374                                 break;
1375                         case DESCRIBE_ARG_STRING:
1376                                 if (match_placeholder_arg_value(arg, option[i].name, &arg,
1377                                                                 &argval, &arglen)) {
1378                                         if (!arglen)
1379                                                 return 0;
1380                                         strvec_pushf(args, "--%s=%.*s", option[i].name, (int)arglen, argval);
1381                                         found = 1;
1382                                 }
1383                                 break;
1384                         }
1385                 }
1386                 if (!found)
1387                         break;
1388
1389         }
1390         return arg - start;
1391 }
1392
1393
1394 static int parse_decoration_option(const char **arg,
1395                                    const char *name,
1396                                    char **opt)
1397 {
1398         const char *argval;
1399         size_t arglen;
1400
1401         if (match_placeholder_arg_value(*arg, name, arg, &argval, &arglen)) {
1402                 struct strbuf sb = STRBUF_INIT;
1403
1404                 expand_string_arg(&sb, argval, arglen);
1405                 *opt = strbuf_detach(&sb, NULL);
1406                 return 1;
1407         }
1408         return 0;
1409 }
1410
1411 static void parse_decoration_options(const char **arg,
1412                                      struct decoration_options *opts)
1413 {
1414         while (parse_decoration_option(arg, "prefix", &opts->prefix) ||
1415                parse_decoration_option(arg, "suffix", &opts->suffix) ||
1416                parse_decoration_option(arg, "separator", &opts->separator) ||
1417                parse_decoration_option(arg, "pointer", &opts->pointer) ||
1418                parse_decoration_option(arg, "tag", &opts->tag))
1419                 ;
1420 }
1421
1422 static void free_decoration_options(const struct decoration_options *opts)
1423 {
1424         free(opts->prefix);
1425         free(opts->suffix);
1426         free(opts->separator);
1427         free(opts->pointer);
1428         free(opts->tag);
1429 }
1430
1431 static size_t format_commit_one(struct strbuf *sb, /* in UTF-8 */
1432                                 const char *placeholder,
1433                                 void *context)
1434 {
1435         struct format_commit_context *c = context;
1436         const struct commit *commit = c->commit;
1437         const char *msg = c->message;
1438         struct commit_list *p;
1439         const char *arg, *eol;
1440         size_t res;
1441         char **slot;
1442
1443         /* these are independent of the commit */
1444         res = strbuf_expand_literal(sb, placeholder);
1445         if (res)
1446                 return res;
1447
1448         switch (placeholder[0]) {
1449         case 'C':
1450                 if (starts_with(placeholder + 1, "(auto)")) {
1451                         c->auto_color = want_color(c->pretty_ctx->color);
1452                         if (c->auto_color && sb->len)
1453                                 strbuf_addstr(sb, GIT_COLOR_RESET);
1454                         return 7; /* consumed 7 bytes, "C(auto)" */
1455                 } else {
1456                         int ret = parse_color(sb, placeholder, c);
1457                         if (ret)
1458                                 c->auto_color = 0;
1459                         /*
1460                          * Otherwise, we decided to treat %C<unknown>
1461                          * as a literal string, and the previous
1462                          * %C(auto) is still valid.
1463                          */
1464                         return ret;
1465                 }
1466         case 'w':
1467                 if (placeholder[1] == '(') {
1468                         unsigned long width = 0, indent1 = 0, indent2 = 0;
1469                         char *next;
1470                         const char *start = placeholder + 2;
1471                         const char *end = strchr(start, ')');
1472                         if (!end)
1473                                 return 0;
1474                         if (end > start) {
1475                                 width = strtoul(start, &next, 10);
1476                                 if (*next == ',') {
1477                                         indent1 = strtoul(next + 1, &next, 10);
1478                                         if (*next == ',') {
1479                                                 indent2 = strtoul(next + 1,
1480                                                                  &next, 10);
1481                                         }
1482                                 }
1483                                 if (*next != ')')
1484                                         return 0;
1485                         }
1486
1487                         /*
1488                          * We need to limit the format here as it allows the
1489                          * user to prepend arbitrarily many bytes to the buffer
1490                          * when rewrapping.
1491                          */
1492                         if (width > FORMATTING_LIMIT ||
1493                             indent1 > FORMATTING_LIMIT ||
1494                             indent2 > FORMATTING_LIMIT)
1495                                 return 0;
1496                         rewrap_message_tail(sb, c, width, indent1, indent2);
1497                         return end - placeholder + 1;
1498                 } else
1499                         return 0;
1500
1501         case '<':
1502         case '>':
1503                 return parse_padding_placeholder(placeholder, c);
1504         }
1505
1506         if (skip_prefix(placeholder, "(describe", &arg)) {
1507                 struct child_process cmd = CHILD_PROCESS_INIT;
1508                 struct strbuf out = STRBUF_INIT;
1509                 struct strbuf err = STRBUF_INIT;
1510                 struct pretty_print_describe_status *describe_status;
1511
1512                 describe_status = c->pretty_ctx->describe_status;
1513                 if (describe_status) {
1514                         if (!describe_status->max_invocations)
1515                                 return 0;
1516                         describe_status->max_invocations--;
1517                 }
1518
1519                 cmd.git_cmd = 1;
1520                 strvec_push(&cmd.args, "describe");
1521
1522                 if (*arg == ':') {
1523                         arg++;
1524                         arg += parse_describe_args(arg, &cmd.args);
1525                 }
1526
1527                 if (*arg != ')') {
1528                         child_process_clear(&cmd);
1529                         return 0;
1530                 }
1531
1532                 strvec_push(&cmd.args, oid_to_hex(&commit->object.oid));
1533                 pipe_command(&cmd, NULL, 0, &out, 0, &err, 0);
1534                 strbuf_rtrim(&out);
1535                 strbuf_addbuf(sb, &out);
1536                 strbuf_release(&out);
1537                 strbuf_release(&err);
1538                 return arg - placeholder + 1;
1539         }
1540
1541         /* these depend on the commit */
1542         if (!commit->object.parsed)
1543                 parse_object(the_repository, &commit->object.oid);
1544
1545         switch (placeholder[0]) {
1546         case 'H':               /* commit hash */
1547                 strbuf_addstr(sb, diff_get_color(c->auto_color, DIFF_COMMIT));
1548                 strbuf_addstr(sb, oid_to_hex(&commit->object.oid));
1549                 strbuf_addstr(sb, diff_get_color(c->auto_color, DIFF_RESET));
1550                 return 1;
1551         case 'h':               /* abbreviated commit hash */
1552                 strbuf_addstr(sb, diff_get_color(c->auto_color, DIFF_COMMIT));
1553                 strbuf_add_unique_abbrev(sb, &commit->object.oid,
1554                                          c->pretty_ctx->abbrev);
1555                 strbuf_addstr(sb, diff_get_color(c->auto_color, DIFF_RESET));
1556                 return 1;
1557         case 'T':               /* tree hash */
1558                 strbuf_addstr(sb, oid_to_hex(get_commit_tree_oid(commit)));
1559                 return 1;
1560         case 't':               /* abbreviated tree hash */
1561                 strbuf_add_unique_abbrev(sb,
1562                                          get_commit_tree_oid(commit),
1563                                          c->pretty_ctx->abbrev);
1564                 return 1;
1565         case 'P':               /* parent hashes */
1566                 for (p = commit->parents; p; p = p->next) {
1567                         if (p != commit->parents)
1568                                 strbuf_addch(sb, ' ');
1569                         strbuf_addstr(sb, oid_to_hex(&p->item->object.oid));
1570                 }
1571                 return 1;
1572         case 'p':               /* abbreviated parent hashes */
1573                 for (p = commit->parents; p; p = p->next) {
1574                         if (p != commit->parents)
1575                                 strbuf_addch(sb, ' ');
1576                         strbuf_add_unique_abbrev(sb, &p->item->object.oid,
1577                                                  c->pretty_ctx->abbrev);
1578                 }
1579                 return 1;
1580         case 'm':               /* left/right/bottom */
1581                 strbuf_addstr(sb, get_revision_mark(NULL, commit));
1582                 return 1;
1583         case 'd':
1584                 format_decorations(sb, commit, c->auto_color, NULL);
1585                 return 1;
1586         case 'D':
1587                 {
1588                         const struct decoration_options opts = {
1589                                 .prefix = (char *) "",
1590                                 .suffix = (char *) "",
1591                         };
1592
1593                         format_decorations(sb, commit, c->auto_color, &opts);
1594                         return 1;
1595                 }
1596         case 'S':               /* tag/branch like --source */
1597                 if (!(c->pretty_ctx->rev && c->pretty_ctx->rev->sources))
1598                         return 0;
1599                 slot = revision_sources_at(c->pretty_ctx->rev->sources, commit);
1600                 if (!(slot && *slot))
1601                         return 0;
1602                 strbuf_addstr(sb, *slot);
1603                 return 1;
1604         case 'g':               /* reflog info */
1605                 switch(placeholder[1]) {
1606                 case 'd':       /* reflog selector */
1607                 case 'D':
1608                         if (c->pretty_ctx->reflog_info)
1609                                 get_reflog_selector(sb,
1610                                                     c->pretty_ctx->reflog_info,
1611                                                     c->pretty_ctx->date_mode,
1612                                                     c->pretty_ctx->date_mode_explicit,
1613                                                     (placeholder[1] == 'd'));
1614                         return 2;
1615                 case 's':       /* reflog message */
1616                         if (c->pretty_ctx->reflog_info)
1617                                 get_reflog_message(sb, c->pretty_ctx->reflog_info);
1618                         return 2;
1619                 case 'n':
1620                 case 'N':
1621                 case 'e':
1622                 case 'E':
1623                         return format_reflog_person(sb,
1624                                                     placeholder[1],
1625                                                     c->pretty_ctx->reflog_info,
1626                                                     c->pretty_ctx->date_mode);
1627                 }
1628                 return 0;       /* unknown %g placeholder */
1629         case 'N':
1630                 if (c->pretty_ctx->notes_message) {
1631                         strbuf_addstr(sb, c->pretty_ctx->notes_message);
1632                         return 1;
1633                 }
1634                 return 0;
1635         }
1636
1637         if (placeholder[0] == 'G') {
1638                 if (!c->signature_check.result)
1639                         check_commit_signature(c->commit, &(c->signature_check));
1640                 switch (placeholder[1]) {
1641                 case 'G':
1642                         if (c->signature_check.output)
1643                                 strbuf_addstr(sb, c->signature_check.output);
1644                         break;
1645                 case '?':
1646                         switch (c->signature_check.result) {
1647                         case 'G':
1648                                 switch (c->signature_check.trust_level) {
1649                                 case TRUST_UNDEFINED:
1650                                 case TRUST_NEVER:
1651                                         strbuf_addch(sb, 'U');
1652                                         break;
1653                                 default:
1654                                         strbuf_addch(sb, 'G');
1655                                         break;
1656                                 }
1657                                 break;
1658                         case 'B':
1659                         case 'E':
1660                         case 'N':
1661                         case 'X':
1662                         case 'Y':
1663                         case 'R':
1664                                 strbuf_addch(sb, c->signature_check.result);
1665                         }
1666                         break;
1667                 case 'S':
1668                         if (c->signature_check.signer)
1669                                 strbuf_addstr(sb, c->signature_check.signer);
1670                         break;
1671                 case 'K':
1672                         if (c->signature_check.key)
1673                                 strbuf_addstr(sb, c->signature_check.key);
1674                         break;
1675                 case 'F':
1676                         if (c->signature_check.fingerprint)
1677                                 strbuf_addstr(sb, c->signature_check.fingerprint);
1678                         break;
1679                 case 'P':
1680                         if (c->signature_check.primary_key_fingerprint)
1681                                 strbuf_addstr(sb, c->signature_check.primary_key_fingerprint);
1682                         break;
1683                 case 'T':
1684                         strbuf_addstr(sb, gpg_trust_level_to_str(c->signature_check.trust_level));
1685                         break;
1686                 default:
1687                         return 0;
1688                 }
1689                 return 2;
1690         }
1691
1692         if (skip_prefix(placeholder, "(decorate", &arg)) {
1693                 struct decoration_options opts = { NULL };
1694                 size_t ret = 0;
1695
1696                 if (*arg == ':') {
1697                         arg++;
1698                         parse_decoration_options(&arg, &opts);
1699                 }
1700                 if (*arg == ')') {
1701                         format_decorations(sb, commit, c->auto_color, &opts);
1702                         ret = arg - placeholder + 1;
1703                 }
1704
1705                 free_decoration_options(&opts);
1706                 return ret;
1707         }
1708
1709         /* For the rest we have to parse the commit header. */
1710         if (!c->commit_header_parsed) {
1711                 msg = c->message =
1712                         repo_logmsg_reencode(c->repository, commit,
1713                                              &c->commit_encoding, "UTF-8");
1714                 parse_commit_header(c);
1715         }
1716
1717         switch (placeholder[0]) {
1718         case 'a':       /* author ... */
1719                 return format_person_part(sb, placeholder[1],
1720                                    msg + c->author.off, c->author.len,
1721                                    c->pretty_ctx->date_mode);
1722         case 'c':       /* committer ... */
1723                 return format_person_part(sb, placeholder[1],
1724                                    msg + c->committer.off, c->committer.len,
1725                                    c->pretty_ctx->date_mode);
1726         case 'e':       /* encoding */
1727                 if (c->commit_encoding)
1728                         strbuf_addstr(sb, c->commit_encoding);
1729                 return 1;
1730         case 'B':       /* raw body */
1731                 /* message_off is always left at the initial newline */
1732                 strbuf_addstr(sb, msg + c->message_off + 1);
1733                 return 1;
1734         }
1735
1736         /* Now we need to parse the commit message. */
1737         if (!c->commit_message_parsed)
1738                 parse_commit_message(c);
1739
1740         switch (placeholder[0]) {
1741         case 's':       /* subject */
1742                 format_subject(sb, msg + c->subject_off, " ");
1743                 return 1;
1744         case 'f':       /* sanitized subject */
1745                 eol = strchrnul(msg + c->subject_off, '\n');
1746                 format_sanitized_subject(sb, msg + c->subject_off, eol - (msg + c->subject_off));
1747                 return 1;
1748         case 'b':       /* body */
1749                 strbuf_addstr(sb, msg + c->body_off);
1750                 return 1;
1751         }
1752
1753         if (skip_prefix(placeholder, "(trailers", &arg)) {
1754                 struct process_trailer_options opts = PROCESS_TRAILER_OPTIONS_INIT;
1755                 struct string_list filter_list = STRING_LIST_INIT_NODUP;
1756                 struct strbuf sepbuf = STRBUF_INIT;
1757                 struct strbuf kvsepbuf = STRBUF_INIT;
1758                 size_t ret = 0;
1759
1760                 opts.no_divider = 1;
1761
1762                 if (*arg == ':') {
1763                         arg++;
1764                         if (format_set_trailers_options(&opts, &filter_list, &sepbuf, &kvsepbuf, &arg, NULL))
1765                                 goto trailer_out;
1766                 }
1767                 if (*arg == ')') {
1768                         format_trailers_from_commit(&opts, msg + c->subject_off, sb);
1769                         ret = arg - placeholder + 1;
1770                 }
1771         trailer_out:
1772                 string_list_clear(&filter_list, 0);
1773                 strbuf_release(&sepbuf);
1774                 return ret;
1775         }
1776
1777         return 0;       /* unknown placeholder */
1778 }
1779
1780 static size_t format_and_pad_commit(struct strbuf *sb, /* in UTF-8 */
1781                                     const char *placeholder,
1782                                     struct format_commit_context *c)
1783 {
1784         struct strbuf local_sb = STRBUF_INIT;
1785         size_t total_consumed = 0;
1786         int len, padding = c->padding;
1787
1788         if (padding < 0) {
1789                 const char *start = strrchr(sb->buf, '\n');
1790                 int occupied;
1791                 if (!start)
1792                         start = sb->buf;
1793                 occupied = utf8_strnwidth(start, strlen(start), 1);
1794                 occupied += c->pretty_ctx->graph_width;
1795                 padding = (-padding) - occupied;
1796         }
1797         while (1) {
1798                 int modifier = *placeholder == 'C';
1799                 size_t consumed = format_commit_one(&local_sb, placeholder, c);
1800                 total_consumed += consumed;
1801
1802                 if (!modifier)
1803                         break;
1804
1805                 placeholder += consumed;
1806                 if (*placeholder != '%')
1807                         break;
1808                 placeholder++;
1809                 total_consumed++;
1810         }
1811         len = utf8_strnwidth(local_sb.buf, local_sb.len, 1);
1812
1813         if (c->flush_type == flush_left_and_steal) {
1814                 const char *ch = sb->buf + sb->len - 1;
1815                 while (len > padding && ch > sb->buf) {
1816                         const char *p;
1817                         if (*ch == ' ') {
1818                                 ch--;
1819                                 padding++;
1820                                 continue;
1821                         }
1822                         /* check for trailing ansi sequences */
1823                         if (*ch != 'm')
1824                                 break;
1825                         p = ch - 1;
1826                         while (p > sb->buf && ch - p < 10 && *p != '\033')
1827                                 p--;
1828                         if (*p != '\033' ||
1829                             ch + 1 - p != display_mode_esc_sequence_len(p))
1830                                 break;
1831                         /*
1832                          * got a good ansi sequence, put it back to
1833                          * local_sb as we're cutting sb
1834                          */
1835                         strbuf_insert(&local_sb, 0, p, ch + 1 - p);
1836                         ch = p - 1;
1837                 }
1838                 strbuf_setlen(sb, ch + 1 - sb->buf);
1839                 c->flush_type = flush_left;
1840         }
1841
1842         if (len > padding) {
1843                 switch (c->truncate) {
1844                 case trunc_left:
1845                         strbuf_utf8_replace(&local_sb,
1846                                             0, len - (padding - 2),
1847                                             "..");
1848                         break;
1849                 case trunc_middle:
1850                         strbuf_utf8_replace(&local_sb,
1851                                             padding / 2 - 1,
1852                                             len - (padding - 2),
1853                                             "..");
1854                         break;
1855                 case trunc_right:
1856                         strbuf_utf8_replace(&local_sb,
1857                                             padding - 2, len - (padding - 2),
1858                                             "..");
1859                         break;
1860                 case trunc_none:
1861                         break;
1862                 }
1863                 strbuf_addbuf(sb, &local_sb);
1864         } else {
1865                 size_t sb_len = sb->len, offset = 0;
1866                 if (c->flush_type == flush_left)
1867                         offset = padding - len;
1868                 else if (c->flush_type == flush_both)
1869                         offset = (padding - len) / 2;
1870                 /*
1871                  * we calculate padding in columns, now
1872                  * convert it back to chars
1873                  */
1874                 padding = padding - len + local_sb.len;
1875                 strbuf_addchars(sb, ' ', padding);
1876                 memcpy(sb->buf + sb_len + offset, local_sb.buf,
1877                        local_sb.len);
1878         }
1879         strbuf_release(&local_sb);
1880         c->flush_type = no_flush;
1881         return total_consumed;
1882 }
1883
1884 static size_t format_commit_item(struct strbuf *sb, /* in UTF-8 */
1885                                  const char *placeholder,
1886                                  struct format_commit_context *context)
1887 {
1888         size_t consumed, orig_len;
1889         enum {
1890                 NO_MAGIC,
1891                 ADD_LF_BEFORE_NON_EMPTY,
1892                 DEL_LF_BEFORE_EMPTY,
1893                 ADD_SP_BEFORE_NON_EMPTY
1894         } magic = NO_MAGIC;
1895
1896         switch (placeholder[0]) {
1897         case '-':
1898                 magic = DEL_LF_BEFORE_EMPTY;
1899                 break;
1900         case '+':
1901                 magic = ADD_LF_BEFORE_NON_EMPTY;
1902                 break;
1903         case ' ':
1904                 magic = ADD_SP_BEFORE_NON_EMPTY;
1905                 break;
1906         default:
1907                 break;
1908         }
1909         if (magic != NO_MAGIC) {
1910                 placeholder++;
1911
1912                 switch (placeholder[0]) {
1913                 case 'w':
1914                         /*
1915                          * `%+w()` cannot ever expand to a non-empty string,
1916                          * and it potentially changes the layout of preceding
1917                          * contents. We're thus not able to handle the magic in
1918                          * this combination and refuse the pattern.
1919                          */
1920                         return 0;
1921                 };
1922         }
1923
1924         orig_len = sb->len;
1925         if (context->flush_type == no_flush)
1926                 consumed = format_commit_one(sb, placeholder, context);
1927         else
1928                 consumed = format_and_pad_commit(sb, placeholder, context);
1929         if (magic == NO_MAGIC)
1930                 return consumed;
1931
1932         if ((orig_len == sb->len) && magic == DEL_LF_BEFORE_EMPTY) {
1933                 while (sb->len && sb->buf[sb->len - 1] == '\n')
1934                         strbuf_setlen(sb, sb->len - 1);
1935         } else if (orig_len != sb->len) {
1936                 if (magic == ADD_LF_BEFORE_NON_EMPTY)
1937                         strbuf_insertstr(sb, orig_len, "\n");
1938                 else if (magic == ADD_SP_BEFORE_NON_EMPTY)
1939                         strbuf_insertstr(sb, orig_len, " ");
1940         }
1941         return consumed + 1;
1942 }
1943
1944 void userformat_find_requirements(const char *fmt, struct userformat_want *w)
1945 {
1946         if (!fmt) {
1947                 if (!user_format)
1948                         return;
1949                 fmt = user_format;
1950         }
1951         while ((fmt = strchr(fmt, '%'))) {
1952                 fmt++;
1953                 if (skip_prefix(fmt, "%", &fmt))
1954                         continue;
1955
1956                 if (*fmt == '+' || *fmt == '-' || *fmt == ' ')
1957                         fmt++;
1958
1959                 switch (*fmt) {
1960                 case 'N':
1961                         w->notes = 1;
1962                         break;
1963                 case 'S':
1964                         w->source = 1;
1965                         break;
1966                 case 'd':
1967                 case 'D':
1968                         w->decorate = 1;
1969                         break;
1970                 case '(':
1971                         if (starts_with(fmt + 1, "decorate"))
1972                                 w->decorate = 1;
1973                         break;
1974                 }
1975         }
1976 }
1977
1978 void repo_format_commit_message(struct repository *r,
1979                                 const struct commit *commit,
1980                                 const char *format, struct strbuf *sb,
1981                                 const struct pretty_print_context *pretty_ctx)
1982 {
1983         struct format_commit_context context = {
1984                 .repository = r,
1985                 .commit = commit,
1986                 .pretty_ctx = pretty_ctx,
1987                 .wrap_start = sb->len
1988         };
1989         const char *output_enc = pretty_ctx->output_encoding;
1990         const char *utf8 = "UTF-8";
1991
1992         while (strbuf_expand_step(sb, &format)) {
1993                 size_t len;
1994
1995                 if (skip_prefix(format, "%", &format))
1996                         strbuf_addch(sb, '%');
1997                 else if ((len = format_commit_item(sb, format, &context)))
1998                         format += len;
1999                 else
2000                         strbuf_addch(sb, '%');
2001         }
2002         rewrap_message_tail(sb, &context, 0, 0, 0);
2003
2004         /*
2005          * Convert output to an actual output encoding; note that
2006          * format_commit_item() will always use UTF-8, so we don't
2007          * have to bother if that's what the output wants.
2008          */
2009         if (output_enc) {
2010                 if (same_encoding(utf8, output_enc))
2011                         output_enc = NULL;
2012         } else {
2013                 if (context.commit_encoding &&
2014                     !same_encoding(context.commit_encoding, utf8))
2015                         output_enc = context.commit_encoding;
2016         }
2017
2018         if (output_enc) {
2019                 size_t outsz;
2020                 char *out = reencode_string_len(sb->buf, sb->len,
2021                                                 output_enc, utf8, &outsz);
2022                 if (out)
2023                         strbuf_attach(sb, out, outsz, outsz + 1);
2024         }
2025
2026         free(context.commit_encoding);
2027         repo_unuse_commit_buffer(r, commit, context.message);
2028 }
2029
2030 static void pp_header(struct pretty_print_context *pp,
2031                       const char *encoding,
2032                       const struct commit *commit,
2033                       const char **msg_p,
2034                       struct strbuf *sb)
2035 {
2036         int parents_shown = 0;
2037
2038         for (;;) {
2039                 const char *name, *line = *msg_p;
2040                 int linelen = get_one_line(*msg_p);
2041
2042                 if (!linelen)
2043                         return;
2044                 *msg_p += linelen;
2045
2046                 if (linelen == 1)
2047                         /* End of header */
2048                         return;
2049
2050                 if (pp->fmt == CMIT_FMT_RAW) {
2051                         strbuf_add(sb, line, linelen);
2052                         continue;
2053                 }
2054
2055                 if (starts_with(line, "parent ")) {
2056                         if (linelen != the_hash_algo->hexsz + 8)
2057                                 die("bad parent line in commit");
2058                         continue;
2059                 }
2060
2061                 if (!parents_shown) {
2062                         unsigned num = commit_list_count(commit->parents);
2063                         /* with enough slop */
2064                         strbuf_grow(sb, num * (GIT_MAX_HEXSZ + 10) + 20);
2065                         add_merge_info(pp, sb, commit);
2066                         parents_shown = 1;
2067                 }
2068
2069                 /*
2070                  * MEDIUM == DEFAULT shows only author with dates.
2071                  * FULL shows both authors but not dates.
2072                  * FULLER shows both authors and dates.
2073                  */
2074                 if (skip_prefix(line, "author ", &name)) {
2075                         strbuf_grow(sb, linelen + 80);
2076                         pp_user_info(pp, "Author", sb, name, encoding);
2077                 }
2078                 if (skip_prefix(line, "committer ", &name) &&
2079                     (pp->fmt == CMIT_FMT_FULL || pp->fmt == CMIT_FMT_FULLER)) {
2080                         strbuf_grow(sb, linelen + 80);
2081                         pp_user_info(pp, "Commit", sb, name, encoding);
2082                 }
2083         }
2084 }
2085
2086 void pp_email_subject(struct pretty_print_context *pp,
2087                       const char **msg_p,
2088                       struct strbuf *sb,
2089                       const char *encoding,
2090                       int need_8bit_cte)
2091 {
2092         static const int max_length = 78; /* per rfc2047 */
2093         struct strbuf title;
2094
2095         strbuf_init(&title, 80);
2096         *msg_p = format_subject(&title, *msg_p,
2097                                 pp->preserve_subject ? "\n" : " ");
2098
2099         strbuf_grow(sb, title.len + 1024);
2100         fmt_output_email_subject(sb, pp->rev);
2101         if (pp->encode_email_headers &&
2102             needs_rfc2047_encoding(title.buf, title.len))
2103                 add_rfc2047(sb, title.buf, title.len,
2104                             encoding, RFC2047_SUBJECT);
2105         else
2106                 strbuf_add_wrapped_bytes(sb, title.buf, title.len,
2107                                          -last_line_length(sb), 1, max_length);
2108         strbuf_addch(sb, '\n');
2109
2110         if (need_8bit_cte == 0) {
2111                 int i;
2112                 for (i = 0; i < pp->in_body_headers.nr; i++) {
2113                         if (has_non_ascii(pp->in_body_headers.items[i].string)) {
2114                                 need_8bit_cte = 1;
2115                                 break;
2116                         }
2117                 }
2118         }
2119
2120         if (need_8bit_cte > 0) {
2121                 const char *header_fmt =
2122                         "MIME-Version: 1.0\n"
2123                         "Content-Type: text/plain; charset=%s\n"
2124                         "Content-Transfer-Encoding: 8bit\n";
2125                 strbuf_addf(sb, header_fmt, encoding);
2126         }
2127         if (pp->after_subject) {
2128                 strbuf_addstr(sb, pp->after_subject);
2129         }
2130
2131         strbuf_addch(sb, '\n');
2132
2133         if (pp->in_body_headers.nr) {
2134                 int i;
2135                 for (i = 0; i < pp->in_body_headers.nr; i++) {
2136                         strbuf_addstr(sb, pp->in_body_headers.items[i].string);
2137                         free(pp->in_body_headers.items[i].string);
2138                 }
2139                 string_list_clear(&pp->in_body_headers, 0);
2140                 strbuf_addch(sb, '\n');
2141         }
2142
2143         strbuf_release(&title);
2144 }
2145
2146 static int pp_utf8_width(const char *start, const char *end)
2147 {
2148         int width = 0;
2149         size_t remain = end - start;
2150
2151         while (remain) {
2152                 int n = utf8_width(&start, &remain);
2153                 if (n < 0 || !start)
2154                         return -1;
2155                 width += n;
2156         }
2157         return width;
2158 }
2159
2160 static void strbuf_add_tabexpand(struct strbuf *sb, struct grep_opt *opt,
2161                                  int color, int tabwidth, const char *line,
2162                                  int linelen)
2163 {
2164         const char *tab;
2165
2166         while ((tab = memchr(line, '\t', linelen)) != NULL) {
2167                 int width = pp_utf8_width(line, tab);
2168
2169                 /*
2170                  * If it wasn't well-formed utf8, or it
2171                  * had characters with badly defined
2172                  * width (control characters etc), just
2173                  * give up on trying to align things.
2174                  */
2175                 if (width < 0)
2176                         break;
2177
2178                 /* Output the data .. */
2179                 append_line_with_color(sb, opt, line, tab - line, color,
2180                                        GREP_CONTEXT_BODY,
2181                                        GREP_HEADER_FIELD_MAX);
2182
2183                 /* .. and the de-tabified tab */
2184                 strbuf_addchars(sb, ' ', tabwidth - (width % tabwidth));
2185
2186                 /* Skip over the printed part .. */
2187                 linelen -= tab + 1 - line;
2188                 line = tab + 1;
2189         }
2190
2191         /*
2192          * Print out everything after the last tab without
2193          * worrying about width - there's nothing more to
2194          * align.
2195          */
2196         append_line_with_color(sb, opt, line, linelen, color, GREP_CONTEXT_BODY,
2197                                GREP_HEADER_FIELD_MAX);
2198 }
2199
2200 /*
2201  * pp_handle_indent() prints out the intendation, and
2202  * the whole line (without the final newline), after
2203  * de-tabifying.
2204  */
2205 static void pp_handle_indent(struct pretty_print_context *pp,
2206                              struct strbuf *sb, int indent,
2207                              const char *line, int linelen)
2208 {
2209         struct grep_opt *opt = pp->rev ? &pp->rev->grep_filter : NULL;
2210
2211         strbuf_addchars(sb, ' ', indent);
2212         if (pp->expand_tabs_in_log)
2213                 strbuf_add_tabexpand(sb, opt, pp->color, pp->expand_tabs_in_log,
2214                                      line, linelen);
2215         else
2216                 append_line_with_color(sb, opt, line, linelen, pp->color,
2217                                        GREP_CONTEXT_BODY,
2218                                        GREP_HEADER_FIELD_MAX);
2219 }
2220
2221 static int is_mboxrd_from(const char *line, int len)
2222 {
2223         /*
2224          * a line matching /^From $/ here would only have len == 4
2225          * at this point because is_empty_line would've trimmed all
2226          * trailing space
2227          */
2228         return len > 4 && starts_with(line + strspn(line, ">"), "From ");
2229 }
2230
2231 void pp_remainder(struct pretty_print_context *pp,
2232                   const char **msg_p,
2233                   struct strbuf *sb,
2234                   int indent)
2235 {
2236         struct grep_opt *opt = pp->rev ? &pp->rev->grep_filter : NULL;
2237         int first = 1;
2238
2239         for (;;) {
2240                 const char *line = *msg_p;
2241                 int linelen = get_one_line(line);
2242                 *msg_p += linelen;
2243
2244                 if (!linelen)
2245                         break;
2246
2247                 if (is_blank_line(line, &linelen)) {
2248                         if (first)
2249                                 continue;
2250                         if (pp->fmt == CMIT_FMT_SHORT)
2251                                 break;
2252                 }
2253                 first = 0;
2254
2255                 strbuf_grow(sb, linelen + indent + 20);
2256                 if (indent)
2257                         pp_handle_indent(pp, sb, indent, line, linelen);
2258                 else if (pp->expand_tabs_in_log)
2259                         strbuf_add_tabexpand(sb, opt, pp->color,
2260                                              pp->expand_tabs_in_log, line,
2261                                              linelen);
2262                 else {
2263                         if (pp->fmt == CMIT_FMT_MBOXRD &&
2264                                         is_mboxrd_from(line, linelen))
2265                                 strbuf_addch(sb, '>');
2266
2267                         append_line_with_color(sb, opt, line, linelen,
2268                                                pp->color, GREP_CONTEXT_BODY,
2269                                                GREP_HEADER_FIELD_MAX);
2270                 }
2271                 strbuf_addch(sb, '\n');
2272         }
2273 }
2274
2275 void pretty_print_commit(struct pretty_print_context *pp,
2276                          const struct commit *commit,
2277                          struct strbuf *sb)
2278 {
2279         unsigned long beginning_of_body;
2280         int indent = 4;
2281         const char *msg;
2282         const char *reencoded;
2283         const char *encoding;
2284         int need_8bit_cte = pp->need_8bit_cte;
2285
2286         if (pp->fmt == CMIT_FMT_USERFORMAT) {
2287                 repo_format_commit_message(the_repository, commit,
2288                                            user_format, sb, pp);
2289                 return;
2290         }
2291
2292         encoding = get_log_output_encoding();
2293         msg = reencoded = repo_logmsg_reencode(the_repository, commit, NULL,
2294                                                encoding);
2295
2296         if (pp->fmt == CMIT_FMT_ONELINE || cmit_fmt_is_mail(pp->fmt))
2297                 indent = 0;
2298
2299         /*
2300          * We need to check and emit Content-type: to mark it
2301          * as 8-bit if we haven't done so.
2302          */
2303         if (cmit_fmt_is_mail(pp->fmt) && need_8bit_cte == 0) {
2304                 int i, ch, in_body;
2305
2306                 for (in_body = i = 0; (ch = msg[i]); i++) {
2307                         if (!in_body) {
2308                                 /* author could be non 7-bit ASCII but
2309                                  * the log may be so; skip over the
2310                                  * header part first.
2311                                  */
2312                                 if (ch == '\n' && msg[i+1] == '\n')
2313                                         in_body = 1;
2314                         }
2315                         else if (non_ascii(ch)) {
2316                                 need_8bit_cte = 1;
2317                                 break;
2318                         }
2319                 }
2320         }
2321
2322         pp_header(pp, encoding, commit, &msg, sb);
2323         if (pp->fmt != CMIT_FMT_ONELINE && !cmit_fmt_is_mail(pp->fmt)) {
2324                 strbuf_addch(sb, '\n');
2325         }
2326
2327         /* Skip excess blank lines at the beginning of body, if any... */
2328         msg = skip_blank_lines(msg);
2329
2330         /* These formats treat the title line specially. */
2331         if (pp->fmt == CMIT_FMT_ONELINE) {
2332                 msg = format_subject(sb, msg, " ");
2333                 strbuf_addch(sb, '\n');
2334         } else if (cmit_fmt_is_mail(pp->fmt))
2335                 pp_email_subject(pp, &msg, sb, encoding, need_8bit_cte);
2336
2337         beginning_of_body = sb->len;
2338         if (pp->fmt != CMIT_FMT_ONELINE)
2339                 pp_remainder(pp, &msg, sb, indent);
2340         strbuf_rtrim(sb);
2341
2342         /* Make sure there is an EOLN for the non-oneline case */
2343         if (pp->fmt != CMIT_FMT_ONELINE)
2344                 strbuf_addch(sb, '\n');
2345
2346         /*
2347          * The caller may append additional body text in e-mail
2348          * format.  Make sure we did not strip the blank line
2349          * between the header and the body.
2350          */
2351         if (cmit_fmt_is_mail(pp->fmt) && sb->len <= beginning_of_body)
2352                 strbuf_addch(sb, '\n');
2353
2354         repo_unuse_commit_buffer(the_repository, commit, reencoded);
2355 }
2356
2357 void pp_commit_easy(enum cmit_fmt fmt, const struct commit *commit,
2358                     struct strbuf *sb)
2359 {
2360         struct pretty_print_context pp = {0};
2361         pp.fmt = fmt;
2362         pretty_print_commit(&pp, commit, sb);
2363 }