pretty.c on commit rev-list/log: factor out revision mark generation (1df2d65)
   1#include "cache.h"
   2#include "commit.h"
   3#include "utf8.h"
   4#include "diff.h"
   5#include "revision.h"
   6#include "string-list.h"
   7#include "mailmap.h"
   8#include "log-tree.h"
   9#include "notes.h"
  10#include "color.h"
  11#include "reflog-walk.h"
  12
  13static char *user_format;
  14static struct cmt_fmt_map {
  15        const char *name;
  16        enum cmit_fmt format;
  17        int is_tformat;
  18        int is_alias;
  19        const char *user_format;
  20} *commit_formats;
  21static size_t builtin_formats_len;
  22static size_t commit_formats_len;
  23static size_t commit_formats_alloc;
  24static struct cmt_fmt_map *find_commit_format(const char *sought);
  25
  26static void save_user_format(struct rev_info *rev, const char *cp, int is_tformat)
  27{
  28        free(user_format);
  29        user_format = xstrdup(cp);
  30        if (is_tformat)
  31                rev->use_terminator = 1;
  32        rev->commit_format = CMIT_FMT_USERFORMAT;
  33}
  34
  35static int git_pretty_formats_config(const char *var, const char *value, void *cb)
  36{
  37        struct cmt_fmt_map *commit_format = NULL;
  38        const char *name;
  39        const char *fmt;
  40        int i;
  41
  42        if (prefixcmp(var, "pretty."))
  43                return 0;
  44
  45        name = var + strlen("pretty.");
  46        for (i = 0; i < builtin_formats_len; i++) {
  47                if (!strcmp(commit_formats[i].name, name))
  48                        return 0;
  49        }
  50
  51        for (i = builtin_formats_len; i < commit_formats_len; i++) {
  52                if (!strcmp(commit_formats[i].name, name)) {
  53                        commit_format = &commit_formats[i];
  54                        break;
  55                }
  56        }
  57
  58        if (!commit_format) {
  59                ALLOC_GROW(commit_formats, commit_formats_len+1,
  60                           commit_formats_alloc);
  61                commit_format = &commit_formats[commit_formats_len];
  62                memset(commit_format, 0, sizeof(*commit_format));
  63                commit_formats_len++;
  64        }
  65
  66        commit_format->name = xstrdup(name);
  67        commit_format->format = CMIT_FMT_USERFORMAT;
  68        git_config_string(&fmt, var, value);
  69        if (!prefixcmp(fmt, "format:") || !prefixcmp(fmt, "tformat:")) {
  70                commit_format->is_tformat = fmt[0] == 't';
  71                fmt = strchr(fmt, ':') + 1;
  72        } else if (strchr(fmt, '%'))
  73                commit_format->is_tformat = 1;
  74        else
  75                commit_format->is_alias = 1;
  76        commit_format->user_format = fmt;
  77
  78        return 0;
  79}
  80
  81static void setup_commit_formats(void)
  82{
  83        struct cmt_fmt_map builtin_formats[] = {
  84                { "raw",        CMIT_FMT_RAW,           0 },
  85                { "medium",     CMIT_FMT_MEDIUM,        0 },
  86                { "short",      CMIT_FMT_SHORT,         0 },
  87                { "email",      CMIT_FMT_EMAIL,         0 },
  88                { "fuller",     CMIT_FMT_FULLER,        0 },
  89                { "full",       CMIT_FMT_FULL,          0 },
  90                { "oneline",    CMIT_FMT_ONELINE,       1 }
  91        };
  92        commit_formats_len = ARRAY_SIZE(builtin_formats);
  93        builtin_formats_len = commit_formats_len;
  94        ALLOC_GROW(commit_formats, commit_formats_len, commit_formats_alloc);
  95        memcpy(commit_formats, builtin_formats,
  96               sizeof(*builtin_formats)*ARRAY_SIZE(builtin_formats));
  97
  98        git_config(git_pretty_formats_config, NULL);
  99}
 100
 101static struct cmt_fmt_map *find_commit_format_recursive(const char *sought,
 102                                                        const char *original,
 103                                                        int num_redirections)
 104{
 105        struct cmt_fmt_map *found = NULL;
 106        size_t found_match_len = 0;
 107        int i;
 108
 109        if (num_redirections >= commit_formats_len)
 110                die("invalid --pretty format: "
 111                    "'%s' references an alias which points to itself",
 112                    original);
 113
 114        for (i = 0; i < commit_formats_len; i++) {
 115                size_t match_len;
 116
 117                if (prefixcmp(commit_formats[i].name, sought))
 118                        continue;
 119
 120                match_len = strlen(commit_formats[i].name);
 121                if (found == NULL || found_match_len > match_len) {
 122                        found = &commit_formats[i];
 123                        found_match_len = match_len;
 124                }
 125        }
 126
 127        if (found && found->is_alias) {
 128                found = find_commit_format_recursive(found->user_format,
 129                                                     original,
 130                                                     num_redirections+1);
 131        }
 132
 133        return found;
 134}
 135
 136static struct cmt_fmt_map *find_commit_format(const char *sought)
 137{
 138        if (!commit_formats)
 139                setup_commit_formats();
 140
 141        return find_commit_format_recursive(sought, sought, 0);
 142}
 143
 144void get_commit_format(const char *arg, struct rev_info *rev)
 145{
 146        struct cmt_fmt_map *commit_format;
 147
 148        rev->use_terminator = 0;
 149        if (!arg || !*arg) {
 150                rev->commit_format = CMIT_FMT_DEFAULT;
 151                return;
 152        }
 153        if (!prefixcmp(arg, "format:") || !prefixcmp(arg, "tformat:")) {
 154                save_user_format(rev, strchr(arg, ':') + 1, arg[0] == 't');
 155                return;
 156        }
 157
 158        if (strchr(arg, '%')) {
 159                save_user_format(rev, arg, 1);
 160                return;
 161        }
 162
 163        commit_format = find_commit_format(arg);
 164        if (!commit_format)
 165                die("invalid --pretty format: %s", arg);
 166
 167        rev->commit_format = commit_format->format;
 168        rev->use_terminator = commit_format->is_tformat;
 169        if (commit_format->format == CMIT_FMT_USERFORMAT) {
 170                save_user_format(rev, commit_format->user_format,
 171                                 commit_format->is_tformat);
 172        }
 173}
 174
 175/*
 176 * Generic support for pretty-printing the header
 177 */
 178static int get_one_line(const char *msg)
 179{
 180        int ret = 0;
 181
 182        for (;;) {
 183                char c = *msg++;
 184                if (!c)
 185                        break;
 186                ret++;
 187                if (c == '\n')
 188                        break;
 189        }
 190        return ret;
 191}
 192
 193/* High bit set, or ISO-2022-INT */
 194static int non_ascii(int ch)
 195{
 196        return !isascii(ch) || ch == '\033';
 197}
 198
 199int has_non_ascii(const char *s)
 200{
 201        int ch;
 202        if (!s)
 203                return 0;
 204        while ((ch = *s++) != '\0') {
 205                if (non_ascii(ch))
 206                        return 1;
 207        }
 208        return 0;
 209}
 210
 211static int is_rfc2047_special(char ch)
 212{
 213        return (non_ascii(ch) || (ch == '=') || (ch == '?') || (ch == '_'));
 214}
 215
 216static void add_rfc2047(struct strbuf *sb, const char *line, int len,
 217                       const char *encoding)
 218{
 219        int i, last;
 220
 221        for (i = 0; i < len; i++) {
 222                int ch = line[i];
 223                if (non_ascii(ch))
 224                        goto needquote;
 225                if ((i + 1 < len) && (ch == '=' && line[i+1] == '?'))
 226                        goto needquote;
 227        }
 228        strbuf_add(sb, line, len);
 229        return;
 230
 231needquote:
 232        strbuf_grow(sb, len * 3 + strlen(encoding) + 100);
 233        strbuf_addf(sb, "=?%s?q?", encoding);
 234        for (i = last = 0; i < len; i++) {
 235                unsigned ch = line[i] & 0xFF;
 236                /*
 237                 * We encode ' ' using '=20' even though rfc2047
 238                 * allows using '_' for readability.  Unfortunately,
 239                 * many programs do not understand this and just
 240                 * leave the underscore in place.
 241                 */
 242                if (is_rfc2047_special(ch) || ch == ' ') {
 243                        strbuf_add(sb, line + last, i - last);
 244                        strbuf_addf(sb, "=%02X", ch);
 245                        last = i + 1;
 246                }
 247        }
 248        strbuf_add(sb, line + last, len - last);
 249        strbuf_addstr(sb, "?=");
 250}
 251
 252void pp_user_info(const char *what, enum cmit_fmt fmt, struct strbuf *sb,
 253                  const char *line, enum date_mode dmode,
 254                  const char *encoding)
 255{
 256        char *date;
 257        int namelen;
 258        unsigned long time;
 259        int tz;
 260
 261        if (fmt == CMIT_FMT_ONELINE)
 262                return;
 263        date = strchr(line, '>');
 264        if (!date)
 265                return;
 266        namelen = ++date - line;
 267        time = strtoul(date, &date, 10);
 268        tz = strtol(date, NULL, 10);
 269
 270        if (fmt == CMIT_FMT_EMAIL) {
 271                char *name_tail = strchr(line, '<');
 272                int display_name_length;
 273                if (!name_tail)
 274                        return;
 275                while (line < name_tail && isspace(name_tail[-1]))
 276                        name_tail--;
 277                display_name_length = name_tail - line;
 278                strbuf_addstr(sb, "From: ");
 279                add_rfc2047(sb, line, display_name_length, encoding);
 280                strbuf_add(sb, name_tail, namelen - display_name_length);
 281                strbuf_addch(sb, '\n');
 282        } else {
 283                strbuf_addf(sb, "%s: %.*s%.*s\n", what,
 284                              (fmt == CMIT_FMT_FULLER) ? 4 : 0,
 285                              "    ", namelen, line);
 286        }
 287        switch (fmt) {
 288        case CMIT_FMT_MEDIUM:
 289                strbuf_addf(sb, "Date:   %s\n", show_date(time, tz, dmode));
 290                break;
 291        case CMIT_FMT_EMAIL:
 292                strbuf_addf(sb, "Date: %s\n", show_date(time, tz, DATE_RFC2822));
 293                break;
 294        case CMIT_FMT_FULLER:
 295                strbuf_addf(sb, "%sDate: %s\n", what, show_date(time, tz, dmode));
 296                break;
 297        default:
 298                /* notin' */
 299                break;
 300        }
 301}
 302
 303static int is_empty_line(const char *line, int *len_p)
 304{
 305        int len = *len_p;
 306        while (len && isspace(line[len-1]))
 307                len--;
 308        *len_p = len;
 309        return !len;
 310}
 311
 312static const char *skip_empty_lines(const char *msg)
 313{
 314        for (;;) {
 315                int linelen = get_one_line(msg);
 316                int ll = linelen;
 317                if (!linelen)
 318                        break;
 319                if (!is_empty_line(msg, &ll))
 320                        break;
 321                msg += linelen;
 322        }
 323        return msg;
 324}
 325
 326static void add_merge_info(enum cmit_fmt fmt, struct strbuf *sb,
 327                        const struct commit *commit, int abbrev)
 328{
 329        struct commit_list *parent = commit->parents;
 330
 331        if ((fmt == CMIT_FMT_ONELINE) || (fmt == CMIT_FMT_EMAIL) ||
 332            !parent || !parent->next)
 333                return;
 334
 335        strbuf_addstr(sb, "Merge:");
 336
 337        while (parent) {
 338                struct commit *p = parent->item;
 339                const char *hex = NULL;
 340                if (abbrev)
 341                        hex = find_unique_abbrev(p->object.sha1, abbrev);
 342                if (!hex)
 343                        hex = sha1_to_hex(p->object.sha1);
 344                parent = parent->next;
 345
 346                strbuf_addf(sb, " %s", hex);
 347        }
 348        strbuf_addch(sb, '\n');
 349}
 350
 351static char *get_header(const struct commit *commit, const char *key)
 352{
 353        int key_len = strlen(key);
 354        const char *line = commit->buffer;
 355
 356        for (;;) {
 357                const char *eol = strchr(line, '\n'), *next;
 358
 359                if (line == eol)
 360                        return NULL;
 361                if (!eol) {
 362                        eol = line + strlen(line);
 363                        next = NULL;
 364                } else
 365                        next = eol + 1;
 366                if (eol - line > key_len &&
 367                    !strncmp(line, key, key_len) &&
 368                    line[key_len] == ' ') {
 369                        return xmemdupz(line + key_len + 1, eol - line - key_len - 1);
 370                }
 371                line = next;
 372        }
 373}
 374
 375static char *replace_encoding_header(char *buf, const char *encoding)
 376{
 377        struct strbuf tmp = STRBUF_INIT;
 378        size_t start, len;
 379        char *cp = buf;
 380
 381        /* guess if there is an encoding header before a \n\n */
 382        while (strncmp(cp, "encoding ", strlen("encoding "))) {
 383                cp = strchr(cp, '\n');
 384                if (!cp || *++cp == '\n')
 385                        return buf;
 386        }
 387        start = cp - buf;
 388        cp = strchr(cp, '\n');
 389        if (!cp)
 390                return buf; /* should not happen but be defensive */
 391        len = cp + 1 - (buf + start);
 392
 393        strbuf_attach(&tmp, buf, strlen(buf), strlen(buf) + 1);
 394        if (is_encoding_utf8(encoding)) {
 395                /* we have re-coded to UTF-8; drop the header */
 396                strbuf_remove(&tmp, start, len);
 397        } else {
 398                /* just replaces XXXX in 'encoding XXXX\n' */
 399                strbuf_splice(&tmp, start + strlen("encoding "),
 400                                          len - strlen("encoding \n"),
 401                                          encoding, strlen(encoding));
 402        }
 403        return strbuf_detach(&tmp, NULL);
 404}
 405
 406char *logmsg_reencode(const struct commit *commit,
 407                      const char *output_encoding)
 408{
 409        static const char *utf8 = "UTF-8";
 410        const char *use_encoding;
 411        char *encoding;
 412        char *out;
 413
 414        if (!*output_encoding)
 415                return NULL;
 416        encoding = get_header(commit, "encoding");
 417        use_encoding = encoding ? encoding : utf8;
 418        if (!strcmp(use_encoding, output_encoding))
 419                if (encoding) /* we'll strip encoding header later */
 420                        out = xstrdup(commit->buffer);
 421                else
 422                        return NULL; /* nothing to do */
 423        else
 424                out = reencode_string(commit->buffer,
 425                                      output_encoding, use_encoding);
 426        if (out)
 427                out = replace_encoding_header(out, output_encoding);
 428
 429        free(encoding);
 430        return out;
 431}
 432
 433static int mailmap_name(char *email, int email_len, char *name, int name_len)
 434{
 435        static struct string_list *mail_map;
 436        if (!mail_map) {
 437                mail_map = xcalloc(1, sizeof(*mail_map));
 438                read_mailmap(mail_map, NULL);
 439        }
 440        return mail_map->nr && map_user(mail_map, email, email_len, name, name_len);
 441}
 442
 443static size_t format_person_part(struct strbuf *sb, char part,
 444                                 const char *msg, int len, enum date_mode dmode)
 445{
 446        /* currently all placeholders have same length */
 447        const int placeholder_len = 2;
 448        int start, end, tz = 0;
 449        unsigned long date = 0;
 450        char *ep;
 451        const char *name_start, *name_end, *mail_start, *mail_end, *msg_end = msg+len;
 452        char person_name[1024];
 453        char person_mail[1024];
 454
 455        /* advance 'end' to point to email start delimiter */
 456        for (end = 0; end < len && msg[end] != '<'; end++)
 457                ; /* do nothing */
 458
 459        /*
 460         * When end points at the '<' that we found, it should have
 461         * matching '>' later, which means 'end' must be strictly
 462         * below len - 1.
 463         */
 464        if (end >= len - 2)
 465                goto skip;
 466
 467        /* Seek for both name and email part */
 468        name_start = msg;
 469        name_end = msg+end;
 470        while (name_end > name_start && isspace(*(name_end-1)))
 471                name_end--;
 472        mail_start = msg+end+1;
 473        mail_end = mail_start;
 474        while (mail_end < msg_end && *mail_end != '>')
 475                mail_end++;
 476        if (mail_end == msg_end)
 477                goto skip;
 478        end = mail_end-msg;
 479
 480        if (part == 'N' || part == 'E') { /* mailmap lookup */
 481                strlcpy(person_name, name_start, name_end-name_start+1);
 482                strlcpy(person_mail, mail_start, mail_end-mail_start+1);
 483                mailmap_name(person_mail, sizeof(person_mail), person_name, sizeof(person_name));
 484                name_start = person_name;
 485                name_end = name_start + strlen(person_name);
 486                mail_start = person_mail;
 487                mail_end = mail_start +  strlen(person_mail);
 488        }
 489        if (part == 'n' || part == 'N') {       /* name */
 490                strbuf_add(sb, name_start, name_end-name_start);
 491                return placeholder_len;
 492        }
 493        if (part == 'e' || part == 'E') {       /* email */
 494                strbuf_add(sb, mail_start, mail_end-mail_start);
 495                return placeholder_len;
 496        }
 497
 498        /* advance 'start' to point to date start delimiter */
 499        for (start = end + 1; start < len && isspace(msg[start]); start++)
 500                ; /* do nothing */
 501        if (start >= len)
 502                goto skip;
 503        date = strtoul(msg + start, &ep, 10);
 504        if (msg + start == ep)
 505                goto skip;
 506
 507        if (part == 't') {      /* date, UNIX timestamp */
 508                strbuf_add(sb, msg + start, ep - (msg + start));
 509                return placeholder_len;
 510        }
 511
 512        /* parse tz */
 513        for (start = ep - msg + 1; start < len && isspace(msg[start]); start++)
 514                ; /* do nothing */
 515        if (start + 1 < len) {
 516                tz = strtoul(msg + start + 1, NULL, 10);
 517                if (msg[start] == '-')
 518                        tz = -tz;
 519        }
 520
 521        switch (part) {
 522        case 'd':       /* date */
 523                strbuf_addstr(sb, show_date(date, tz, dmode));
 524                return placeholder_len;
 525        case 'D':       /* date, RFC2822 style */
 526                strbuf_addstr(sb, show_date(date, tz, DATE_RFC2822));
 527                return placeholder_len;
 528        case 'r':       /* date, relative */
 529                strbuf_addstr(sb, show_date(date, tz, DATE_RELATIVE));
 530                return placeholder_len;
 531        case 'i':       /* date, ISO 8601 */
 532                strbuf_addstr(sb, show_date(date, tz, DATE_ISO8601));
 533                return placeholder_len;
 534        }
 535
 536skip:
 537        /*
 538         * bogus commit, 'sb' cannot be updated, but we still need to
 539         * compute a valid return value.
 540         */
 541        if (part == 'n' || part == 'e' || part == 't' || part == 'd'
 542            || part == 'D' || part == 'r' || part == 'i')
 543                return placeholder_len;
 544
 545        return 0; /* unknown placeholder */
 546}
 547
 548struct chunk {
 549        size_t off;
 550        size_t len;
 551};
 552
 553struct format_commit_context {
 554        const struct commit *commit;
 555        const struct pretty_print_context *pretty_ctx;
 556        unsigned commit_header_parsed:1;
 557        unsigned commit_message_parsed:1;
 558        char *message;
 559        size_t width, indent1, indent2;
 560
 561        /* These offsets are relative to the start of the commit message. */
 562        struct chunk author;
 563        struct chunk committer;
 564        struct chunk encoding;
 565        size_t message_off;
 566        size_t subject_off;
 567        size_t body_off;
 568
 569        /* The following ones are relative to the result struct strbuf. */
 570        struct chunk abbrev_commit_hash;
 571        struct chunk abbrev_tree_hash;
 572        struct chunk abbrev_parent_hashes;
 573        size_t wrap_start;
 574};
 575
 576static int add_again(struct strbuf *sb, struct chunk *chunk)
 577{
 578        if (chunk->len) {
 579                strbuf_adddup(sb, chunk->off, chunk->len);
 580                return 1;
 581        }
 582
 583        /*
 584         * We haven't seen this chunk before.  Our caller is surely
 585         * going to add it the hard way now.  Remember the most likely
 586         * start of the to-be-added chunk: the current end of the
 587         * struct strbuf.
 588         */
 589        chunk->off = sb->len;
 590        return 0;
 591}
 592
 593static void parse_commit_header(struct format_commit_context *context)
 594{
 595        const char *msg = context->message;
 596        int i;
 597
 598        for (i = 0; msg[i]; i++) {
 599                int eol;
 600                for (eol = i; msg[eol] && msg[eol] != '\n'; eol++)
 601                        ; /* do nothing */
 602
 603                if (i == eol) {
 604                        break;
 605                } else if (!prefixcmp(msg + i, "author ")) {
 606                        context->author.off = i + 7;
 607                        context->author.len = eol - i - 7;
 608                } else if (!prefixcmp(msg + i, "committer ")) {
 609                        context->committer.off = i + 10;
 610                        context->committer.len = eol - i - 10;
 611                } else if (!prefixcmp(msg + i, "encoding ")) {
 612                        context->encoding.off = i + 9;
 613                        context->encoding.len = eol - i - 9;
 614                }
 615                i = eol;
 616        }
 617        context->message_off = i;
 618        context->commit_header_parsed = 1;
 619}
 620
 621static int istitlechar(char c)
 622{
 623        return (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z') ||
 624                (c >= '0' && c <= '9') || c == '.' || c == '_';
 625}
 626
 627static void format_sanitized_subject(struct strbuf *sb, const char *msg)
 628{
 629        size_t trimlen;
 630        size_t start_len = sb->len;
 631        int space = 2;
 632
 633        for (; *msg && *msg != '\n'; msg++) {
 634                if (istitlechar(*msg)) {
 635                        if (space == 1)
 636                                strbuf_addch(sb, '-');
 637                        space = 0;
 638                        strbuf_addch(sb, *msg);
 639                        if (*msg == '.')
 640                                while (*(msg+1) == '.')
 641                                        msg++;
 642                } else
 643                        space |= 1;
 644        }
 645
 646        /* trim any trailing '.' or '-' characters */
 647        trimlen = 0;
 648        while (sb->len - trimlen > start_len &&
 649                (sb->buf[sb->len - 1 - trimlen] == '.'
 650                || sb->buf[sb->len - 1 - trimlen] == '-'))
 651                trimlen++;
 652        strbuf_remove(sb, sb->len - trimlen, trimlen);
 653}
 654
 655const char *format_subject(struct strbuf *sb, const char *msg,
 656                           const char *line_separator)
 657{
 658        int first = 1;
 659
 660        for (;;) {
 661                const char *line = msg;
 662                int linelen = get_one_line(line);
 663
 664                msg += linelen;
 665                if (!linelen || is_empty_line(line, &linelen))
 666                        break;
 667
 668                if (!sb)
 669                        continue;
 670                strbuf_grow(sb, linelen + 2);
 671                if (!first)
 672                        strbuf_addstr(sb, line_separator);
 673                strbuf_add(sb, line, linelen);
 674                first = 0;
 675        }
 676        return msg;
 677}
 678
 679static void parse_commit_message(struct format_commit_context *c)
 680{
 681        const char *msg = c->message + c->message_off;
 682        const char *start = c->message;
 683
 684        msg = skip_empty_lines(msg);
 685        c->subject_off = msg - start;
 686
 687        msg = format_subject(NULL, msg, NULL);
 688        msg = skip_empty_lines(msg);
 689        c->body_off = msg - start;
 690
 691        c->commit_message_parsed = 1;
 692}
 693
 694static void format_decoration(struct strbuf *sb, const struct commit *commit)
 695{
 696        struct name_decoration *d;
 697        const char *prefix = " (";
 698
 699        load_ref_decorations(DECORATE_SHORT_REFS);
 700        d = lookup_decoration(&name_decoration, &commit->object);
 701        while (d) {
 702                strbuf_addstr(sb, prefix);
 703                prefix = ", ";
 704                strbuf_addstr(sb, d->name);
 705                d = d->next;
 706        }
 707        if (prefix[0] == ',')
 708                strbuf_addch(sb, ')');
 709}
 710
 711static void strbuf_wrap(struct strbuf *sb, size_t pos,
 712                        size_t width, size_t indent1, size_t indent2)
 713{
 714        struct strbuf tmp = STRBUF_INIT;
 715
 716        if (pos)
 717                strbuf_add(&tmp, sb->buf, pos);
 718        strbuf_add_wrapped_text(&tmp, sb->buf + pos,
 719                                (int) indent1, (int) indent2, (int) width);
 720        strbuf_swap(&tmp, sb);
 721        strbuf_release(&tmp);
 722}
 723
 724static void rewrap_message_tail(struct strbuf *sb,
 725                                struct format_commit_context *c,
 726                                size_t new_width, size_t new_indent1,
 727                                size_t new_indent2)
 728{
 729        if (c->width == new_width && c->indent1 == new_indent1 &&
 730            c->indent2 == new_indent2)
 731                return;
 732        if (c->wrap_start < sb->len)
 733                strbuf_wrap(sb, c->wrap_start, c->width, c->indent1, c->indent2);
 734        c->wrap_start = sb->len;
 735        c->width = new_width;
 736        c->indent1 = new_indent1;
 737        c->indent2 = new_indent2;
 738}
 739
 740static size_t format_commit_one(struct strbuf *sb, const char *placeholder,
 741                                void *context)
 742{
 743        struct format_commit_context *c = context;
 744        const struct commit *commit = c->commit;
 745        const char *msg = c->message;
 746        struct commit_list *p;
 747        int h1, h2;
 748
 749        /* these are independent of the commit */
 750        switch (placeholder[0]) {
 751        case 'C':
 752                if (placeholder[1] == '(') {
 753                        const char *end = strchr(placeholder + 2, ')');
 754                        char color[COLOR_MAXLEN];
 755                        if (!end)
 756                                return 0;
 757                        color_parse_mem(placeholder + 2,
 758                                        end - (placeholder + 2),
 759                                        "--pretty format", color);
 760                        strbuf_addstr(sb, color);
 761                        return end - placeholder + 1;
 762                }
 763                if (!prefixcmp(placeholder + 1, "red")) {
 764                        strbuf_addstr(sb, GIT_COLOR_RED);
 765                        return 4;
 766                } else if (!prefixcmp(placeholder + 1, "green")) {
 767                        strbuf_addstr(sb, GIT_COLOR_GREEN);
 768                        return 6;
 769                } else if (!prefixcmp(placeholder + 1, "blue")) {
 770                        strbuf_addstr(sb, GIT_COLOR_BLUE);
 771                        return 5;
 772                } else if (!prefixcmp(placeholder + 1, "reset")) {
 773                        strbuf_addstr(sb, GIT_COLOR_RESET);
 774                        return 6;
 775                } else
 776                        return 0;
 777        case 'n':               /* newline */
 778                strbuf_addch(sb, '\n');
 779                return 1;
 780        case 'x':
 781                /* %x00 == NUL, %x0a == LF, etc. */
 782                if (0 <= (h1 = hexval_table[0xff & placeholder[1]]) &&
 783                    h1 <= 16 &&
 784                    0 <= (h2 = hexval_table[0xff & placeholder[2]]) &&
 785                    h2 <= 16) {
 786                        strbuf_addch(sb, (h1<<4)|h2);
 787                        return 3;
 788                } else
 789                        return 0;
 790        case 'w':
 791                if (placeholder[1] == '(') {
 792                        unsigned long width = 0, indent1 = 0, indent2 = 0;
 793                        char *next;
 794                        const char *start = placeholder + 2;
 795                        const char *end = strchr(start, ')');
 796                        if (!end)
 797                                return 0;
 798                        if (end > start) {
 799                                width = strtoul(start, &next, 10);
 800                                if (*next == ',') {
 801                                        indent1 = strtoul(next + 1, &next, 10);
 802                                        if (*next == ',') {
 803                                                indent2 = strtoul(next + 1,
 804                                                                 &next, 10);
 805                                        }
 806                                }
 807                                if (*next != ')')
 808                                        return 0;
 809                        }
 810                        rewrap_message_tail(sb, c, width, indent1, indent2);
 811                        return end - placeholder + 1;
 812                } else
 813                        return 0;
 814        }
 815
 816        /* these depend on the commit */
 817        if (!commit->object.parsed)
 818                parse_object(commit->object.sha1);
 819
 820        switch (placeholder[0]) {
 821        case 'H':               /* commit hash */
 822                strbuf_addstr(sb, sha1_to_hex(commit->object.sha1));
 823                return 1;
 824        case 'h':               /* abbreviated commit hash */
 825                if (add_again(sb, &c->abbrev_commit_hash))
 826                        return 1;
 827                strbuf_addstr(sb, find_unique_abbrev(commit->object.sha1,
 828                                                     c->pretty_ctx->abbrev));
 829                c->abbrev_commit_hash.len = sb->len - c->abbrev_commit_hash.off;
 830                return 1;
 831        case 'T':               /* tree hash */
 832                strbuf_addstr(sb, sha1_to_hex(commit->tree->object.sha1));
 833                return 1;
 834        case 't':               /* abbreviated tree hash */
 835                if (add_again(sb, &c->abbrev_tree_hash))
 836                        return 1;
 837                strbuf_addstr(sb, find_unique_abbrev(commit->tree->object.sha1,
 838                                                     c->pretty_ctx->abbrev));
 839                c->abbrev_tree_hash.len = sb->len - c->abbrev_tree_hash.off;
 840                return 1;
 841        case 'P':               /* parent hashes */
 842                for (p = commit->parents; p; p = p->next) {
 843                        if (p != commit->parents)
 844                                strbuf_addch(sb, ' ');
 845                        strbuf_addstr(sb, sha1_to_hex(p->item->object.sha1));
 846                }
 847                return 1;
 848        case 'p':               /* abbreviated parent hashes */
 849                if (add_again(sb, &c->abbrev_parent_hashes))
 850                        return 1;
 851                for (p = commit->parents; p; p = p->next) {
 852                        if (p != commit->parents)
 853                                strbuf_addch(sb, ' ');
 854                        strbuf_addstr(sb, find_unique_abbrev(
 855                                        p->item->object.sha1,
 856                                        c->pretty_ctx->abbrev));
 857                }
 858                c->abbrev_parent_hashes.len = sb->len -
 859                                              c->abbrev_parent_hashes.off;
 860                return 1;
 861        case 'm':               /* left/right/bottom */
 862                strbuf_addstr(sb, get_revision_mark(NULL, commit));
 863                return 1;
 864        case 'd':
 865                format_decoration(sb, commit);
 866                return 1;
 867        case 'g':               /* reflog info */
 868                switch(placeholder[1]) {
 869                case 'd':       /* reflog selector */
 870                case 'D':
 871                        if (c->pretty_ctx->reflog_info)
 872                                get_reflog_selector(sb,
 873                                                    c->pretty_ctx->reflog_info,
 874                                                    c->pretty_ctx->date_mode,
 875                                                    (placeholder[1] == 'd'));
 876                        return 2;
 877                case 's':       /* reflog message */
 878                        if (c->pretty_ctx->reflog_info)
 879                                get_reflog_message(sb, c->pretty_ctx->reflog_info);
 880                        return 2;
 881                }
 882                return 0;       /* unknown %g placeholder */
 883        case 'N':
 884                if (c->pretty_ctx->show_notes) {
 885                        format_display_notes(commit->object.sha1, sb,
 886                                    get_log_output_encoding(), 0);
 887                        return 1;
 888                }
 889                return 0;
 890        }
 891
 892        /* For the rest we have to parse the commit header. */
 893        if (!c->commit_header_parsed)
 894                parse_commit_header(c);
 895
 896        switch (placeholder[0]) {
 897        case 'a':       /* author ... */
 898                return format_person_part(sb, placeholder[1],
 899                                   msg + c->author.off, c->author.len,
 900                                   c->pretty_ctx->date_mode);
 901        case 'c':       /* committer ... */
 902                return format_person_part(sb, placeholder[1],
 903                                   msg + c->committer.off, c->committer.len,
 904                                   c->pretty_ctx->date_mode);
 905        case 'e':       /* encoding */
 906                strbuf_add(sb, msg + c->encoding.off, c->encoding.len);
 907                return 1;
 908        case 'B':       /* raw body */
 909                /* message_off is always left at the initial newline */
 910                strbuf_addstr(sb, msg + c->message_off + 1);
 911                return 1;
 912        }
 913
 914        /* Now we need to parse the commit message. */
 915        if (!c->commit_message_parsed)
 916                parse_commit_message(c);
 917
 918        switch (placeholder[0]) {
 919        case 's':       /* subject */
 920                format_subject(sb, msg + c->subject_off, " ");
 921                return 1;
 922        case 'f':       /* sanitized subject */
 923                format_sanitized_subject(sb, msg + c->subject_off);
 924                return 1;
 925        case 'b':       /* body */
 926                strbuf_addstr(sb, msg + c->body_off);
 927                return 1;
 928        }
 929        return 0;       /* unknown placeholder */
 930}
 931
 932static size_t format_commit_item(struct strbuf *sb, const char *placeholder,
 933                                 void *context)
 934{
 935        int consumed;
 936        size_t orig_len;
 937        enum {
 938                NO_MAGIC,
 939                ADD_LF_BEFORE_NON_EMPTY,
 940                DEL_LF_BEFORE_EMPTY,
 941                ADD_SP_BEFORE_NON_EMPTY
 942        } magic = NO_MAGIC;
 943
 944        switch (placeholder[0]) {
 945        case '-':
 946                magic = DEL_LF_BEFORE_EMPTY;
 947                break;
 948        case '+':
 949                magic = ADD_LF_BEFORE_NON_EMPTY;
 950                break;
 951        case ' ':
 952                magic = ADD_SP_BEFORE_NON_EMPTY;
 953                break;
 954        default:
 955                break;
 956        }
 957        if (magic != NO_MAGIC)
 958                placeholder++;
 959
 960        orig_len = sb->len;
 961        consumed = format_commit_one(sb, placeholder, context);
 962        if (magic == NO_MAGIC)
 963                return consumed;
 964
 965        if ((orig_len == sb->len) && magic == DEL_LF_BEFORE_EMPTY) {
 966                while (sb->len && sb->buf[sb->len - 1] == '\n')
 967                        strbuf_setlen(sb, sb->len - 1);
 968        } else if (orig_len != sb->len) {
 969                if (magic == ADD_LF_BEFORE_NON_EMPTY)
 970                        strbuf_insert(sb, orig_len, "\n", 1);
 971                else if (magic == ADD_SP_BEFORE_NON_EMPTY)
 972                        strbuf_insert(sb, orig_len, " ", 1);
 973        }
 974        return consumed + 1;
 975}
 976
 977static size_t userformat_want_item(struct strbuf *sb, const char *placeholder,
 978                                   void *context)
 979{
 980        struct userformat_want *w = context;
 981
 982        if (*placeholder == '+' || *placeholder == '-' || *placeholder == ' ')
 983                placeholder++;
 984
 985        switch (*placeholder) {
 986        case 'N':
 987                w->notes = 1;
 988                break;
 989        }
 990        return 0;
 991}
 992
 993void userformat_find_requirements(const char *fmt, struct userformat_want *w)
 994{
 995        struct strbuf dummy = STRBUF_INIT;
 996
 997        if (!fmt) {
 998                if (!user_format)
 999                        return;
1000                fmt = user_format;
1001        }
1002        strbuf_expand(&dummy, user_format, userformat_want_item, w);
1003        strbuf_release(&dummy);
1004}
1005
1006void format_commit_message(const struct commit *commit,
1007                           const char *format, struct strbuf *sb,
1008                           const struct pretty_print_context *pretty_ctx)
1009{
1010        struct format_commit_context context;
1011        static const char utf8[] = "UTF-8";
1012        const char *enc;
1013        const char *output_enc = pretty_ctx->output_encoding;
1014
1015        memset(&context, 0, sizeof(context));
1016        context.commit = commit;
1017        context.pretty_ctx = pretty_ctx;
1018        context.wrap_start = sb->len;
1019        context.message = commit->buffer;
1020        if (output_enc) {
1021                enc = get_header(commit, "encoding");
1022                enc = enc ? enc : utf8;
1023                if (strcmp(enc, output_enc))
1024                        context.message = logmsg_reencode(commit, output_enc);
1025        }
1026
1027        strbuf_expand(sb, format, format_commit_item, &context);
1028        rewrap_message_tail(sb, &context, 0, 0, 0);
1029
1030        if (context.message != commit->buffer)
1031                free(context.message);
1032}
1033
1034static void pp_header(enum cmit_fmt fmt,
1035                      int abbrev,
1036                      enum date_mode dmode,
1037                      const char *encoding,
1038                      const struct commit *commit,
1039                      const char **msg_p,
1040                      struct strbuf *sb)
1041{
1042        int parents_shown = 0;
1043
1044        for (;;) {
1045                const char *line = *msg_p;
1046                int linelen = get_one_line(*msg_p);
1047
1048                if (!linelen)
1049                        return;
1050                *msg_p += linelen;
1051
1052                if (linelen == 1)
1053                        /* End of header */
1054                        return;
1055
1056                if (fmt == CMIT_FMT_RAW) {
1057                        strbuf_add(sb, line, linelen);
1058                        continue;
1059                }
1060
1061                if (!memcmp(line, "parent ", 7)) {
1062                        if (linelen != 48)
1063                                die("bad parent line in commit");
1064                        continue;
1065                }
1066
1067                if (!parents_shown) {
1068                        struct commit_list *parent;
1069                        int num;
1070                        for (parent = commit->parents, num = 0;
1071                             parent;
1072                             parent = parent->next, num++)
1073                                ;
1074                        /* with enough slop */
1075                        strbuf_grow(sb, num * 50 + 20);
1076                        add_merge_info(fmt, sb, commit, abbrev);
1077                        parents_shown = 1;
1078                }
1079
1080                /*
1081                 * MEDIUM == DEFAULT shows only author with dates.
1082                 * FULL shows both authors but not dates.
1083                 * FULLER shows both authors and dates.
1084                 */
1085                if (!memcmp(line, "author ", 7)) {
1086                        strbuf_grow(sb, linelen + 80);
1087                        pp_user_info("Author", fmt, sb, line + 7, dmode, encoding);
1088                }
1089                if (!memcmp(line, "committer ", 10) &&
1090                    (fmt == CMIT_FMT_FULL || fmt == CMIT_FMT_FULLER)) {
1091                        strbuf_grow(sb, linelen + 80);
1092                        pp_user_info("Commit", fmt, sb, line + 10, dmode, encoding);
1093                }
1094        }
1095}
1096
1097void pp_title_line(enum cmit_fmt fmt,
1098                   const char **msg_p,
1099                   struct strbuf *sb,
1100                   const char *subject,
1101                   const char *after_subject,
1102                   const char *encoding,
1103                   int need_8bit_cte)
1104{
1105        const char *line_separator = (fmt == CMIT_FMT_EMAIL) ? "\n " : " ";
1106        struct strbuf title;
1107
1108        strbuf_init(&title, 80);
1109        *msg_p = format_subject(&title, *msg_p, line_separator);
1110
1111        strbuf_grow(sb, title.len + 1024);
1112        if (subject) {
1113                strbuf_addstr(sb, subject);
1114                add_rfc2047(sb, title.buf, title.len, encoding);
1115        } else {
1116                strbuf_addbuf(sb, &title);
1117        }
1118        strbuf_addch(sb, '\n');
1119
1120        if (need_8bit_cte > 0) {
1121                const char *header_fmt =
1122                        "MIME-Version: 1.0\n"
1123                        "Content-Type: text/plain; charset=%s\n"
1124                        "Content-Transfer-Encoding: 8bit\n";
1125                strbuf_addf(sb, header_fmt, encoding);
1126        }
1127        if (after_subject) {
1128                strbuf_addstr(sb, after_subject);
1129        }
1130        if (fmt == CMIT_FMT_EMAIL) {
1131                strbuf_addch(sb, '\n');
1132        }
1133        strbuf_release(&title);
1134}
1135
1136void pp_remainder(enum cmit_fmt fmt,
1137                  const char **msg_p,
1138                  struct strbuf *sb,
1139                  int indent)
1140{
1141        int first = 1;
1142        for (;;) {
1143                const char *line = *msg_p;
1144                int linelen = get_one_line(line);
1145                *msg_p += linelen;
1146
1147                if (!linelen)
1148                        break;
1149
1150                if (is_empty_line(line, &linelen)) {
1151                        if (first)
1152                                continue;
1153                        if (fmt == CMIT_FMT_SHORT)
1154                                break;
1155                }
1156                first = 0;
1157
1158                strbuf_grow(sb, linelen + indent + 20);
1159                if (indent) {
1160                        memset(sb->buf + sb->len, ' ', indent);
1161                        strbuf_setlen(sb, sb->len + indent);
1162                }
1163                strbuf_add(sb, line, linelen);
1164                strbuf_addch(sb, '\n');
1165        }
1166}
1167
/*
 * Re-encode the message of `commit` into the log output encoding.
 *
 * The encoding name obtained from get_log_output_encoding() is stored in
 * *encoding_p when encoding_p is non-NULL.  The return value is whatever
 * logmsg_reencode() produces for that encoding.
 */
char *reencode_commit_message(const struct commit *commit, const char **encoding_p)
{
        const char *output_encoding = get_log_output_encoding();

        if (encoding_p)
                *encoding_p = output_encoding;

        return logmsg_reencode(commit, output_encoding);
}
1177
1178void pretty_print_commit(enum cmit_fmt fmt, const struct commit *commit,
1179                         struct strbuf *sb,
1180                         const struct pretty_print_context *context)
1181{
1182        unsigned long beginning_of_body;
1183        int indent = 4;
1184        const char *msg = commit->buffer;
1185        char *reencoded;
1186        const char *encoding;
1187        int need_8bit_cte = context->need_8bit_cte;
1188
1189        if (fmt == CMIT_FMT_USERFORMAT) {
1190                format_commit_message(commit, user_format, sb, context);
1191                return;
1192        }
1193
1194        reencoded = reencode_commit_message(commit, &encoding);
1195        if (reencoded) {
1196                msg = reencoded;
1197        }
1198
1199        if (fmt == CMIT_FMT_ONELINE || fmt == CMIT_FMT_EMAIL)
1200                indent = 0;
1201
1202        /*
1203         * We need to check and emit Content-type: to mark it
1204         * as 8-bit if we haven't done so.
1205         */
1206        if (fmt == CMIT_FMT_EMAIL && need_8bit_cte == 0) {
1207                int i, ch, in_body;
1208
1209                for (in_body = i = 0; (ch = msg[i]); i++) {
1210                        if (!in_body) {
1211                                /* author could be non 7-bit ASCII but
1212                                 * the log may be so; skip over the
1213                                 * header part first.
1214                                 */
1215                                if (ch == '\n' && msg[i+1] == '\n')
1216                                        in_body = 1;
1217                        }
1218                        else if (non_ascii(ch)) {
1219                                need_8bit_cte = 1;
1220                                break;
1221                        }
1222                }
1223        }
1224
1225        pp_header(fmt, context->abbrev, context->date_mode, encoding,
1226                  commit, &msg, sb);
1227        if (fmt != CMIT_FMT_ONELINE && !context->subject) {
1228                strbuf_addch(sb, '\n');
1229        }
1230
1231        /* Skip excess blank lines at the beginning of body, if any... */
1232        msg = skip_empty_lines(msg);
1233
1234        /* These formats treat the title line specially. */
1235        if (fmt == CMIT_FMT_ONELINE || fmt == CMIT_FMT_EMAIL)
1236                pp_title_line(fmt, &msg, sb, context->subject,
1237                              context->after_subject, encoding, need_8bit_cte);
1238
1239        beginning_of_body = sb->len;
1240        if (fmt != CMIT_FMT_ONELINE)
1241                pp_remainder(fmt, &msg, sb, indent);
1242        strbuf_rtrim(sb);
1243
1244        /* Make sure there is an EOLN for the non-oneline case */
1245        if (fmt != CMIT_FMT_ONELINE)
1246                strbuf_addch(sb, '\n');
1247
1248        /*
1249         * The caller may append additional body text in e-mail
1250         * format.  Make sure we did not strip the blank line
1251         * between the header and the body.
1252         */
1253        if (fmt == CMIT_FMT_EMAIL && sb->len <= beginning_of_body)
1254                strbuf_addch(sb, '\n');
1255
1256        if (context->show_notes)
1257                format_display_notes(commit->object.sha1, sb, encoding,
1258                                     NOTES_SHOW_HEADER | NOTES_INDENT);
1259
1260        free(reencoded);
1261}