merge-recursive: Record more data needed for merging with dual renames
[git] / merge-recursive.c
1 /*
2  * Recursive Merge algorithm stolen from git-merge-recursive.py by
3  * Fredrik Kuivinen.
4  * The thieves were Alex Riesen and Johannes Schindelin, in June/July 2006
5  */
6 #include "advice.h"
7 #include "cache.h"
8 #include "cache-tree.h"
9 #include "commit.h"
10 #include "blob.h"
11 #include "builtin.h"
12 #include "tree-walk.h"
13 #include "diff.h"
14 #include "diffcore.h"
15 #include "tag.h"
16 #include "unpack-trees.h"
17 #include "string-list.h"
18 #include "xdiff-interface.h"
19 #include "ll-merge.h"
20 #include "attr.h"
21 #include "merge-recursive.h"
22 #include "dir.h"
23 #include "submodule.h"
24
25 static struct tree *shift_tree_object(struct tree *one, struct tree *two,
26                                       const char *subtree_shift)
27 {
28         unsigned char shifted[20];
29
30         if (!*subtree_shift) {
31                 shift_tree(one->object.sha1, two->object.sha1, shifted, 0);
32         } else {
33                 shift_tree_by(one->object.sha1, two->object.sha1, shifted,
34                               subtree_shift);
35         }
36         if (!hashcmp(two->object.sha1, shifted))
37                 return two;
38         return lookup_tree(shifted);
39 }
40
41 /*
42  * A virtual commit has (const char *)commit->util set to the name.
43  */
44
45 static struct commit *make_virtual_commit(struct tree *tree, const char *comment)
46 {
47         struct commit *commit = xcalloc(1, sizeof(struct commit));
48         commit->tree = tree;
49         commit->util = (void*)comment;
50         /* avoid warnings */
51         commit->object.parsed = 1;
52         return commit;
53 }
54
/*
 * Since we use get_tree_entry(), which does not put the read object into
 * the object pool, we cannot rely on a == b.
 *
 * Returns 2 when both pointers are NULL, 1 when both are non-NULL and
 * hashcmp() reports them equal, and 0 otherwise.
 */
static int sha_eq(const unsigned char *a, const unsigned char *b)
{
	if (a && b)
		return hashcmp(a, b) == 0;
	if (!a && !b)
		return 2;
	return 0;
}
65
/* Kind of rename situation; stored in rename_conflict_info.rename_type. */
enum rename_type {
	RENAME_NORMAL           = 0,
	RENAME_DELETE           = 1,
	RENAME_ONE_FILE_TO_ONE  = 2,
	RENAME_ONE_FILE_TO_TWO  = 3,
	RENAME_TWO_FILES_TO_ONE = 4
};
73
74 struct rename_conflict_info {
75         enum rename_type rename_type;
76         struct diff_filepair *pair1;
77         struct diff_filepair *pair2;
78         const char *branch1;
79         const char *branch2;
80         struct stage_data *dst_entry1;
81         struct stage_data *dst_entry2;
82         struct diff_filespec ren1_other;
83         struct diff_filespec ren2_other;
84 };
85
/*
 * Since we want to write the index eventually, we cannot reuse the index
 * for these (temporary) data.
 *
 * stages[] is indexed by index stage number (1..3 are filled in by the
 * code in this file; slot 0 is left zeroed by the allocators).
 */
struct stage_data {
	struct {
		unsigned int mode;
		unsigned char sha[20];
	} stages[4];
	/* set by setup_rename_conflict_info(), NULL otherwise */
	struct rename_conflict_info *rename_conflict_info;
	unsigned int processed:1;
};
98
99 static inline void setup_rename_conflict_info(enum rename_type rename_type,
100                                               struct diff_filepair *pair1,
101                                               struct diff_filepair *pair2,
102                                               const char *branch1,
103                                               const char *branch2,
104                                               struct stage_data *dst_entry1,
105                                               struct stage_data *dst_entry2,
106                                               struct merge_options *o,
107                                               struct stage_data *src_entry1,
108                                               struct stage_data *src_entry2)
109 {
110         struct rename_conflict_info *ci = xcalloc(1, sizeof(struct rename_conflict_info));
111         ci->rename_type = rename_type;
112         ci->pair1 = pair1;
113         ci->branch1 = branch1;
114         ci->branch2 = branch2;
115
116         ci->dst_entry1 = dst_entry1;
117         dst_entry1->rename_conflict_info = ci;
118         dst_entry1->processed = 0;
119
120         assert(!pair2 == !dst_entry2);
121         if (dst_entry2) {
122                 ci->dst_entry2 = dst_entry2;
123                 ci->pair2 = pair2;
124                 dst_entry2->rename_conflict_info = ci;
125         }
126
127         if (rename_type == RENAME_TWO_FILES_TO_ONE) {
128                 /*
129                  * For each rename, there could have been
130                  * modifications on the side of history where that
131                  * file was not renamed.
132                  */
133                 int ostage1 = o->branch1 == branch1 ? 3 : 2;
134                 int ostage2 = ostage1 ^ 1;
135
136                 ci->ren1_other.path = pair1->one->path;
137                 hashcpy(ci->ren1_other.sha1, src_entry1->stages[ostage1].sha);
138                 ci->ren1_other.mode = src_entry1->stages[ostage1].mode;
139
140                 ci->ren2_other.path = pair2->one->path;
141                 hashcpy(ci->ren2_other.sha1, src_entry2->stages[ostage2].sha);
142                 ci->ren2_other.mode = src_entry2->stages[ostage2].mode;
143         }
144 }
145
146 static int show(struct merge_options *o, int v)
147 {
148         return (!o->call_depth && o->verbosity >= v) || o->verbosity >= 5;
149 }
150
151 static void flush_output(struct merge_options *o)
152 {
153         if (o->obuf.len) {
154                 fputs(o->obuf.buf, stdout);
155                 strbuf_reset(&o->obuf);
156         }
157 }
158
159 __attribute__((format (printf, 3, 4)))
160 static void output(struct merge_options *o, int v, const char *fmt, ...)
161 {
162         va_list ap;
163
164         if (!show(o, v))
165                 return;
166
167         strbuf_grow(&o->obuf, o->call_depth * 2 + 2);
168         memset(o->obuf.buf + o->obuf.len, ' ', o->call_depth * 2);
169         strbuf_setlen(&o->obuf, o->obuf.len + o->call_depth * 2);
170
171         va_start(ap, fmt);
172         strbuf_vaddf(&o->obuf, fmt, ap);
173         va_end(ap);
174
175         strbuf_add(&o->obuf, "\n", 1);
176         if (!o->buffer_output)
177                 flush_output(o);
178 }
179
180 static void output_commit_title(struct merge_options *o, struct commit *commit)
181 {
182         int i;
183         flush_output(o);
184         for (i = o->call_depth; i--;)
185                 fputs("  ", stdout);
186         if (commit->util)
187                 printf("virtual %s\n", (char *)commit->util);
188         else {
189                 printf("%s ", find_unique_abbrev(commit->object.sha1, DEFAULT_ABBREV));
190                 if (parse_commit(commit) != 0)
191                         printf("(bad commit)\n");
192                 else {
193                         const char *title;
194                         int len = find_commit_subject(commit->buffer, &title);
195                         if (len)
196                                 printf("%.*s\n", len, title);
197                 }
198         }
199 }
200
201 static int add_cacheinfo(unsigned int mode, const unsigned char *sha1,
202                 const char *path, int stage, int refresh, int options)
203 {
204         struct cache_entry *ce;
205         ce = make_cache_entry(mode, sha1 ? sha1 : null_sha1, path, stage, refresh);
206         if (!ce)
207                 return error("addinfo_cache failed for path '%s'", path);
208         return add_cache_entry(ce, options);
209 }
210
211 static void init_tree_desc_from_tree(struct tree_desc *desc, struct tree *tree)
212 {
213         parse_tree(tree);
214         init_tree_desc(desc, tree->buffer, tree->size);
215 }
216
217 static int git_merge_trees(int index_only,
218                            struct tree *common,
219                            struct tree *head,
220                            struct tree *merge)
221 {
222         int rc;
223         struct tree_desc t[3];
224         struct unpack_trees_options opts;
225
226         memset(&opts, 0, sizeof(opts));
227         if (index_only)
228                 opts.index_only = 1;
229         else
230                 opts.update = 1;
231         opts.merge = 1;
232         opts.head_idx = 2;
233         opts.fn = threeway_merge;
234         opts.src_index = &the_index;
235         opts.dst_index = &the_index;
236         setup_unpack_trees_porcelain(&opts, "merge");
237
238         init_tree_desc_from_tree(t+0, common);
239         init_tree_desc_from_tree(t+1, head);
240         init_tree_desc_from_tree(t+2, merge);
241
242         rc = unpack_trees(3, t, &opts);
243         cache_tree_free(&active_cache_tree);
244         return rc;
245 }
246
247 struct tree *write_tree_from_memory(struct merge_options *o)
248 {
249         struct tree *result = NULL;
250
251         if (unmerged_cache()) {
252                 int i;
253                 fprintf(stderr, "BUG: There are unmerged index entries:\n");
254                 for (i = 0; i < active_nr; i++) {
255                         struct cache_entry *ce = active_cache[i];
256                         if (ce_stage(ce))
257                                 fprintf(stderr, "BUG: %d %.*s\n", ce_stage(ce),
258                                         (int)ce_namelen(ce), ce->name);
259                 }
260                 die("Bug in merge-recursive.c");
261         }
262
263         if (!active_cache_tree)
264                 active_cache_tree = cache_tree();
265
266         if (!cache_tree_fully_valid(active_cache_tree) &&
267             cache_tree_update(active_cache_tree,
268                               active_cache, active_nr, 0, 0) < 0)
269                 die("error building trees");
270
271         result = lookup_tree(active_cache_tree->sha1);
272
273         return result;
274 }
275
276 static int save_files_dirs(const unsigned char *sha1,
277                 const char *base, int baselen, const char *path,
278                 unsigned int mode, int stage, void *context)
279 {
280         int len = strlen(path);
281         char *newpath = xmalloc(baselen + len + 1);
282         struct merge_options *o = context;
283
284         memcpy(newpath, base, baselen);
285         memcpy(newpath + baselen, path, len);
286         newpath[baselen + len] = '\0';
287
288         if (S_ISDIR(mode))
289                 string_list_insert(&o->current_directory_set, newpath);
290         else
291                 string_list_insert(&o->current_file_set, newpath);
292         free(newpath);
293
294         return (S_ISDIR(mode) ? READ_TREE_RECURSIVE : 0);
295 }
296
297 static int get_files_dirs(struct merge_options *o, struct tree *tree)
298 {
299         int n;
300         if (read_tree_recursive(tree, "", 0, 0, NULL, save_files_dirs, o))
301                 return 0;
302         n = o->current_file_set.nr + o->current_directory_set.nr;
303         return n;
304 }
305
306 /*
307  * Returns an index_entry instance which doesn't have to correspond to
308  * a real cache entry in Git's index.
309  */
310 static struct stage_data *insert_stage_data(const char *path,
311                 struct tree *o, struct tree *a, struct tree *b,
312                 struct string_list *entries)
313 {
314         struct string_list_item *item;
315         struct stage_data *e = xcalloc(1, sizeof(struct stage_data));
316         get_tree_entry(o->object.sha1, path,
317                         e->stages[1].sha, &e->stages[1].mode);
318         get_tree_entry(a->object.sha1, path,
319                         e->stages[2].sha, &e->stages[2].mode);
320         get_tree_entry(b->object.sha1, path,
321                         e->stages[3].sha, &e->stages[3].mode);
322         item = string_list_insert(entries, path);
323         item->util = e;
324         return e;
325 }
326
327 /*
328  * Create a dictionary mapping file names to stage_data objects. The
329  * dictionary contains one entry for every path with a non-zero stage entry.
330  */
331 static struct string_list *get_unmerged(void)
332 {
333         struct string_list *unmerged = xcalloc(1, sizeof(struct string_list));
334         int i;
335
336         unmerged->strdup_strings = 1;
337
338         for (i = 0; i < active_nr; i++) {
339                 struct string_list_item *item;
340                 struct stage_data *e;
341                 struct cache_entry *ce = active_cache[i];
342                 if (!ce_stage(ce))
343                         continue;
344
345                 item = string_list_lookup(unmerged, ce->name);
346                 if (!item) {
347                         item = string_list_insert(unmerged, ce->name);
348                         item->util = xcalloc(1, sizeof(struct stage_data));
349                 }
350                 e = item->util;
351                 e->stages[ce_stage(ce)].mode = ce->ce_mode;
352                 hashcpy(e->stages[ce_stage(ce)].sha, ce->sha1);
353         }
354
355         return unmerged;
356 }
357
358 static int string_list_df_name_compare(const void *a, const void *b)
359 {
360         const struct string_list_item *one = a;
361         const struct string_list_item *two = b;
362         int onelen = strlen(one->string);
363         int twolen = strlen(two->string);
364         /*
365          * Here we only care that entries for D/F conflicts are
366          * adjacent, in particular with the file of the D/F conflict
367          * appearing before files below the corresponding directory.
368          * The order of the rest of the list is irrelevant for us.
369          *
370          * To achieve this, we sort with df_name_compare and provide
371          * the mode S_IFDIR so that D/F conflicts will sort correctly.
372          * We use the mode S_IFDIR for everything else for simplicity,
373          * since in other cases any changes in their order due to
374          * sorting cause no problems for us.
375          */
376         int cmp = df_name_compare(one->string, onelen, S_IFDIR,
377                                   two->string, twolen, S_IFDIR);
378         /*
379          * Now that 'foo' and 'foo/bar' compare equal, we have to make sure
380          * that 'foo' comes before 'foo/bar'.
381          */
382         if (cmp)
383                 return cmp;
384         return onelen - twolen;
385 }
386
387 static void record_df_conflict_files(struct merge_options *o,
388                                      struct string_list *entries)
389 {
390         /* If there is a D/F conflict and the file for such a conflict
391          * currently exist in the working copy, we want to allow it to be
392          * removed to make room for the corresponding directory if needed.
393          * The files underneath the directories of such D/F conflicts will
394          * be processed before the corresponding file involved in the D/F
395          * conflict.  If the D/F directory ends up being removed by the
396          * merge, then we won't have to touch the D/F file.  If the D/F
397          * directory needs to be written to the working copy, then the D/F
398          * file will simply be removed (in make_room_for_path()) to make
399          * room for the necessary paths.  Note that if both the directory
400          * and the file need to be present, then the D/F file will be
401          * reinstated with a new unique name at the time it is processed.
402          */
403         const char *last_file = NULL;
404         int last_len = 0;
405         int i;
406
407         /*
408          * If we're merging merge-bases, we don't want to bother with
409          * any working directory changes.
410          */
411         if (o->call_depth)
412                 return;
413
414         /* Ensure D/F conflicts are adjacent in the entries list. */
415         qsort(entries->items, entries->nr, sizeof(*entries->items),
416               string_list_df_name_compare);
417
418         string_list_clear(&o->df_conflict_file_set, 1);
419         for (i = 0; i < entries->nr; i++) {
420                 const char *path = entries->items[i].string;
421                 int len = strlen(path);
422                 struct stage_data *e = entries->items[i].util;
423
424                 /*
425                  * Check if last_file & path correspond to a D/F conflict;
426                  * i.e. whether path is last_file+'/'+<something>.
427                  * If so, record that it's okay to remove last_file to make
428                  * room for path and friends if needed.
429                  */
430                 if (last_file &&
431                     len > last_len &&
432                     memcmp(path, last_file, last_len) == 0 &&
433                     path[last_len] == '/') {
434                         string_list_insert(&o->df_conflict_file_set, last_file);
435                 }
436
437                 /*
438                  * Determine whether path could exist as a file in the
439                  * working directory as a possible D/F conflict.  This
440                  * will only occur when it exists in stage 2 as a
441                  * file.
442                  */
443                 if (S_ISREG(e->stages[2].mode) || S_ISLNK(e->stages[2].mode)) {
444                         last_file = path;
445                         last_len = len;
446                 } else {
447                         last_file = NULL;
448                 }
449         }
450 }
451
/*
 * One detected rename, as collected by get_renames(): the diff pair
 * plus the stage data of its source and destination paths.
 */
struct rename {
	struct diff_filepair *pair;
	struct stage_data *src_entry, *dst_entry;
	unsigned int processed:1;
};
458
459 /*
460  * Get information of all renames which occurred between 'o_tree' and
461  * 'tree'. We need the three trees in the merge ('o_tree', 'a_tree' and
462  * 'b_tree') to be able to associate the correct cache entries with
463  * the rename information. 'tree' is always equal to either a_tree or b_tree.
464  */
465 static struct string_list *get_renames(struct merge_options *o,
466                                        struct tree *tree,
467                                        struct tree *o_tree,
468                                        struct tree *a_tree,
469                                        struct tree *b_tree,
470                                        struct string_list *entries)
471 {
472         int i;
473         struct string_list *renames;
474         struct diff_options opts;
475
476         renames = xcalloc(1, sizeof(struct string_list));
477         diff_setup(&opts);
478         DIFF_OPT_SET(&opts, RECURSIVE);
479         opts.detect_rename = DIFF_DETECT_RENAME;
480         opts.rename_limit = o->merge_rename_limit >= 0 ? o->merge_rename_limit :
481                             o->diff_rename_limit >= 0 ? o->diff_rename_limit :
482                             1000;
483         opts.rename_score = o->rename_score;
484         opts.show_rename_progress = o->show_rename_progress;
485         opts.output_format = DIFF_FORMAT_NO_OUTPUT;
486         if (diff_setup_done(&opts) < 0)
487                 die("diff setup failed");
488         diff_tree_sha1(o_tree->object.sha1, tree->object.sha1, "", &opts);
489         diffcore_std(&opts);
490         if (opts.needed_rename_limit > o->needed_rename_limit)
491                 o->needed_rename_limit = opts.needed_rename_limit;
492         for (i = 0; i < diff_queued_diff.nr; ++i) {
493                 struct string_list_item *item;
494                 struct rename *re;
495                 struct diff_filepair *pair = diff_queued_diff.queue[i];
496                 if (pair->status != 'R') {
497                         diff_free_filepair(pair);
498                         continue;
499                 }
500                 re = xmalloc(sizeof(*re));
501                 re->processed = 0;
502                 re->pair = pair;
503                 item = string_list_lookup(entries, re->pair->one->path);
504                 if (!item)
505                         re->src_entry = insert_stage_data(re->pair->one->path,
506                                         o_tree, a_tree, b_tree, entries);
507                 else
508                         re->src_entry = item->util;
509
510                 item = string_list_lookup(entries, re->pair->two->path);
511                 if (!item)
512                         re->dst_entry = insert_stage_data(re->pair->two->path,
513                                         o_tree, a_tree, b_tree, entries);
514                 else
515                         re->dst_entry = item->util;
516                 item = string_list_insert(renames, pair->one->path);
517                 item->util = re;
518         }
519         opts.output_format = DIFF_FORMAT_NO_OUTPUT;
520         diff_queued_diff.nr = 0;
521         diff_flush(&opts);
522         return renames;
523 }
524
525 static int update_stages(const char *path, const struct diff_filespec *o,
526                          const struct diff_filespec *a,
527                          const struct diff_filespec *b)
528 {
529         int clear = 1;
530         int options = ADD_CACHE_OK_TO_ADD | ADD_CACHE_SKIP_DFCHECK;
531         if (clear)
532                 if (remove_file_from_cache(path))
533                         return -1;
534         if (o)
535                 if (add_cacheinfo(o->mode, o->sha1, path, 1, 0, options))
536                         return -1;
537         if (a)
538                 if (add_cacheinfo(a->mode, a->sha1, path, 2, 0, options))
539                         return -1;
540         if (b)
541                 if (add_cacheinfo(b->mode, b->sha1, path, 3, 0, options))
542                         return -1;
543         return 0;
544 }
545
546 static void update_entry(struct stage_data *entry,
547                          struct diff_filespec *o,
548                          struct diff_filespec *a,
549                          struct diff_filespec *b)
550 {
551         entry->processed = 0;
552         entry->stages[1].mode = o->mode;
553         entry->stages[2].mode = a->mode;
554         entry->stages[3].mode = b->mode;
555         hashcpy(entry->stages[1].sha, o->sha1);
556         hashcpy(entry->stages[2].sha, a->sha1);
557         hashcpy(entry->stages[3].sha, b->sha1);
558 }
559
560 static int remove_file(struct merge_options *o, int clean,
561                        const char *path, int no_wd)
562 {
563         int update_cache = o->call_depth || clean;
564         int update_working_directory = !o->call_depth && !no_wd;
565
566         if (update_cache) {
567                 if (remove_file_from_cache(path))
568                         return -1;
569         }
570         if (update_working_directory) {
571                 if (remove_path(path))
572                         return -1;
573         }
574         return 0;
575 }
576
577 static char *unique_path(struct merge_options *o, const char *path, const char *branch)
578 {
579         char *newpath = xmalloc(strlen(path) + 1 + strlen(branch) + 8 + 1);
580         int suffix = 0;
581         struct stat st;
582         char *p = newpath + strlen(path);
583         strcpy(newpath, path);
584         *(p++) = '~';
585         strcpy(p, branch);
586         for (; *p; ++p)
587                 if ('/' == *p)
588                         *p = '_';
589         while (string_list_has_string(&o->current_file_set, newpath) ||
590                string_list_has_string(&o->current_directory_set, newpath) ||
591                lstat(newpath, &st) == 0)
592                 sprintf(p, "_%d", suffix++);
593
594         string_list_insert(&o->current_file_set, newpath);
595         return newpath;
596 }
597
/*
 * Write 'size' bytes from 'buf' to 'fd'.  EPIPE silently ends the
 * write; any other write error, or a write that makes no progress,
 * is fatal.
 */
static void flush_buffer(int fd, const char *buf, unsigned long size)
{
	while (size > 0) {
		long written = write_in_full(fd, buf, size);

		if (!written)
			die("merge-recursive: disk full?");
		if (written < 0) {
			/* Ignore epipe */
			if (errno != EPIPE)
				die_errno("merge-recursive");
			return;
		}
		buf += written;
		size -= written;
	}
}
614
615 static int dir_in_way(const char *path, int check_working_copy)
616 {
617         int pos, pathlen = strlen(path);
618         char *dirpath = xmalloc(pathlen + 2);
619         struct stat st;
620
621         strcpy(dirpath, path);
622         dirpath[pathlen] = '/';
623         dirpath[pathlen+1] = '\0';
624
625         pos = cache_name_pos(dirpath, pathlen+1);
626
627         if (pos < 0)
628                 pos = -1 - pos;
629         if (pos < active_nr &&
630             !strncmp(dirpath, active_cache[pos]->name, pathlen+1)) {
631                 free(dirpath);
632                 return 1;
633         }
634
635         free(dirpath);
636         return check_working_copy && !lstat(path, &st) && S_ISDIR(st.st_mode);
637 }
638
639 static int was_tracked(const char *path)
640 {
641         int pos = cache_name_pos(path, strlen(path));
642
643         if (pos < 0)
644                 pos = -1 - pos;
645         while (pos < active_nr &&
646                !strcmp(path, active_cache[pos]->name)) {
647                 /*
648                  * If stage #0, it is definitely tracked.
649                  * If it has stage #2 then it was tracked
650                  * before this merge started.  All other
651                  * cases the path was not tracked.
652                  */
653                 switch (ce_stage(active_cache[pos])) {
654                 case 0:
655                 case 2:
656                         return 1;
657                 }
658                 pos++;
659         }
660         return 0;
661 }
662
/*
 * Returns 1 when 'path' exists but is not tracked according to
 * was_tracked(), i.e. when overwriting it would lose an untracked
 * file; 0 otherwise.
 */
static int would_lose_untracked(const char *path)
{
	if (was_tracked(path))
		return 0;
	return file_exists(path) != 0;
}
667
668 static int make_room_for_path(struct merge_options *o, const char *path)
669 {
670         int status, i;
671         const char *msg = "failed to create path '%s'%s";
672
673         /* Unlink any D/F conflict files that are in the way */
674         for (i = 0; i < o->df_conflict_file_set.nr; i++) {
675                 const char *df_path = o->df_conflict_file_set.items[i].string;
676                 size_t pathlen = strlen(path);
677                 size_t df_pathlen = strlen(df_path);
678                 if (df_pathlen < pathlen &&
679                     path[df_pathlen] == '/' &&
680                     strncmp(path, df_path, df_pathlen) == 0) {
681                         output(o, 3,
682                                "Removing %s to make room for subdirectory\n",
683                                df_path);
684                         unlink(df_path);
685                         unsorted_string_list_delete_item(&o->df_conflict_file_set,
686                                                          i, 0);
687                         break;
688                 }
689         }
690
691         /* Make sure leading directories are created */
692         status = safe_create_leading_directories_const(path);
693         if (status) {
694                 if (status == -3) {
695                         /* something else exists */
696                         error(msg, path, ": perhaps a D/F conflict?");
697                         return -1;
698                 }
699                 die(msg, path, "");
700         }
701
702         /*
703          * Do not unlink a file in the work tree if we are not
704          * tracking it.
705          */
706         if (would_lose_untracked(path))
707                 return error("refusing to lose untracked file at '%s'",
708                              path);
709
710         /* Successful unlink is good.. */
711         if (!unlink(path))
712                 return 0;
713         /* .. and so is no existing file */
714         if (errno == ENOENT)
715                 return 0;
716         /* .. but not some other error (who really cares what?) */
717         return error(msg, path, ": perhaps a D/F conflict?");
718 }
719
720 static void update_file_flags(struct merge_options *o,
721                               const unsigned char *sha,
722                               unsigned mode,
723                               const char *path,
724                               int update_cache,
725                               int update_wd)
726 {
727         if (o->call_depth)
728                 update_wd = 0;
729
730         if (update_wd) {
731                 enum object_type type;
732                 void *buf;
733                 unsigned long size;
734
735                 if (S_ISGITLINK(mode)) {
736                         /*
737                          * We may later decide to recursively descend into
738                          * the submodule directory and update its index
739                          * and/or work tree, but we do not do that now.
740                          */
741                         update_wd = 0;
742                         goto update_index;
743                 }
744
745                 buf = read_sha1_file(sha, &type, &size);
746                 if (!buf)
747                         die("cannot read object %s '%s'", sha1_to_hex(sha), path);
748                 if (type != OBJ_BLOB)
749                         die("blob expected for %s '%s'", sha1_to_hex(sha), path);
750                 if (S_ISREG(mode)) {
751                         struct strbuf strbuf = STRBUF_INIT;
752                         if (convert_to_working_tree(path, buf, size, &strbuf)) {
753                                 free(buf);
754                                 size = strbuf.len;
755                                 buf = strbuf_detach(&strbuf, NULL);
756                         }
757                 }
758
759                 if (make_room_for_path(o, path) < 0) {
760                         update_wd = 0;
761                         free(buf);
762                         goto update_index;
763                 }
764                 if (S_ISREG(mode) || (!has_symlinks && S_ISLNK(mode))) {
765                         int fd;
766                         if (mode & 0100)
767                                 mode = 0777;
768                         else
769                                 mode = 0666;
770                         fd = open(path, O_WRONLY | O_TRUNC | O_CREAT, mode);
771                         if (fd < 0)
772                                 die_errno("failed to open '%s'", path);
773                         flush_buffer(fd, buf, size);
774                         close(fd);
775                 } else if (S_ISLNK(mode)) {
776                         char *lnk = xmemdupz(buf, size);
777                         safe_create_leading_directories_const(path);
778                         unlink(path);
779                         if (symlink(lnk, path))
780                                 die_errno("failed to symlink '%s'", path);
781                         free(lnk);
782                 } else
783                         die("do not know what to do with %06o %s '%s'",
784                             mode, sha1_to_hex(sha), path);
785                 free(buf);
786         }
787  update_index:
788         if (update_cache)
789                 add_cacheinfo(mode, sha, path, 0, update_wd, ADD_CACHE_OK_TO_ADD);
790 }
791
792 static void update_file(struct merge_options *o,
793                         int clean,
794                         const unsigned char *sha,
795                         unsigned mode,
796                         const char *path)
797 {
798         update_file_flags(o, sha, mode, path, o->call_depth || clean, !o->call_depth);
799 }
800
801 /* Low level file merging, update and removal */
802
/* Object name and mode of a merged file, plus two one-bit status flags. */
struct merge_file_info {
	unsigned char sha[20];
	unsigned int mode;
	unsigned int clean:1;
	unsigned int merge:1;
};
809
810 static int merge_3way(struct merge_options *o,
811                       mmbuffer_t *result_buf,
812                       const struct diff_filespec *one,
813                       const struct diff_filespec *a,
814                       const struct diff_filespec *b,
815                       const char *branch1,
816                       const char *branch2)
817 {
818         mmfile_t orig, src1, src2;
819         struct ll_merge_options ll_opts = {0};
820         char *base_name, *name1, *name2;
821         int merge_status;
822
823         ll_opts.renormalize = o->renormalize;
824         ll_opts.xdl_opts = o->xdl_opts;
825
826         if (o->call_depth) {
827                 ll_opts.virtual_ancestor = 1;
828                 ll_opts.variant = 0;
829         } else {
830                 switch (o->recursive_variant) {
831                 case MERGE_RECURSIVE_OURS:
832                         ll_opts.variant = XDL_MERGE_FAVOR_OURS;
833                         break;
834                 case MERGE_RECURSIVE_THEIRS:
835                         ll_opts.variant = XDL_MERGE_FAVOR_THEIRS;
836                         break;
837                 default:
838                         ll_opts.variant = 0;
839                         break;
840                 }
841         }
842
843         if (strcmp(a->path, b->path) ||
844             (o->ancestor != NULL && strcmp(a->path, one->path) != 0)) {
845                 base_name = o->ancestor == NULL ? NULL :
846                         xstrdup(mkpath("%s:%s", o->ancestor, one->path));
847                 name1 = xstrdup(mkpath("%s:%s", branch1, a->path));
848                 name2 = xstrdup(mkpath("%s:%s", branch2, b->path));
849         } else {
850                 base_name = o->ancestor == NULL ? NULL :
851                         xstrdup(mkpath("%s", o->ancestor));
852                 name1 = xstrdup(mkpath("%s", branch1));
853                 name2 = xstrdup(mkpath("%s", branch2));
854         }
855
856         read_mmblob(&orig, one->sha1);
857         read_mmblob(&src1, a->sha1);
858         read_mmblob(&src2, b->sha1);
859
860         merge_status = ll_merge(result_buf, a->path, &orig, base_name,
861                                 &src1, name1, &src2, name2, &ll_opts);
862
863         free(name1);
864         free(name2);
865         free(orig.ptr);
866         free(src1.ptr);
867         free(src2.ptr);
868         return merge_status;
869 }
870
871 static struct merge_file_info merge_file_1(struct merge_options *o,
872                                            const struct diff_filespec *one,
873                                            const struct diff_filespec *a,
874                                            const struct diff_filespec *b,
875                                            const char *branch1,
876                                            const char *branch2)
877 {
878         struct merge_file_info result;
879         result.merge = 0;
880         result.clean = 1;
881
882         if ((S_IFMT & a->mode) != (S_IFMT & b->mode)) {
883                 result.clean = 0;
884                 if (S_ISREG(a->mode)) {
885                         result.mode = a->mode;
886                         hashcpy(result.sha, a->sha1);
887                 } else {
888                         result.mode = b->mode;
889                         hashcpy(result.sha, b->sha1);
890                 }
891         } else {
892                 if (!sha_eq(a->sha1, one->sha1) && !sha_eq(b->sha1, one->sha1))
893                         result.merge = 1;
894
895                 /*
896                  * Merge modes
897                  */
898                 if (a->mode == b->mode || a->mode == one->mode)
899                         result.mode = b->mode;
900                 else {
901                         result.mode = a->mode;
902                         if (b->mode != one->mode) {
903                                 result.clean = 0;
904                                 result.merge = 1;
905                         }
906                 }
907
908                 if (sha_eq(a->sha1, b->sha1) || sha_eq(a->sha1, one->sha1))
909                         hashcpy(result.sha, b->sha1);
910                 else if (sha_eq(b->sha1, one->sha1))
911                         hashcpy(result.sha, a->sha1);
912                 else if (S_ISREG(a->mode)) {
913                         mmbuffer_t result_buf;
914                         int merge_status;
915
916                         merge_status = merge_3way(o, &result_buf, one, a, b,
917                                                   branch1, branch2);
918
919                         if ((merge_status < 0) || !result_buf.ptr)
920                                 die("Failed to execute internal merge");
921
922                         if (write_sha1_file(result_buf.ptr, result_buf.size,
923                                             blob_type, result.sha))
924                                 die("Unable to add %s to database",
925                                     a->path);
926
927                         free(result_buf.ptr);
928                         result.clean = (merge_status == 0);
929                 } else if (S_ISGITLINK(a->mode)) {
930                         result.clean = merge_submodule(result.sha, one->path, one->sha1,
931                                                        a->sha1, b->sha1);
932                 } else if (S_ISLNK(a->mode)) {
933                         hashcpy(result.sha, a->sha1);
934
935                         if (!sha_eq(a->sha1, b->sha1))
936                                 result.clean = 0;
937                 } else {
938                         die("unsupported object type in the tree");
939                 }
940         }
941
942         return result;
943 }
944
945 static struct merge_file_info merge_file(struct merge_options *o,
946                                          const char *path,
947                                          const unsigned char *o_sha, int o_mode,
948                                          const unsigned char *a_sha, int a_mode,
949                                          const unsigned char *b_sha, int b_mode,
950                                          const char *branch1,
951                                          const char *branch2)
952 {
953         struct diff_filespec one, a, b;
954
955         one.path = a.path = b.path = (char *)path;
956         hashcpy(one.sha1, o_sha);
957         one.mode = o_mode;
958         hashcpy(a.sha1, a_sha);
959         a.mode = a_mode;
960         hashcpy(b.sha1, b_sha);
961         b.mode = b_mode;
962         return merge_file_1(o, &one, &a, &b, branch1, branch2);
963 }
964
965 static void conflict_rename_delete(struct merge_options *o,
966                                    struct diff_filepair *pair,
967                                    const char *rename_branch,
968                                    const char *other_branch)
969 {
970         char *dest_name = pair->two->path;
971         int df_conflict = 0;
972
973         output(o, 1, "CONFLICT (rename/delete): Rename %s->%s in %s "
974                "and deleted in %s",
975                pair->one->path, pair->two->path, rename_branch,
976                other_branch);
977         if (!o->call_depth)
978                 update_stages(dest_name, NULL,
979                               rename_branch == o->branch1 ? pair->two : NULL,
980                               rename_branch == o->branch1 ? NULL : pair->two);
981         if (dir_in_way(dest_name, !o->call_depth)) {
982                 dest_name = unique_path(o, dest_name, rename_branch);
983                 df_conflict = 1;
984         }
985         update_file(o, 0, pair->two->sha1, pair->two->mode, dest_name);
986         if (df_conflict)
987                 free(dest_name);
988 }
989
990 static void conflict_rename_rename_1to2(struct merge_options *o,
991                                         struct rename_conflict_info *ci)
992 {
993         /* One file was renamed in both branches, but to different names. */
994         struct diff_filespec *one = ci->pair1->one;
995         struct diff_filespec *a = ci->pair1->two;
996         struct diff_filespec *b = ci->pair2->two;
997         const char *dst_name_a = a->path;
998         const char *dst_name_b = b->path;
999         char *del[2];
1000         int delp = 0;
1001
1002         output(o, 1, "CONFLICT (rename/rename): "
1003                "Rename \"%s\"->\"%s\" in branch \"%s\" "
1004                "rename \"%s\"->\"%s\" in \"%s\"%s",
1005                one->path, a->path, ci->branch1,
1006                one->path, b->path, ci->branch2,
1007                o->call_depth ? " (left unresolved)" : "");
1008         if (dir_in_way(a->path, !o->call_depth)) {
1009                 dst_name_a = del[delp++] = unique_path(o, a->path, ci->branch1);
1010                 output(o, 1, "%s is a directory in %s adding as %s instead",
1011                        a->path, ci->branch2, dst_name_a);
1012         }
1013         if (dir_in_way(b->path, !o->call_depth)) {
1014                 dst_name_b = del[delp++] = unique_path(o, b->path, ci->branch2);
1015                 output(o, 1, "%s is a directory in %s adding as %s instead",
1016                        b->path, ci->branch1, dst_name_b);
1017         }
1018         if (o->call_depth) {
1019                 struct merge_file_info mfi;
1020                 mfi = merge_file(o, one->path,
1021                                  one->sha1, one->mode,
1022                                  a->sha1, a->mode,
1023                                  b->sha1, b->mode,
1024                                  ci->branch1, ci->branch2);
1025                 /*
1026                  * FIXME: For rename/add-source conflicts (if we could detect
1027                  * such), this is wrong.  We should instead find a unique
1028                  * pathname and then either rename the add-source file to that
1029                  * unique path, or use that unique path instead of src here.
1030                  */
1031                 update_file(o, 0, mfi.sha, mfi.mode, one->path);
1032                 remove_file_from_cache(a->path);
1033                 remove_file_from_cache(b->path);
1034         } else {
1035                 update_stages(a->path, NULL, a, NULL);
1036                 update_stages(b->path, NULL, NULL, b);
1037
1038                 update_file(o, 0, a->sha1, a->mode, dst_name_a);
1039                 update_file(o, 0, b->sha1, b->mode, dst_name_b);
1040         }
1041         while (delp--)
1042                 free(del[delp]);
1043 }
1044
1045 static void conflict_rename_rename_2to1(struct merge_options *o,
1046                                         struct rename_conflict_info *ci)
1047 {
1048         /* Two files, a & b, were renamed to the same thing, c. */
1049         struct diff_filespec *a = ci->pair1->one;
1050         struct diff_filespec *b = ci->pair2->one;
1051         struct diff_filespec *c1 = ci->pair1->two;
1052         struct diff_filespec *c2 = ci->pair2->two;
1053         char *path = c1->path; /* == c2->path */
1054
1055         output(o, 1, "CONFLICT (rename/rename): "
1056                "Rename %s->%s in %s. "
1057                "Rename %s->%s in %s",
1058                a->path, c1->path, ci->branch1,
1059                b->path, c2->path, ci->branch2);
1060
1061         remove_file(o, 1, a->path, would_lose_untracked(a->path));
1062         remove_file(o, 1, b->path, would_lose_untracked(b->path));
1063
1064         if (o->call_depth) {
1065                 struct merge_file_info mfi;
1066                 mfi = merge_file(o, path, null_sha1, 0,
1067                                  c1->sha1, c1->mode,
1068                                  c2->sha1, c2->mode,
1069                                  ci->branch1, ci->branch2);
1070                 output(o, 1, "Adding merged %s", path);
1071                 update_file(o, 0, mfi.sha, mfi.mode, path);
1072         } else {
1073                 char *new_path1 = unique_path(o, path, ci->branch1);
1074                 char *new_path2 = unique_path(o, path, ci->branch2);
1075                 output(o, 1, "Renaming %s to %s and %s to %s instead",
1076                        a->path, new_path1, b->path, new_path2);
1077                 remove_file(o, 0, path, 0);
1078                 update_file(o, 0, c1->sha1, c1->mode, new_path1);
1079                 update_file(o, 0, c2->sha1, c2->mode, new_path2);
1080                 free(new_path2);
1081                 free(new_path1);
1082         }
1083 }
1084
/*
 * Reconcile the renames detected on the two sides of the merge.
 *
 * a_renames and b_renames are walked together in key order (the key is
 * items[].string, presumably the rename source path -- the die() below
 * enforces that equal keys mean equal sources).  For each step one of
 * three situations is handled:
 *
 *  - the same source was renamed on both sides: to different destinations
 *    (RENAME_ONE_FILE_TO_TWO, unclean) or to the same one
 *    (RENAME_ONE_FILE_TO_ONE);
 *  - two different sources were renamed to the same destination
 *    (RENAME_TWO_FILES_TO_ONE, unclean);
 *  - only one side renamed the file: the other side may have deleted the
 *    source (RENAME_DELETE), added an identical or a different file at
 *    the destination (rename/add), or merely modified the source
 *    (RENAME_NORMAL).
 *
 * Most outcomes are recorded via setup_rename_conflict_info() rather than
 * resolved here.  Returns 1 when no conflict was flagged in this function,
 * 0 otherwise.
 */
1085 static int process_renames(struct merge_options *o,
1086                            struct string_list *a_renames,
1087                            struct string_list *b_renames)
1088 {
1089         int clean_merge = 1, i, j;
1090         struct string_list a_by_dst = STRING_LIST_INIT_NODUP;
1091         struct string_list b_by_dst = STRING_LIST_INIT_NODUP;
1092         const struct rename *sre;
1093
             /* Index each side's renames by destination path; used for the
              * "two files renamed to one" lookup below. */
1094         for (i = 0; i < a_renames->nr; i++) {
1095                 sre = a_renames->items[i].util;
1096                 string_list_insert(&a_by_dst, sre->pair->two->path)->util
1097                         = (void *)sre;
1098         }
1099         for (i = 0; i < b_renames->nr; i++) {
1100                 sre = b_renames->items[i].util;
1101                 string_list_insert(&b_by_dst, sre->pair->two->path)->util
1102                         = (void *)sre;
1103         }
1104
1105         for (i = 0, j = 0; i < a_renames->nr || j < b_renames->nr;) {
1106                 struct string_list *renames1, *renames2Dst;
1107                 struct rename *ren1 = NULL, *ren2 = NULL;
1108                 const char *branch1, *branch2;
1109                 const char *ren1_src, *ren1_dst;
1110                 struct string_list_item *lookup;
1111
                     /* Merge-walk step: take the entry with the smaller key,
                      * or one entry from each list when the keys are equal. */
1112                 if (i >= a_renames->nr) {
1113                         ren2 = b_renames->items[j++].util;
1114                 } else if (j >= b_renames->nr) {
1115                         ren1 = a_renames->items[i++].util;
1116                 } else {
1117                         int compare = strcmp(a_renames->items[i].string,
1118                                              b_renames->items[j].string);
1119                         if (compare <= 0)
1120                                 ren1 = a_renames->items[i++].util;
1121                         if (compare >= 0)
1122                                 ren2 = b_renames->items[j++].util;
1123                 }
1124
1125                 /* TODO: refactor, so that 1/2 are not needed */
1126                 if (ren1) {
1127                         renames1 = a_renames;
1128                         renames2Dst = &b_by_dst;
1129                         branch1 = o->branch1;
1130                         branch2 = o->branch2;
1131                 } else {
                             /* Only side b has a rename here: swap roles so
                              * that ren1 is always the non-NULL rename. */
1132                         struct rename *tmp;
1133                         renames1 = b_renames;
1134                         renames2Dst = &a_by_dst;
1135                         branch1 = o->branch2;
1136                         branch2 = o->branch1;
1137                         tmp = ren2;
1138                         ren2 = ren1;
1139                         ren1 = tmp;
1140                 }
1141
                     /* A rename may already have been consumed as the partner
                      * of an earlier "two files to one" conflict. */
1142                 if (ren1->processed)
1143                         continue;
1144                 ren1->processed = 1;
1145                 ren1->dst_entry->processed = 1;
1146                 /* BUG: We should only mark src_entry as processed if we
1147                  * are not dealing with a rename + add-source case.
1148                  */
1149                 ren1->src_entry->processed = 1;
1150
1151                 ren1_src = ren1->pair->one->path;
1152                 ren1_dst = ren1->pair->two->path;
1153
1154                 if (ren2) {
1155                         /* One file renamed on both sides */
1156                         const char *ren2_src = ren2->pair->one->path;
1157                         const char *ren2_dst = ren2->pair->two->path;
1158                         enum rename_type rename_type;
1159                         if (strcmp(ren1_src, ren2_src) != 0)
1160                                 die("ren1_src != ren2_src");
1161                         ren2->dst_entry->processed = 1;
1162                         ren2->processed = 1;
1163                         if (strcmp(ren1_dst, ren2_dst) != 0) {
1164                                 rename_type = RENAME_ONE_FILE_TO_TWO;
1165                                 clean_merge = 0;
1166                         } else {
1167                                 rename_type = RENAME_ONE_FILE_TO_ONE;
1168                                 /* BUG: We should only remove ren1_src in
1169                                  * the base stage (think of rename +
1170                                  * add-source cases).
1171                                  */
1172                                 remove_file(o, 1, ren1_src, 1);
1173                                 update_entry(ren1->dst_entry,
1174                                              ren1->pair->one,
1175                                              ren1->pair->two,
1176                                              ren2->pair->two);
1177                         }
1178                         setup_rename_conflict_info(rename_type,
1179                                                    ren1->pair,
1180                                                    ren2->pair,
1181                                                    branch1,
1182                                                    branch2,
1183                                                    ren1->dst_entry,
1184                                                    ren2->dst_entry,
1185                                                    o,
1186                                                    NULL,
1187                                                    NULL);
1188                 } else if ((lookup = string_list_lookup(renames2Dst, ren1_dst))) {
1189                         /* Two different files renamed to the same thing */
1190                         char *ren2_dst;
1191                         ren2 = lookup->util;
1192                         ren2_dst = ren2->pair->two->path;
1193                         if (strcmp(ren1_dst, ren2_dst) != 0)
1194                                 die("ren1_dst != ren2_dst");
1195
1196                         clean_merge = 0;
1197                         ren2->processed = 1;
1198                         /*
1199                          * BUG: We should only mark src_entry as processed
1200                          * if we are not dealing with a rename + add-source
1201                          * case.
1202                          */
1203                         ren2->src_entry->processed = 1;
1204
1205                         setup_rename_conflict_info(RENAME_TWO_FILES_TO_ONE,
1206                                                    ren1->pair,
1207                                                    ren2->pair,
1208                                                    branch1,
1209                                                    branch2,
1210                                                    ren1->dst_entry,
1211                                                    ren2->dst_entry,
1212                                                    o,
1213                                                    ren1->src_entry,
1214                                                    ren2->src_entry);
1215
1216                 } else {
1217                         /* Renamed in 1, maybe changed in 2 */
1218                         /* we only use sha1 and mode of these */
1219                         struct diff_filespec src_other, dst_other;
1220                         int try_merge;
1221
1222                         /*
1223                          * unpack_trees loads entries from common-commit
1224                          * into stage 1, from head-commit into stage 2, and
1225                          * from merge-commit into stage 3.  We keep track
1226                          * of which side corresponds to the rename.
1227                          */
1228                         int renamed_stage = a_renames == renames1 ? 2 : 3;
1229                         int other_stage =   a_renames == renames1 ? 3 : 2;
1230
1231                         /* BUG: We should only remove ren1_src in the base
1232                          * stage and in other_stage (think of rename +
1233                          * add-source case).
1234                          */
1235                         remove_file(o, 1, ren1_src,
1236                                     renamed_stage == 2 || !was_tracked(ren1_src));
1237
                             /* What the non-renaming side has at the rename's
                              * source path and at its destination path. */
1238                         hashcpy(src_other.sha1, ren1->src_entry->stages[other_stage].sha);
1239                         src_other.mode = ren1->src_entry->stages[other_stage].mode;
1240                         hashcpy(dst_other.sha1, ren1->dst_entry->stages[other_stage].sha);
1241                         dst_other.mode = ren1->dst_entry->stages[other_stage].mode;
1242                         try_merge = 0;
1243
1244                         if (sha_eq(src_other.sha1, null_sha1)) {
1245                                 setup_rename_conflict_info(RENAME_DELETE,
1246                                                            ren1->pair,
1247                                                            NULL,
1248                                                            branch1,
1249                                                            branch2,
1250                                                            ren1->dst_entry,
1251                                                            NULL,
1252                                                            o,
1253                                                            NULL,
1254                                                            NULL);
1255                         } else if ((dst_other.mode == ren1->pair->two->mode) &&
1256                                    sha_eq(dst_other.sha1, ren1->pair->two->sha1)) {
1257                                 /* Added file on the other side
1258                                    identical to the file being
1259                                    renamed: clean merge */
1260                                 update_file(o, 1, ren1->pair->two->sha1, ren1->pair->two->mode, ren1_dst);
1261                         } else if (!sha_eq(dst_other.sha1, null_sha1)) {
1262                                 clean_merge = 0;
1263                                 try_merge = 1;
1264                                 output(o, 1, "CONFLICT (rename/add): Rename %s->%s in %s. "
1265                                        "%s added in %s",
1266                                        ren1_src, ren1_dst, branch1,
1267                                        ren1_dst, branch2);
1268                                 if (o->call_depth) {
1269                                         struct merge_file_info mfi;
1270                                         mfi = merge_file(o, ren1_dst, null_sha1, 0,
1271                                                          ren1->pair->two->sha1, ren1->pair->two->mode,
1272                                                          dst_other.sha1, dst_other.mode,
1273                                                          branch1, branch2);
1274                                         output(o, 1, "Adding merged %s", ren1_dst);
1275                                         update_file(o, 0, mfi.sha, mfi.mode, ren1_dst);
1276                                         try_merge = 0;
1277                                 } else {
1278                                         char *new_path = unique_path(o, ren1_dst, branch2);
1279                                         output(o, 1, "Adding as %s instead", new_path);
1280                                         update_file(o, 0, dst_other.sha1, dst_other.mode, new_path);
1281                                         free(new_path);
1282                                 }
1283                         } else
1284                                 try_merge = 1;
1285
1286                         if (try_merge) {
1287                                 struct diff_filespec *one, *a, *b;
1288                                 src_other.path = (char *)ren1_src;
1289
1290                                 one = ren1->pair->one;
                                     /* Keep a/b in head/merge order no matter
                                      * which side did the rename. */
1291                                 if (a_renames == renames1) {
1292                                         a = ren1->pair->two;
1293                                         b = &src_other;
1294                                 } else {
1295                                         b = ren1->pair->two;
1296                                         a = &src_other;
1297                                 }
1298                                 update_entry(ren1->dst_entry, one, a, b);
1299                                 setup_rename_conflict_info(RENAME_NORMAL,
1300                                                            ren1->pair,
1301                                                            NULL,
1302                                                            branch1,
1303                                                            NULL,
1304                                                            ren1->dst_entry,
1305                                                            NULL,
1306                                                            o,
1307                                                            NULL,
1308                                                            NULL);
1309                         }
1310                 }
1311         }
1312         string_list_clear(&a_by_dst, 0);
1313         string_list_clear(&b_by_dst, 0);
1314
1315         return clean_merge;
1316 }
1317
/*
 * Return 'sha' (with const cast away) when it names a real entry, or NULL
 * when the sha is the null sha1 or the mode is zero.
 */
static unsigned char *stage_sha(const unsigned char *sha, unsigned mode)
{
        if (is_null_sha1(sha) || !mode)
                return NULL;
        return (unsigned char *)sha;
}
1322
1323 static int read_sha1_strbuf(const unsigned char *sha1, struct strbuf *dst)
1324 {
1325         void *buf;
1326         enum object_type type;
1327         unsigned long size;
1328         buf = read_sha1_file(sha1, &type, &size);
1329         if (!buf)
1330                 return error("cannot read object %s", sha1_to_hex(sha1));
1331         if (type != OBJ_BLOB) {
1332                 free(buf);
1333                 return error("object %s is not a blob", sha1_to_hex(sha1));
1334         }
1335         strbuf_attach(dst, buf, size, size + 1);
1336         return 0;
1337 }
1338
1339 static int blob_unchanged(const unsigned char *o_sha,
1340                           const unsigned char *a_sha,
1341                           int renormalize, const char *path)
1342 {
1343         struct strbuf o = STRBUF_INIT;
1344         struct strbuf a = STRBUF_INIT;
1345         int ret = 0; /* assume changed for safety */
1346
1347         if (sha_eq(o_sha, a_sha))
1348                 return 1;
1349         if (!renormalize)
1350                 return 0;
1351
1352         assert(o_sha && a_sha);
1353         if (read_sha1_strbuf(o_sha, &o) || read_sha1_strbuf(a_sha, &a))
1354                 goto error_return;
1355         /*
1356          * Note: binary | is used so that both renormalizations are
1357          * performed.  Comparison can be skipped if both files are
1358          * unchanged since their sha1s have already been compared.
1359          */
1360         if (renormalize_buffer(path, o.buf, o.len, &o) |
1361             renormalize_buffer(path, a.buf, o.len, &a))
1362                 ret = (o.len == a.len && !memcmp(o.buf, a.buf, o.len));
1363
1364 error_return:
1365         strbuf_release(&o);
1366         strbuf_release(&a);
1367         return ret;
1368 }
1369
1370 static void handle_delete_modify(struct merge_options *o,
1371                                  const char *path,
1372                                  unsigned char *o_sha, int o_mode,
1373                                  unsigned char *a_sha, int a_mode,
1374                                  unsigned char *b_sha, int b_mode)
1375 {
1376         char *renamed = NULL;
1377         if (dir_in_way(path, !o->call_depth)) {
1378                 renamed = unique_path(o, path, a_sha ? o->branch1 : o->branch2);
1379         }
1380
1381         if (o->call_depth) {
1382                 /*
1383                  * We cannot arbitrarily accept either a_sha or b_sha as
1384                  * correct; since there is no true "middle point" between
1385                  * them, simply reuse the base version for virtual merge base.
1386                  */
1387                 remove_file_from_cache(path);
1388                 update_file(o, 0, o_sha, o_mode, renamed ? renamed : path);
1389         } else if (!a_sha) {
1390                 output(o, 1, "CONFLICT (delete/modify): %s deleted in %s "
1391                        "and modified in %s. Version %s of %s left in tree%s%s.",
1392                        path, o->branch1,
1393                        o->branch2, o->branch2, path,
1394                        NULL == renamed ? "" : " at ",
1395                        NULL == renamed ? "" : renamed);
1396                 update_file(o, 0, b_sha, b_mode, renamed ? renamed : path);
1397         } else {
1398                 output(o, 1, "CONFLICT (delete/modify): %s deleted in %s "
1399                        "and modified in %s. Version %s of %s left in tree%s%s.",
1400                        path, o->branch2,
1401                        o->branch1, o->branch1, path,
1402                        NULL == renamed ? "" : " at ",
1403                        NULL == renamed ? "" : renamed);
1404                 update_file(o, 0, a_sha, a_mode, renamed ? renamed : path);
1405         }
1406         free(renamed);
1407
1408 }
1409
1410 static int merge_content(struct merge_options *o,
1411                          const char *path,
1412                          unsigned char *o_sha, int o_mode,
1413                          unsigned char *a_sha, int a_mode,
1414                          unsigned char *b_sha, int b_mode,
1415                          struct rename_conflict_info *rename_conflict_info)
1416 {
1417         const char *reason = "content";
1418         char *side1 = NULL, *side2 = NULL;
1419         const char *path1 = NULL, *path2 = NULL;
1420         struct merge_file_info mfi;
1421         struct diff_filespec one, a, b;
1422         unsigned df_conflict_remains = 0;
1423
1424         if (!o_sha) {
1425                 reason = "add/add";
1426                 o_sha = (unsigned char *)null_sha1;
1427         }
1428         one.path = a.path = b.path = (char *)path;
1429         hashcpy(one.sha1, o_sha);
1430         one.mode = o_mode;
1431         hashcpy(a.sha1, a_sha);
1432         a.mode = a_mode;
1433         hashcpy(b.sha1, b_sha);
1434         b.mode = b_mode;
1435
1436         if (rename_conflict_info) {
1437                 struct diff_filepair *pair1 = rename_conflict_info->pair1;
1438
1439                 path1 = (o->branch1 == rename_conflict_info->branch1) ?
1440                         pair1->two->path : pair1->one->path;
1441                 /* If rename_conflict_info->pair2 != NULL, we are in
1442                  * RENAME_ONE_FILE_TO_ONE case.  Otherwise, we have a
1443                  * normal rename.
1444                  */
1445                 path2 = (rename_conflict_info->pair2 ||
1446                          o->branch2 == rename_conflict_info->branch1) ?
1447                         pair1->two->path : pair1->one->path;
1448                 side1 = xmalloc(strlen(o->branch1) + strlen(path1) + 2);
1449                 side2 = xmalloc(strlen(o->branch2) + strlen(path2) + 2);
1450                 sprintf(side1, "%s:%s", o->branch1, path1);
1451                 sprintf(side2, "%s:%s", o->branch2, path2);
1452
1453                 if (dir_in_way(path, !o->call_depth))
1454                         df_conflict_remains = 1;
1455         }
1456         mfi = merge_file_1(o, &one, &a, &b,
1457                            side1 ? side1 : o->branch1, side2 ? side2 : o->branch2);
1458         free(side1);
1459         free(side2);
1460
1461         if (mfi.clean && !df_conflict_remains &&
1462             sha_eq(mfi.sha, a_sha) && mfi.mode == a_mode) {
1463                 int path_renamed_outside_HEAD;
1464                 output(o, 3, "Skipped %s (merged same as existing)", path);
1465                 /*
1466                  * The content merge resulted in the same file contents we
1467                  * already had.  We can return early if those file contents
1468                  * are recorded at the correct path (which may not be true
1469                  * if the merge involves a rename).
1470                  */
1471                 path_renamed_outside_HEAD = !path2 || !strcmp(path, path2);
1472                 if (!path_renamed_outside_HEAD) {
1473                         add_cacheinfo(mfi.mode, mfi.sha, path,
1474                                       0 /*stage*/, 1 /*refresh*/, 0 /*options*/);
1475                         return mfi.clean;
1476                 }
1477         } else
1478                 output(o, 2, "Auto-merging %s", path);
1479
1480         if (!mfi.clean) {
1481                 if (S_ISGITLINK(mfi.mode))
1482                         reason = "submodule";
1483                 output(o, 1, "CONFLICT (%s): Merge conflict in %s",
1484                                 reason, path);
1485                 if (rename_conflict_info && !df_conflict_remains)
1486                         update_stages(path, &one, &a, &b);
1487         }
1488
1489         if (df_conflict_remains) {
1490                 char *new_path;
1491                 if (o->call_depth) {
1492                         remove_file_from_cache(path);
1493                 } else {
1494                         if (!mfi.clean)
1495                                 update_stages(path, &one, &a, &b);
1496                         else {
1497                                 int file_from_stage2 = was_tracked(path);
1498                                 struct diff_filespec merged;
1499                                 hashcpy(merged.sha1, mfi.sha);
1500                                 merged.mode = mfi.mode;
1501
1502                                 update_stages(path, NULL,
1503                                               file_from_stage2 ? &merged : NULL,
1504                                               file_from_stage2 ? NULL : &merged);
1505                         }
1506
1507                 }
1508                 new_path = unique_path(o, path, rename_conflict_info->branch1);
1509                 output(o, 1, "Adding as %s instead", new_path);
1510                 update_file(o, 0, mfi.sha, mfi.mode, new_path);
1511                 free(new_path);
1512                 mfi.clean = 0;
1513         } else {
1514                 update_file(o, mfi.clean, mfi.sha, mfi.mode, path);
1515         }
1516         return mfi.clean;
1517
1518 }
1519
1520 /* Per entry merge function */
1521 static int process_entry(struct merge_options *o,
1522                          const char *path, struct stage_data *entry)
1523 {
1524         /*
1525         printf("processing entry, clean cache: %s\n", index_only ? "yes": "no");
1526         print_index_entry("\tpath: ", entry);
1527         */
1528         int clean_merge = 1;
1529         int normalize = o->renormalize;
1530         unsigned o_mode = entry->stages[1].mode;
1531         unsigned a_mode = entry->stages[2].mode;
1532         unsigned b_mode = entry->stages[3].mode;
1533         unsigned char *o_sha = stage_sha(entry->stages[1].sha, o_mode);
1534         unsigned char *a_sha = stage_sha(entry->stages[2].sha, a_mode);
1535         unsigned char *b_sha = stage_sha(entry->stages[3].sha, b_mode);
1536
1537         entry->processed = 1;
1538         if (entry->rename_conflict_info) {
1539                 struct rename_conflict_info *conflict_info = entry->rename_conflict_info;
1540                 switch (conflict_info->rename_type) {
1541                 case RENAME_NORMAL:
1542                 case RENAME_ONE_FILE_TO_ONE:
1543                         clean_merge = merge_content(o, path,
1544                                                     o_sha, o_mode, a_sha, a_mode, b_sha, b_mode,
1545                                                     conflict_info);
1546                         break;
1547                 case RENAME_DELETE:
1548                         clean_merge = 0;
1549                         conflict_rename_delete(o, conflict_info->pair1,
1550                                                conflict_info->branch1,
1551                                                conflict_info->branch2);
1552                         break;
1553                 case RENAME_ONE_FILE_TO_TWO:
1554                         clean_merge = 0;
1555                         conflict_rename_rename_1to2(o, conflict_info);
1556                         break;
1557                 case RENAME_TWO_FILES_TO_ONE:
1558                         clean_merge = 0;
1559                         conflict_rename_rename_2to1(o, conflict_info);
1560                         break;
1561                 default:
1562                         entry->processed = 0;
1563                         break;
1564                 }
1565         } else if (o_sha && (!a_sha || !b_sha)) {
1566                 /* Case A: Deleted in one */
1567                 if ((!a_sha && !b_sha) ||
1568                     (!b_sha && blob_unchanged(o_sha, a_sha, normalize, path)) ||
1569                     (!a_sha && blob_unchanged(o_sha, b_sha, normalize, path))) {
1570                         /* Deleted in both or deleted in one and
1571                          * unchanged in the other */
1572                         if (a_sha)
1573                                 output(o, 2, "Removing %s", path);
1574                         /* do not touch working file if it did not exist */
1575                         remove_file(o, 1, path, !a_sha);
1576                 } else {
1577                         /* Modify/delete; deleted side may have put a directory in the way */
1578                         clean_merge = 0;
1579                         handle_delete_modify(o, path, o_sha, o_mode,
1580                                              a_sha, a_mode, b_sha, b_mode);
1581                 }
1582         } else if ((!o_sha && a_sha && !b_sha) ||
1583                    (!o_sha && !a_sha && b_sha)) {
1584                 /* Case B: Added in one. */
1585                 /* [nothing|directory] -> ([nothing|directory], file) */
1586
1587                 const char *add_branch;
1588                 const char *other_branch;
1589                 unsigned mode;
1590                 const unsigned char *sha;
1591                 const char *conf;
1592
1593                 if (a_sha) {
1594                         add_branch = o->branch1;
1595                         other_branch = o->branch2;
1596                         mode = a_mode;
1597                         sha = a_sha;
1598                         conf = "file/directory";
1599                 } else {
1600                         add_branch = o->branch2;
1601                         other_branch = o->branch1;
1602                         mode = b_mode;
1603                         sha = b_sha;
1604                         conf = "directory/file";
1605                 }
1606                 if (dir_in_way(path, !o->call_depth)) {
1607                         char *new_path = unique_path(o, path, add_branch);
1608                         clean_merge = 0;
1609                         output(o, 1, "CONFLICT (%s): There is a directory with name %s in %s. "
1610                                "Adding %s as %s",
1611                                conf, path, other_branch, path, new_path);
1612                         if (o->call_depth)
1613                                 remove_file_from_cache(path);
1614                         update_file(o, 0, sha, mode, new_path);
1615                         if (o->call_depth)
1616                                 remove_file_from_cache(path);
1617                         free(new_path);
1618                 } else {
1619                         output(o, 2, "Adding %s", path);
1620                         update_file(o, 1, sha, mode, path);
1621                 }
1622         } else if (a_sha && b_sha) {
1623                 /* Case C: Added in both (check for same permissions) and */
1624                 /* case D: Modified in both, but differently. */
1625                 clean_merge = merge_content(o, path,
1626                                             o_sha, o_mode, a_sha, a_mode, b_sha, b_mode,
1627                                             NULL);
1628         } else if (!o_sha && !a_sha && !b_sha) {
1629                 /*
1630                  * this entry was deleted altogether. a_mode == 0 means
1631                  * we had that path and want to actively remove it.
1632                  */
1633                 remove_file(o, 1, path, !a_mode);
1634         } else
1635                 die("Fatal merge failure, shouldn't happen.");
1636
1637         return clean_merge;
1638 }
1639
1640 int merge_trees(struct merge_options *o,
1641                 struct tree *head,
1642                 struct tree *merge,
1643                 struct tree *common,
1644                 struct tree **result)
1645 {
1646         int code, clean;
1647
1648         if (o->subtree_shift) {
1649                 merge = shift_tree_object(head, merge, o->subtree_shift);
1650                 common = shift_tree_object(head, common, o->subtree_shift);
1651         }
1652
1653         if (sha_eq(common->object.sha1, merge->object.sha1)) {
1654                 output(o, 0, "Already up-to-date!");
1655                 *result = head;
1656                 return 1;
1657         }
1658
1659         code = git_merge_trees(o->call_depth, common, head, merge);
1660
1661         if (code != 0) {
1662                 if (show(o, 4) || o->call_depth)
1663                         die("merging of trees %s and %s failed",
1664                             sha1_to_hex(head->object.sha1),
1665                             sha1_to_hex(merge->object.sha1));
1666                 else
1667                         exit(128);
1668         }
1669
1670         if (unmerged_cache()) {
1671                 struct string_list *entries, *re_head, *re_merge;
1672                 int i;
1673                 string_list_clear(&o->current_file_set, 1);
1674                 string_list_clear(&o->current_directory_set, 1);
1675                 get_files_dirs(o, head);
1676                 get_files_dirs(o, merge);
1677
1678                 entries = get_unmerged();
1679                 record_df_conflict_files(o, entries);
1680                 re_head  = get_renames(o, head, common, head, merge, entries);
1681                 re_merge = get_renames(o, merge, common, head, merge, entries);
1682                 clean = process_renames(o, re_head, re_merge);
1683                 for (i = entries->nr-1; 0 <= i; i--) {
1684                         const char *path = entries->items[i].string;
1685                         struct stage_data *e = entries->items[i].util;
1686                         if (!e->processed
1687                                 && !process_entry(o, path, e))
1688                                 clean = 0;
1689                 }
1690                 for (i = 0; i < entries->nr; i++) {
1691                         struct stage_data *e = entries->items[i].util;
1692                         if (!e->processed)
1693                                 die("Unprocessed path??? %s",
1694                                     entries->items[i].string);
1695                 }
1696
1697                 string_list_clear(re_merge, 0);
1698                 string_list_clear(re_head, 0);
1699                 string_list_clear(entries, 1);
1700
1701         }
1702         else
1703                 clean = 1;
1704
1705         if (o->call_depth)
1706                 *result = write_tree_from_memory(o);
1707
1708         return clean;
1709 }
1710
1711 static struct commit_list *reverse_commit_list(struct commit_list *list)
1712 {
1713         struct commit_list *next = NULL, *current, *backup;
1714         for (current = list; current; current = backup) {
1715                 backup = current->next;
1716                 current->next = next;
1717                 next = current;
1718         }
1719         return next;
1720 }
1721
1722 /*
1723  * Merge the commits h1 and h2, return the resulting virtual
1724  * commit object and a flag indicating the cleanness of the merge.
1725  */
1726 int merge_recursive(struct merge_options *o,
1727                     struct commit *h1,
1728                     struct commit *h2,
1729                     struct commit_list *ca,
1730                     struct commit **result)
1731 {
1732         struct commit_list *iter;
1733         struct commit *merged_common_ancestors;
1734         struct tree *mrtree = mrtree;
1735         int clean;
1736
1737         if (show(o, 4)) {
1738                 output(o, 4, "Merging:");
1739                 output_commit_title(o, h1);
1740                 output_commit_title(o, h2);
1741         }
1742
1743         if (!ca) {
1744                 ca = get_merge_bases(h1, h2, 1);
1745                 ca = reverse_commit_list(ca);
1746         }
1747
1748         if (show(o, 5)) {
1749                 output(o, 5, "found %u common ancestor(s):", commit_list_count(ca));
1750                 for (iter = ca; iter; iter = iter->next)
1751                         output_commit_title(o, iter->item);
1752         }
1753
1754         merged_common_ancestors = pop_commit(&ca);
1755         if (merged_common_ancestors == NULL) {
1756                 /* if there is no common ancestor, make an empty tree */
1757                 struct tree *tree = xcalloc(1, sizeof(struct tree));
1758
1759                 tree->object.parsed = 1;
1760                 tree->object.type = OBJ_TREE;
1761                 pretend_sha1_file(NULL, 0, OBJ_TREE, tree->object.sha1);
1762                 merged_common_ancestors = make_virtual_commit(tree, "ancestor");
1763         }
1764
1765         for (iter = ca; iter; iter = iter->next) {
1766                 const char *saved_b1, *saved_b2;
1767                 o->call_depth++;
1768                 /*
1769                  * When the merge fails, the result contains files
1770                  * with conflict markers. The cleanness flag is
1771                  * ignored, it was never actually used, as result of
1772                  * merge_trees has always overwritten it: the committed
1773                  * "conflicts" were already resolved.
1774                  */
1775                 discard_cache();
1776                 saved_b1 = o->branch1;
1777                 saved_b2 = o->branch2;
1778                 o->branch1 = "Temporary merge branch 1";
1779                 o->branch2 = "Temporary merge branch 2";
1780                 merge_recursive(o, merged_common_ancestors, iter->item,
1781                                 NULL, &merged_common_ancestors);
1782                 o->branch1 = saved_b1;
1783                 o->branch2 = saved_b2;
1784                 o->call_depth--;
1785
1786                 if (!merged_common_ancestors)
1787                         die("merge returned no commit");
1788         }
1789
1790         discard_cache();
1791         if (!o->call_depth)
1792                 read_cache();
1793
1794         o->ancestor = "merged common ancestors";
1795         clean = merge_trees(o, h1->tree, h2->tree, merged_common_ancestors->tree,
1796                             &mrtree);
1797
1798         if (o->call_depth) {
1799                 *result = make_virtual_commit(mrtree, "merged tree");
1800                 commit_list_insert(h1, &(*result)->parents);
1801                 commit_list_insert(h2, &(*result)->parents->next);
1802         }
1803         flush_output(o);
1804         if (show(o, 2))
1805                 diff_warn_rename_limit("merge.renamelimit",
1806                                        o->needed_rename_limit, 0);
1807         return clean;
1808 }
1809
1810 static struct commit *get_ref(const unsigned char *sha1, const char *name)
1811 {
1812         struct object *object;
1813
1814         object = deref_tag(parse_object(sha1), name, strlen(name));
1815         if (!object)
1816                 return NULL;
1817         if (object->type == OBJ_TREE)
1818                 return make_virtual_commit((struct tree*)object, name);
1819         if (object->type != OBJ_COMMIT)
1820                 return NULL;
1821         if (parse_commit((struct commit *)object))
1822                 return NULL;
1823         return (struct commit *)object;
1824 }
1825
1826 int merge_recursive_generic(struct merge_options *o,
1827                             const unsigned char *head,
1828                             const unsigned char *merge,
1829                             int num_base_list,
1830                             const unsigned char **base_list,
1831                             struct commit **result)
1832 {
1833         int clean, index_fd;
1834         struct lock_file *lock = xcalloc(1, sizeof(struct lock_file));
1835         struct commit *head_commit = get_ref(head, o->branch1);
1836         struct commit *next_commit = get_ref(merge, o->branch2);
1837         struct commit_list *ca = NULL;
1838
1839         if (base_list) {
1840                 int i;
1841                 for (i = 0; i < num_base_list; ++i) {
1842                         struct commit *base;
1843                         if (!(base = get_ref(base_list[i], sha1_to_hex(base_list[i]))))
1844                                 return error("Could not parse object '%s'",
1845                                         sha1_to_hex(base_list[i]));
1846                         commit_list_insert(base, &ca);
1847                 }
1848         }
1849
1850         index_fd = hold_locked_index(lock, 1);
1851         clean = merge_recursive(o, head_commit, next_commit, ca,
1852                         result);
1853         if (active_cache_changed &&
1854                         (write_cache(index_fd, active_cache, active_nr) ||
1855                          commit_locked_index(lock)))
1856                 return error("Unable to write index.");
1857
1858         return clean ? 0 : 1;
1859 }
1860
1861 static int merge_recursive_config(const char *var, const char *value, void *cb)
1862 {
1863         struct merge_options *o = cb;
1864         if (!strcmp(var, "merge.verbosity")) {
1865                 o->verbosity = git_config_int(var, value);
1866                 return 0;
1867         }
1868         if (!strcmp(var, "diff.renamelimit")) {
1869                 o->diff_rename_limit = git_config_int(var, value);
1870                 return 0;
1871         }
1872         if (!strcmp(var, "merge.renamelimit")) {
1873                 o->merge_rename_limit = git_config_int(var, value);
1874                 return 0;
1875         }
1876         return git_xmerge_config(var, value, cb);
1877 }
1878
1879 void init_merge_options(struct merge_options *o)
1880 {
1881         memset(o, 0, sizeof(struct merge_options));
1882         o->verbosity = 2;
1883         o->buffer_output = 1;
1884         o->diff_rename_limit = -1;
1885         o->merge_rename_limit = -1;
1886         o->renormalize = 0;
1887         git_config(merge_recursive_config, o);
1888         if (getenv("GIT_MERGE_VERBOSITY"))
1889                 o->verbosity =
1890                         strtol(getenv("GIT_MERGE_VERBOSITY"), NULL, 10);
1891         if (o->verbosity >= 5)
1892                 o->buffer_output = 0;
1893         strbuf_init(&o->obuf, 0);
1894         memset(&o->current_file_set, 0, sizeof(struct string_list));
1895         o->current_file_set.strdup_strings = 1;
1896         memset(&o->current_directory_set, 0, sizeof(struct string_list));
1897         o->current_directory_set.strdup_strings = 1;
1898         memset(&o->df_conflict_file_set, 0, sizeof(struct string_list));
1899         o->df_conflict_file_set.strdup_strings = 1;
1900 }
1901
1902 int parse_merge_opt(struct merge_options *o, const char *s)
1903 {
1904         if (!s || !*s)
1905                 return -1;
1906         if (!strcmp(s, "ours"))
1907                 o->recursive_variant = MERGE_RECURSIVE_OURS;
1908         else if (!strcmp(s, "theirs"))
1909                 o->recursive_variant = MERGE_RECURSIVE_THEIRS;
1910         else if (!strcmp(s, "subtree"))
1911                 o->subtree_shift = "";
1912         else if (!prefixcmp(s, "subtree="))
1913                 o->subtree_shift = s + strlen("subtree=");
1914         else if (!strcmp(s, "patience"))
1915                 o->xdl_opts |= XDF_PATIENCE_DIFF;
1916         else if (!strcmp(s, "ignore-space-change"))
1917                 o->xdl_opts |= XDF_IGNORE_WHITESPACE_CHANGE;
1918         else if (!strcmp(s, "ignore-all-space"))
1919                 o->xdl_opts |= XDF_IGNORE_WHITESPACE;
1920         else if (!strcmp(s, "ignore-space-at-eol"))
1921                 o->xdl_opts |= XDF_IGNORE_WHITESPACE_AT_EOL;
1922         else if (!strcmp(s, "renormalize"))
1923                 o->renormalize = 1;
1924         else if (!strcmp(s, "no-renormalize"))
1925                 o->renormalize = 0;
1926         else if (!prefixcmp(s, "rename-threshold=")) {
1927                 const char *score = s + strlen("rename-threshold=");
1928                 if ((o->rename_score = parse_rename_score(&score)) == -1 || *score != 0)
1929                         return -1;
1930         }
1931         else
1932                 return -1;
1933         return 0;
1934 }