read-tree.c - git - Git at Google

 /*
  * GIT - The information manager from hell
  *
  * Copyright (C) Linus Torvalds, 2005
  */
 #include "cache.h"

 static int stage = 0;
 static int update = 0;

 static int unpack_tree(unsigned char *sha1)
 {
 	void *buffer;
 	unsigned long size;
 	int ret;

 	buffer = read_object_with_reference(sha1, "tree", &size, NULL);
 	if (!buffer)
 		return -1;
 	ret = read_tree(buffer, size, stage, NULL);
 	free(buffer);
 	return ret;
 }

 static int path_matches(struct cache_entry *a, struct cache_entry *b)
 {
 	int len = ce_namelen(a);
 	return ce_namelen(b) == len &&
 		!memcmp(a->name, b->name, len);
 }

 static int same(struct cache_entry *a, struct cache_entry *b)
 {
 	return a->ce_mode == b->ce_mode &&
 		!memcmp(a->sha1, b->sha1, 20);
 }


 /*
  * This removes all trivial merges that don't change the tree
  * and collapses them to state 0.
  */
 static struct cache_entry *merge_entries(struct cache_entry *a,
 					 struct cache_entry *b,
 					 struct cache_entry *c)
 {
 	/*
 	 * Ok, all three entries describe the same
 	 * filename, but maybe the contents or file
 	 * mode have changed?
 	 *
 	 * The trivial cases end up being the ones where two
 	 * out of three files are the same:
 	 *  - both destinations the same, trivially take either
 	 *  - one of the destination versions hasn't changed,
 	 *    take the other.
 	 *
 	 * The "all entries exactly the same" case falls out as
 	 * a special case of any of the "two same" cases.
 	 *
 	 * Here "a" is "original", and "b" and "c" are the two
 	 * trees we are merging.
 	 */
 	if (a && b && c) {
 		if (same(b,c))
 			return c;
 		if (same(a,b))
 			return c;
 		if (same(a,c))
 			return b;
 	}
 	return NULL;
 }

 /*
  * When a CE gets turned into an unmerged entry, we
  * want it to be up-to-date
  */
 static void verify_uptodate(struct cache_entry *ce)
 {
 	struct stat st;

 	if (!lstat(ce->name, &st)) {
 		unsigned changed = ce_match_stat(ce, &st);
 		if (!changed)
 			return;
 		errno = 0;
 	}
 	if (errno == ENOENT)
 		return;
 	die("Entry '%s' not uptodate. Cannot merge.", ce->name);
 }

 /*
  * If the old tree contained a CE that isn't even in the
  * result, that's always a problem, regardless of whether
  * it's up-to-date or not (ie it can be a file that we
  * have updated but not committed yet).
  */
 static void reject_merge(struct cache_entry *ce)
 {
 	die("Entry '%s' would be overwritten by merge. Cannot merge.", ce->name);
 }

 static int merged_entry_internal(struct cache_entry *merge, struct cache_entry *old, struct cache_entry **dst, int allow_dirty)
 {
 	merge->ce_flags |= htons(CE_UPDATE);
 	if (old) {
 		/*
 		 * See if we can re-use the old CE directly?
 		 * That way we get the uptodate stat info.
 		 *
 		 * This also removes the UPDATE flag on
 		 * a match.
 		 */
 		if (same(old, merge)) {
 			*merge = *old;
 		} else if (!allow_dirty) {
 			verify_uptodate(old);
 		}
 	}
 	merge->ce_flags &= ~htons(CE_STAGEMASK);
 	*dst++ = merge;
 	return 1;
 }

 static int merged_entry_allow_dirty(struct cache_entry *merge, struct cache_entry *old, struct cache_entry **dst)
 {
 	return merged_entry_internal(merge, old, dst, 1);
 }

 static int merged_entry(struct cache_entry *merge, struct cache_entry *old, struct cache_entry **dst)
 {
 	return merged_entry_internal(merge, old, dst, 0);
 }

 static int deleted_entry(struct cache_entry *ce, struct cache_entry *old, struct cache_entry **dst)
 {
 	if (old)
 		verify_uptodate(old);
 	ce->ce_mode = 0;
 	*dst++ = ce;
 	return 1;
 }

 static int causes_df_conflict(struct cache_entry *ce, int stage,
 			      struct cache_entry **dst_,
 			      struct cache_entry **next_,
 			      int tail)
 {
 	/* This is called during the merge operation and walking
 	 * the active_cache[] array is messy, because it is in the
 	 * middle of overlapping copy operation.  The invariants
 	 * are:
 	 * (1) active_cache points at the first (zeroth) entry.
 	 * (2) up to dst pointer are resolved entries.
 	 * (3) from the next pointer (head-inclusive) to the tail
 	 *     of the active_cache array have the remaining paths
 	 *     to be processed.  There can be a gap between dst
 	 *     and next.  Note that next is called "src" in the
 	 *     merge_cache() function, and tail is the original
 	 *     end of active_cache array when merge_cache() started.
 	 * (4) the path corresponding to *ce is not found in (2)
 	 *     or (3).  It is in the gap.
 	 *
 	 *  active_cache -----......+++++++++++++.
 	 *                    ^dst  ^next        ^tail
 	 */
 	int i, next, dst;
 	const char *path = ce->name;
 	int namelen = ce_namelen(ce);

 	next = next_ - active_cache;
 	dst = dst_ - active_cache;

 	for (i = 0; i < tail; i++) {
 		int entlen, len;
 		const char *one, *two;
 		if (dst <= i && i < next)
 			continue;
 		ce = active_cache[i];
 		if (ce_stage(ce) != stage)
 			continue;
 		/* If ce->name is a prefix of path, then path is a file
 		 * that hangs underneath ce->name, which is bad.
 		 * If path is a prefix of ce->name, then it is the
 		 * other way around which also is bad.
 		 */
 		entlen = ce_namelen(ce);
 		if (namelen == entlen)
 			continue;
 		if (namelen < entlen) {
 			len = namelen;
 			one = path;
 			two = ce->name;
 		} else {
 			len = entlen;
 			one = ce->name;
 			two = path;
 		}
 		if (memcmp(one, two, len))
 			continue;
 		if (two[len] == '/')
 			return 1;
 	}
 	return 0;
 }

 static int threeway_merge(struct cache_entry *stages[4],
 			  struct cache_entry **dst,
 			  struct cache_entry **next, int tail)
 {
 	struct cache_entry *old = stages[0];
 	struct cache_entry *a = stages[1], *b = stages[2], *c = stages[3];
 	struct cache_entry *merge;
 	int count;

 	/* #5ALT */
 	if (!a && b && c && same(b, c)) {
 		if (old && !same(b, old))
 			return -1;
 		return merged_entry_allow_dirty(b, old, dst);
 	}
 	/* #2ALT and #3ALT */
 	if (!a && (!!b != !!c)) {
 		/*
 		 * The reason we need to worry about directory/file
 		 * conflicts only in #2ALT and #3ALT case is this:
 		 *
 		 * (1) For all other cases that read-tree internally
 		 *     resolves a path, we always have such a path in
 		 *     *both* stage2 and stage3 when we begin.
 		 *     Traditionally, the behaviour has been even
 		 *     stricter and we did not resolve a path without
 		 *     initially being in all of stage1, 2, and 3.
 		 *
 		 * (2) When read-tree finishes, all resolved paths (i.e.
 		 *     the paths that are in stage0) must have come from
 		 *     either stage2 or stage3.  It is not possible to
 		 *     have a stage0 path as a result of a merge if
 		 *     neither stage2 nor stage3 had that path.
 		 *
 		 * (3) It is guaranteed that just after reading the
 		 *     stages, each stage cannot have directory/file
 		 *     conflicts on its own, because they are populated
 		 *     by reading hierarchy of a tree.  Combined with
 		 *     (1) and (2) above, this means that no matter what
 		 *     combination of paths we take from stage2 and
 		 *     stage3 as a result of a merge, they cannot cause
 		 *     a directory/file conflict situation (otherwise
 		 *     the "guilty" path would have already had such a
 		 *     conflict in the original stage, either stage2
 		 *     or stage3).  Although its stage2 is synthesized
 		 *     by overlaying the current index on top of "our
 		 *     head" tree, --emu23 case also has this guarantee,
 		 *     by calling add_cache_entry() to create such stage2
 		 *     entries.
 		 *
 		 * (4) Only #2ALT and #3ALT lack the guarantee (1).
 		 *     They resolve paths that exist only in stage2
 		 *     or stage3.  The stage2 tree may have a file DF
 		 *     while stage3 tree may have a file DF/DF.  If
 		 *     #2ALT and #3ALT rules happen to apply to both
 		 *     of them, we would end up having DF (coming from
 		 *     stage2) and DF/DF (from stage3) in the result.
 		 *     When we attempt to resolve a path that exists
 		 *     only in stage2, we need to make sure there is
 		 *     no path that would conflict with it in stage3
 		 *     and vice versa.
 		 */
 		if (c) { /* #2ALT */
 			if (!causes_df_conflict(c, 2, dst, next, tail) &&
 			    (!old || same(c, old)))
 				return merged_entry_allow_dirty(c, old, dst);
 		}
 		else { /* #3ALT */
 			if (!causes_df_conflict(b, 3, dst, next, tail) &&
 			    (!old || same(b, old)))
 				return merged_entry_allow_dirty(b, old, dst);
 		}
 		/* otherwise we will apply the original rule */
 	}
 	/* #14ALT */
 	if (a && b && c && same(a, b) && !same(a, c)) {
 		if (old && same(old, c))
 			return merged_entry_allow_dirty(c, old, dst);
 		/* otherwise the regular rule applies */
 	}
 	/*
 	 * If we have an entry in the index cache ("old"), then we want
 	 * to make sure that it matches any entries in stage 2 ("first
 	 * branch", aka "b").
 	 */
 	if (old) {
 		if (!b || !same(old, b))
 			return -1;
 	}
 	merge = merge_entries(a, b, c);
 	if (merge)
 		return merged_entry(merge, old, dst);
 	if (old)
 		verify_uptodate(old);
 	count = 0;
 	if (a) { *dst++ = a; count++; }
 	if (b) { *dst++ = b; count++; }
 	if (c) { *dst++ = c; count++; }
 	return count;
 }

 /*
  * Two-way merge.
  *
  * The rule is to "carry forward" what is in the index without losing
  * information across a "fast forward", favoring a successful merge
  * over a merge failure when it makes sense.  For details of the
  * "carry forward" rule, please see <Documentation/git-read-tree.txt>.
  *
  */
 static int twoway_merge(struct cache_entry **src, struct cache_entry **dst,
 			struct cache_entry **next, int tail)
 {
 	struct cache_entry *current = src[0];
 	struct cache_entry *oldtree = src[1], *newtree = src[2];

 	if (src[3])
 		return -1;

 	if (current) {
 		if ((!oldtree && !newtree) || /* 4 and 5 */
 		    (!oldtree && newtree &&
 		     same(current, newtree)) || /* 6 and 7 */
 		    (oldtree && newtree &&
 		     same(oldtree, newtree)) || /* 14 and 15 */
 		    (oldtree && newtree &&
 		     !same(oldtree, newtree) && /* 18 and 19*/
 		     same(current, newtree))) {
 			*dst++ = current;
 			return 1;
 		}
 		else if (oldtree && !newtree && same(current, oldtree)) {
 			/* 10 or 11 */
 			return deleted_entry(oldtree, current, dst);
 		}
 		else if (oldtree && newtree &&
 			 same(current, oldtree) && !same(current, newtree)) {
 			/* 20 or 21 */
 			return merged_entry(newtree, current, dst);
 		}
 		else
 			/* all other failures */
 			return -1;
 	}
 	else if (newtree)
 		return merged_entry(newtree, current, dst);
 	else
 		return deleted_entry(oldtree, current, dst);
 }

 /*
  * Two-way merge emulated with three-way merge.
  *
  * This treats "read-tree -m H M" by transforming it internally
  * into "read-tree -m H I+H M", where I+H is a tree that would
  * contain the contents of the current index file, overlayed on
  * top of H.  Unlike the traditional two-way merge, this leaves
  * the stages in the resulting index file and lets the user resolve
  * the merge conflicts using standard tools for three-way merge.
  *
  * This function is just to set-up such an arrangement, and the
  * actual merge uses threeway_merge() function.
  */
 static void setup_emu23(void)
 {
 	/* stage0 contains I, stage1 H, stage2 M.
 	 * move stage2 to stage3, and create stage2 entries
 	 * by scanning stage0 and stage1 entries.
 	 */
 	int i, namelen, size;
 	struct cache_entry *ce, *stage2;

 	for (i = 0; i < active_nr; i++) {
 		ce = active_cache[i];
 		if (ce_stage(ce) != 2)
 			continue;
 		/* hoist them up to stage 3 */
 		namelen = ce_namelen(ce);
 		ce->ce_flags = create_ce_flags(namelen, 3);
 	}

 	for (i = 0; i < active_nr; i++) {
 		ce = active_cache[i];
 		if (ce_stage(ce) > 1)
 			continue;
 		namelen = ce_namelen(ce);
 		size = cache_entry_size(namelen);
 		stage2 = xmalloc(size);
 		memcpy(stage2, ce, size);
 		stage2->ce_flags = create_ce_flags(namelen, 2);
 		if (add_cache_entry(stage2, ADD_CACHE_OK_TO_ADD) < 0)
 			die("cannot merge index and our head tree");

 		/* We are done with this name, so skip to next name */
 		while (i < active_nr &&
 		       ce_namelen(active_cache[i]) == namelen &&
 		       !memcmp(active_cache[i]->name, ce->name, namelen))
 			i++;
 		i--; /* compensate for the loop control */
 	}
 }

 /*
  * One-way merge.
  *
  * The rule is:
  * - take the stat information from stage0, take the data from stage1
  */
 static int oneway_merge(struct cache_entry **src, struct cache_entry **dst,
 			struct cache_entry **next, int tail)
 {
 	struct cache_entry *old = src[0];
 	struct cache_entry *a = src[1];

 	if (src[2] || src[3])
 		return -1;

 	if (!a)
 		return 0;
 	if (old && same(old, a)) {
 		*dst++ = old;
 		return 1;
 	}
 	return merged_entry(a, NULL, dst);
 }

 static void check_updates(struct cache_entry **src, int nr)
 {
 	static struct checkout state = {
 		.base_dir = "",
 		.force = 1,
 		.quiet = 1,
 		.refresh_cache = 1,
 	};
 	unsigned short mask = htons(CE_UPDATE);
 	while (nr--) {
 		struct cache_entry *ce = *src++;
 		if (!ce->ce_mode) {
 			if (update)
 				unlink(ce->name);
 			continue;
 		}
 		if (ce->ce_flags & mask) {
 			ce->ce_flags &= ~mask;
 			if (update)
 				checkout_entry(ce, &state);
 		}
 	}
 }

 typedef int (*merge_fn_t)(struct cache_entry **, struct cache_entry **, struct cache_entry **, int);

 static void merge_cache(struct cache_entry **src, int nr, merge_fn_t fn)
 {
 	struct cache_entry **dst = src;
 	int tail = nr;

 	while (nr) {
 		int entries;
 		struct cache_entry *name, *ce, *stages[4] = { NULL, };

 		name = ce = *src;
 		for (;;) {
 			int stage = ce_stage(ce);
 			stages[stage] = ce;
 			ce = *++src;
 			active_nr--;
 			if (!--nr)
 				break;
 			if (!path_matches(ce, name))
 				break;
 		}

 		entries = fn(stages, dst, src, tail);
 		if (entries < 0)
 			reject_merge(name);
 		dst += entries;
 		active_nr += entries;
 	}
 	check_updates(active_cache, active_nr);
 }

 static int read_cache_unmerged(void)
 {
 	int i, deleted;
 	struct cache_entry **dst;

 	read_cache();
 	dst = active_cache;
 	deleted = 0;
 	for (i = 0; i < active_nr; i++) {
 		struct cache_entry *ce = active_cache[i];
 		if (ce_stage(ce)) {
 			deleted++;
 			continue;
 		}
 		if (deleted)
 			*dst = ce;
 		dst++;
 	}
 	active_nr -= deleted;
 	return deleted;
 }

 static const char read_tree_usage[] = "git-read-tree (<sha> | -m [-u] <sha1> [<sha2> [<sha3>]])";

 static struct cache_file cache_file;

 int main(int argc, char **argv)
 {
 	int i, newfd, merge, reset, emu23;
 	unsigned char sha1[20];

 	newfd = hold_index_file_for_update(&cache_file, get_index_file());
 	if (newfd < 0)
 		die("unable to create new cachefile");

 	merge = 0;
 	reset = 0;
 	emu23 = 0;
 	for (i = 1; i < argc; i++) {
 		const char *arg = argv[i];

 		/* "-u" means "update", meaning that a merge will update the working directory */
 		if (!strcmp(arg, "-u")) {
 			update = 1;
 			continue;
 		}

 		/* This differs from "-m" in that we'll silently ignore unmerged entries */
 		if (!strcmp(arg, "--reset")) {
 			if (stage || merge || emu23)
 				usage(read_tree_usage);
 			reset = 1;
 			merge = 1;
 			stage = 1;
 			read_cache_unmerged();
 			continue;
 		}

 		/* "-m" stands for "merge", meaning we start in stage 1 */
 		if (!strcmp(arg, "-m")) {
 			if (stage || merge || emu23)
 				usage(read_tree_usage);
 			if (read_cache_unmerged())
 				die("you need to resolve your current index first");
 			stage = 1;
 			merge = 1;
 			continue;
 		}

 		/* "-emu23" uses 3-way merge logic to perform fast-forward */
 		if (!strcmp(arg, "--emu23")) {
 			if (stage || merge || emu23)
 				usage(read_tree_usage);
 			if (read_cache_unmerged())
 				die("you need to resolve your current index first");
 			merge = emu23 = stage = 1;
 			continue;
 		}

 		if (get_sha1(arg, sha1) < 0)
 			usage(read_tree_usage);
 		if (stage > 3)
 			usage(read_tree_usage);
 		if (unpack_tree(sha1) < 0)
 			die("failed to unpack tree object %s", arg);
 		stage++;
 	}
 	if (update && !merge)
 		usage(read_tree_usage);
 	if (merge) {
 		static const merge_fn_t merge_function[] = {
 			[1] = oneway_merge,
 			[2] = twoway_merge,
 			[3] = threeway_merge,
 		};
 		merge_fn_t fn;

 		if (stage < 2 || stage > 4)
 			die("just how do you expect me to merge %d trees?", stage-1);
 		if (emu23 && stage != 3)
 			die("--emu23 takes only two trees");
 		fn = merge_function[stage-1];
 		if (stage == 3 && emu23) {
 			setup_emu23();
 			fn = merge_function[3];
 		}
 		merge_cache(active_cache, active_nr, fn);
 	}
 	if (write_cache(newfd, active_cache, active_nr) ||
 	    commit_index_file(&cache_file))
 		die("unable to write new index file");
 	return 0;
 }
	/*
	* GIT - The information manager from hell
	*
	* Copyright (C) Linus Torvalds, 2005
	*/
	#include "cache.h"

	static int stage = 0;
	static int update = 0;

	static int unpack_tree(unsigned char *sha1)
	{
	void *buffer;
	unsigned long size;
	int ret;

	buffer = read_object_with_reference(sha1, "tree", &size, NULL);
	if (!buffer)
	return -1;
	ret = read_tree(buffer, size, stage, NULL);
	free(buffer);
	return ret;
	}

	static int path_matches(struct cache_entry a, struct cache_entry b)
	{
	int len = ce_namelen(a);
	return ce_namelen(b) == len &&
	!memcmp(a->name, b->name, len);
	}

	static int same(struct cache_entry a, struct cache_entry b)
	{
	return a->ce_mode == b->ce_mode &&
	!memcmp(a->sha1, b->sha1, 20);
	}


	/*
	* This removes all trivial merges that don't change the tree
	* and collapses them to state 0.
	*/
	static struct cache_entry merge_entries(struct cache_entry a,
	struct cache_entry *b,
	struct cache_entry *c)
	{
	/*
	* Ok, all three entries describe the same
	* filename, but maybe the contents or file
	* mode have changed?
	*
	* The trivial cases end up being the ones where two
	* out of three files are the same:
	* - both destinations the same, trivially take either
	* - one of the destination versions hasn't changed,
	* take the other.
	*
	* The "all entries exactly the same" case falls out as
	* a special case of any of the "two same" cases.
	*
	* Here "a" is "original", and "b" and "c" are the two
	* trees we are merging.
	*/
	if (a && b && c) {
	if (same(b,c))
	return c;
	if (same(a,b))
	return c;
	if (same(a,c))
	return b;
	}
	return NULL;
	}

	/*
	* When a CE gets turned into an unmerged entry, we
	* want it to be up-to-date
	*/
	static void verify_uptodate(struct cache_entry *ce)
	{
	struct stat st;

	if (!lstat(ce->name, &st)) {
	unsigned changed = ce_match_stat(ce, &st);
	if (!changed)
	return;
	errno = 0;
	}
	if (errno == ENOENT)
	return;
	die("Entry '%s' not uptodate. Cannot merge.", ce->name);
	}

	/*
	* If the old tree contained a CE that isn't even in the
	* result, that's always a problem, regardless of whether
	* it's up-to-date or not (ie it can be a file that we
	* have updated but not committed yet).
	*/
	static void reject_merge(struct cache_entry *ce)
	{
	die("Entry '%s' would be overwritten by merge. Cannot merge.", ce->name);
	}

	static int merged_entry_internal(struct cache_entry merge, struct cache_entry old, struct cache_entry **dst, int allow_dirty)
	{
	merge->ce_flags \|= htons(CE_UPDATE);
	if (old) {
	/*
	* See if we can re-use the old CE directly?
	* That way we get the uptodate stat info.
	*
	* This also removes the UPDATE flag on
	* a match.
	*/
	if (same(old, merge)) {
	merge = old;
	} else if (!allow_dirty) {
	verify_uptodate(old);
	}
	}
	merge->ce_flags &= ~htons(CE_STAGEMASK);
	*dst++ = merge;
	return 1;
	}

	static int merged_entry_allow_dirty(struct cache_entry merge, struct cache_entry old, struct cache_entry **dst)
	{
	return merged_entry_internal(merge, old, dst, 1);
	}

	static int merged_entry(struct cache_entry merge, struct cache_entry old, struct cache_entry **dst)
	{
	return merged_entry_internal(merge, old, dst, 0);
	}

	static int deleted_entry(struct cache_entry ce, struct cache_entry old, struct cache_entry **dst)
	{
	if (old)
	verify_uptodate(old);
	ce->ce_mode = 0;
	*dst++ = ce;
	return 1;
	}

	static int causes_df_conflict(struct cache_entry *ce, int stage,
	struct cache_entry **dst_,
	struct cache_entry **next_,
	int tail)
	{
	/* This is called during the merge operation and walking
	* the active_cache[] array is messy, because it is in the
	* middle of overlapping copy operation. The invariants
	* are:
	* (1) active_cache points at the first (zeroth) entry.
	* (2) up to dst pointer are resolved entries.
	* (3) from the next pointer (head-inclusive) to the tail
	* of the active_cache array have the remaining paths
	* to be processed. There can be a gap between dst
	* and next. Note that next is called "src" in the
	* merge_cache() function, and tail is the original
	* end of active_cache array when merge_cache() started.
	* (4) the path corresponding to *ce is not found in (2)
	* or (3). It is in the gap.
	*
	* active_cache -----......+++++++++++++.
	* ^dst ^next ^tail
	*/
	int i, next, dst;
	const char *path = ce->name;
	int namelen = ce_namelen(ce);

	next = next_ - active_cache;
	dst = dst_ - active_cache;

	for (i = 0; i < tail; i++) {
	int entlen, len;
	const char one, two;
	if (dst <= i && i < next)
	continue;
	ce = active_cache[i];
	if (ce_stage(ce) != stage)
	continue;
	/* If ce->name is a prefix of path, then path is a file
	* that hangs underneath ce->name, which is bad.
	* If path is a prefix of ce->name, then it is the
	* other way around which also is bad.
	*/
	entlen = ce_namelen(ce);
	if (namelen == entlen)
	continue;
	if (namelen < entlen) {
	len = namelen;
	one = path;
	two = ce->name;
	} else {
	len = entlen;
	one = ce->name;
	two = path;
	}
	if (memcmp(one, two, len))
	continue;
	if (two[len] == '/')
	return 1;
	}
	return 0;
	}

	static int threeway_merge(struct cache_entry *stages[4],
	struct cache_entry **dst,
	struct cache_entry **next, int tail)
	{
	struct cache_entry *old = stages[0];
	struct cache_entry a = stages[1], b = stages[2], *c = stages[3];
	struct cache_entry *merge;
	int count;

	/* #5ALT */
	if (!a && b && c && same(b, c)) {
	if (old && !same(b, old))
	return -1;
	return merged_entry_allow_dirty(b, old, dst);
	}
	/* #2ALT and #3ALT */
	if (!a && (!!b != !!c)) {
	/*
	* The reason we need to worry about directory/file
	* conflicts only in #2ALT and #3ALT case is this:
	*
	* (1) For all other cases that read-tree internally
	* resolves a path, we always have such a path in
	* both stage2 and stage3 when we begin.
	* Traditionally, the behaviour has been even
	* stricter and we did not resolve a path without
	* initially being in all of stage1, 2, and 3.
	*
	* (2) When read-tree finishes, all resolved paths (i.e.
	* the paths that are in stage0) must have come from
	* either stage2 or stage3. It is not possible to
	* have a stage0 path as a result of a merge if
	* neither stage2 nor stage3 had that path.
	*
	* (3) It is guaranteed that just after reading the
	* stages, each stage cannot have directory/file
	* conflicts on its own, because they are populated
	* by reading hierarchy of a tree. Combined with
	* (1) and (2) above, this means that no matter what
	* combination of paths we take from stage2 and
	* stage3 as a result of a merge, they cannot cause
	* a directory/file conflict situation (otherwise
	* the "guilty" path would have already had such a
	* conflict in the original stage, either stage2
	* or stage3). Although its stage2 is synthesized
	* by overlaying the current index on top of "our
	* head" tree, --emu23 case also has this guarantee,
	* by calling add_cache_entry() to create such stage2
	* entries.
	*
	* (4) Only #2ALT and #3ALT lack the guarantee (1).
	* They resolve paths that exist only in stage2
	* or stage3. The stage2 tree may have a file DF
	* while stage3 tree may have a file DF/DF. If
	* #2ALT and #3ALT rules happen to apply to both
	* of them, we would end up having DF (coming from
	* stage2) and DF/DF (from stage3) in the result.
	* When we attempt to resolve a path that exists
	* only in stage2, we need to make sure there is
	* no path that would conflict with it in stage3
	* and vice versa.
	*/
	if (c) { /* #2ALT */
	if (!causes_df_conflict(c, 2, dst, next, tail) &&
	(!old \|\| same(c, old)))
	return merged_entry_allow_dirty(c, old, dst);
	}
	else { /* #3ALT */
	if (!causes_df_conflict(b, 3, dst, next, tail) &&
	(!old \|\| same(b, old)))
	return merged_entry_allow_dirty(b, old, dst);
	}
	/* otherwise we will apply the original rule */
	}
	/* #14ALT */
	if (a && b && c && same(a, b) && !same(a, c)) {
	if (old && same(old, c))
	return merged_entry_allow_dirty(c, old, dst);
	/* otherwise the regular rule applies */
	}
	/*
	* If we have an entry in the index cache ("old"), then we want
	* to make sure that it matches any entries in stage 2 ("first
	* branch", aka "b").
	*/
	if (old) {
	if (!b \|\| !same(old, b))
	return -1;
	}
	merge = merge_entries(a, b, c);
	if (merge)
	return merged_entry(merge, old, dst);
	if (old)
	verify_uptodate(old);
	count = 0;
	if (a) { *dst++ = a; count++; }
	if (b) { *dst++ = b; count++; }
	if (c) { *dst++ = c; count++; }
	return count;
	}

	/*
	* Two-way merge.
	*
	* The rule is to "carry forward" what is in the index without losing
	* information across a "fast forward", favoring a successful merge
	* over a merge failure when it makes sense. For details of the
	* "carry forward" rule, please see <Documentation/git-read-tree.txt>.
	*
	*/
	static int twoway_merge(struct cache_entry src, struct cache_entry dst,
	struct cache_entry **next, int tail)
	{
	struct cache_entry *current = src[0];
	struct cache_entry oldtree = src[1], newtree = src[2];

	if (src[3])
	return -1;

	if (current) {
	if ((!oldtree && !newtree) \|\| /* 4 and 5 */
	(!oldtree && newtree &&
	same(current, newtree)) \|\| /* 6 and 7 */
	(oldtree && newtree &&
	same(oldtree, newtree)) \|\| /* 14 and 15 */
	(oldtree && newtree &&
	!same(oldtree, newtree) && /* 18 and 19*/
	same(current, newtree))) {
	*dst++ = current;
	return 1;
	}
	else if (oldtree && !newtree && same(current, oldtree)) {
	/* 10 or 11 */
	return deleted_entry(oldtree, current, dst);
	}
	else if (oldtree && newtree &&
	same(current, oldtree) && !same(current, newtree)) {
	/* 20 or 21 */
	return merged_entry(newtree, current, dst);
	}
	else
	/* all other failures */
	return -1;
	}
	else if (newtree)
	return merged_entry(newtree, current, dst);
	else
	return deleted_entry(oldtree, current, dst);
	}

	/*
	* Two-way merge emulated with three-way merge.
	*
	* This treats "read-tree -m H M" by transforming it internally
	* into "read-tree -m H I+H M", where I+H is a tree that would
	* contain the contents of the current index file, overlayed on
	* top of H. Unlike the traditional two-way merge, this leaves
	* the stages in the resulting index file and lets the user resolve
	* the merge conflicts using standard tools for three-way merge.
	*
	* This function is just to set-up such an arrangement, and the
	* actual merge uses threeway_merge() function.
	*/
	static void setup_emu23(void)
	{
	/* stage0 contains I, stage1 H, stage2 M.
	* move stage2 to stage3, and create stage2 entries
	* by scanning stage0 and stage1 entries.
	*/
	int i, namelen, size;
	struct cache_entry ce, stage2;

	for (i = 0; i < active_nr; i++) {
	ce = active_cache[i];
	if (ce_stage(ce) != 2)
	continue;
	/* hoist them up to stage 3 */
	namelen = ce_namelen(ce);
	ce->ce_flags = create_ce_flags(namelen, 3);
	}

	for (i = 0; i < active_nr; i++) {
	ce = active_cache[i];
	if (ce_stage(ce) > 1)
	continue;
	namelen = ce_namelen(ce);
	size = cache_entry_size(namelen);
	stage2 = xmalloc(size);
	memcpy(stage2, ce, size);
	stage2->ce_flags = create_ce_flags(namelen, 2);
	if (add_cache_entry(stage2, ADD_CACHE_OK_TO_ADD) < 0)
	die("cannot merge index and our head tree");

	/* We are done with this name, so skip to next name */
	while (i < active_nr &&
	ce_namelen(active_cache[i]) == namelen &&
	!memcmp(active_cache[i]->name, ce->name, namelen))
	i++;
	i--; /* compensate for the loop control */
	}
	}

	/*
	* One-way merge.
	*
	* The rule is:
	* - take the stat information from stage0, take the data from stage1
	*/
	static int oneway_merge(struct cache_entry src, struct cache_entry dst,
	struct cache_entry **next, int tail)
	{
	struct cache_entry *old = src[0];
	struct cache_entry *a = src[1];

	if (src[2] \|\| src[3])
	return -1;

	if (!a)
	return 0;
	if (old && same(old, a)) {
	*dst++ = old;
	return 1;
	}
	return merged_entry(a, NULL, dst);
	}

	static void check_updates(struct cache_entry **src, int nr)
	{
	static struct checkout state = {
	.base_dir = "",
	.force = 1,
	.quiet = 1,
	.refresh_cache = 1,
	};
	unsigned short mask = htons(CE_UPDATE);
	while (nr--) {
	struct cache_entry ce = src++;
	if (!ce->ce_mode) {
	if (update)
	unlink(ce->name);
	continue;
	}
	if (ce->ce_flags & mask) {
	ce->ce_flags &= ~mask;
	if (update)
	checkout_entry(ce, &state);
	}
	}
	}

	typedef int (merge_fn_t)(struct cache_entry , struct cache_entry , struct cache_entry *, int);

	static void merge_cache(struct cache_entry **src, int nr, merge_fn_t fn)
	{
	struct cache_entry **dst = src;
	int tail = nr;

	while (nr) {
	int entries;
	struct cache_entry name, ce, *stages[4] = { NULL, };

	name = ce = *src;
	for (;;) {
	int stage = ce_stage(ce);
	stages[stage] = ce;
	ce = *++src;
	active_nr--;
	if (!--nr)
	break;
	if (!path_matches(ce, name))
	break;
	}

	entries = fn(stages, dst, src, tail);
	if (entries < 0)
	reject_merge(name);
	dst += entries;
	active_nr += entries;
	}
	check_updates(active_cache, active_nr);
	}

	static int read_cache_unmerged(void)
	{
	int i, deleted;
	struct cache_entry **dst;

	read_cache();
	dst = active_cache;
	deleted = 0;
	for (i = 0; i < active_nr; i++) {
	struct cache_entry *ce = active_cache[i];
	if (ce_stage(ce)) {
	deleted++;
	continue;
	}
	if (deleted)
	*dst = ce;
	dst++;
	}
	active_nr -= deleted;
	return deleted;
	}

	static const char read_tree_usage[] = "git-read-tree (<sha> \| -m [-u] <sha1> [<sha2> [<sha3>]])";

	static struct cache_file cache_file;

	int main(int argc, char **argv)
	{
	int i, newfd, merge, reset, emu23;
	unsigned char sha1[20];

	newfd = hold_index_file_for_update(&cache_file, get_index_file());
	if (newfd < 0)
	die("unable to create new cachefile");

	merge = 0;
	reset = 0;
	emu23 = 0;
	for (i = 1; i < argc; i++) {
	const char *arg = argv[i];

	/* "-u" means "update", meaning that a merge will update the working directory */
	if (!strcmp(arg, "-u")) {
	update = 1;
	continue;
	}

	/* This differs from "-m" in that we'll silently ignore unmerged entries */
	if (!strcmp(arg, "--reset")) {
	if (stage \|\| merge \|\| emu23)
	usage(read_tree_usage);
	reset = 1;
	merge = 1;
	stage = 1;
	read_cache_unmerged();
	continue;
	}

	/* "-m" stands for "merge", meaning we start in stage 1 */
	if (!strcmp(arg, "-m")) {
	if (stage \|\| merge \|\| emu23)
	usage(read_tree_usage);
	if (read_cache_unmerged())
	die("you need to resolve your current index first");
	stage = 1;
	merge = 1;
	continue;
	}

	/* "-emu23" uses 3-way merge logic to perform fast-forward */
	if (!strcmp(arg, "--emu23")) {
	if (stage \|\| merge \|\| emu23)
	usage(read_tree_usage);
	if (read_cache_unmerged())
	die("you need to resolve your current index first");
	merge = emu23 = stage = 1;
	continue;
	}

	if (get_sha1(arg, sha1) < 0)
	usage(read_tree_usage);
	if (stage > 3)
	usage(read_tree_usage);
	if (unpack_tree(sha1) < 0)
	die("failed to unpack tree object %s", arg);
	stage++;
	}
	if (update && !merge)
	usage(read_tree_usage);
	if (merge) {
	static const merge_fn_t merge_function[] = {
	[1] = oneway_merge,
	[2] = twoway_merge,
	[3] = threeway_merge,
	};
	merge_fn_t fn;

	if (stage < 2 \|\| stage > 4)
	die("just how do you expect me to merge %d trees?", stage-1);
	if (emu23 && stage != 3)
	die("--emu23 takes only two trees");
	fn = merge_function[stage-1];
	if (stage == 3 && emu23) {
	setup_emu23();
	fn = merge_function[3];
	}
	merge_cache(active_cache, active_nr, fn);
	}
	if (write_cache(newfd, active_cache, active_nr) \|\|
	commit_index_file(&cache_file))
	die("unable to write new index file");
	return 0;
	}