git-read-tree: simplify merge loops enormously

Stop trying to haev this stateful thing that keeps track of what it has
seen, and use a much simpler "gather all the different stages with the
same name together and just merge them in one go" approach.

Makes it a lot more understandable, and allows the different merge
algorithms to share the basic merge loop.
This commit is contained in:
Linus Torvalds
2005-06-06 14:01:58 -07:00
parent 96cd5429a4
commit d723c69063

View File

@ -39,27 +39,11 @@ static int same(struct cache_entry *a, struct cache_entry *b)
/* /*
* This removes all trivial merges that don't change the tree * This removes all trivial merges that don't change the tree
* and collapses them to state 0. * and collapses them to state 0.
*
* _Any_ other merge is left to user policy. That includes "both
* created the same file", and "both removed the same file" - which are
* trivial, but the user might still want to _note_ it.
*/ */
static struct cache_entry *merge_entries(struct cache_entry *a, static struct cache_entry *merge_entries(struct cache_entry *a,
struct cache_entry *b, struct cache_entry *b,
struct cache_entry *c) struct cache_entry *c)
{ {
int len = ce_namelen(a);
/*
* Are they all the same filename? We won't do
* any name merging
*/
if (ce_namelen(b) != len ||
ce_namelen(c) != len ||
memcmp(a->name, b->name, len) ||
memcmp(a->name, c->name, len))
return NULL;
/* /*
* Ok, all three entries describe the same * Ok, all three entries describe the same
* filename, but maybe the contents or file * filename, but maybe the contents or file
@ -77,12 +61,14 @@ static struct cache_entry *merge_entries(struct cache_entry *a,
* Here "a" is "original", and "b" and "c" are the two * Here "a" is "original", and "b" and "c" are the two
* trees we are merging. * trees we are merging.
*/ */
if (a && b && c) {
if (same(b,c)) if (same(b,c))
return c; return c;
if (same(a,b)) if (same(a,b))
return c; return c;
if (same(a,c)) if (same(a,c))
return b; return b;
}
return NULL; return NULL;
} }
@ -116,30 +102,10 @@ static void reject_merge(struct cache_entry *ce)
die("Entry '%s' would be overwritten by merge. Cannot merge.", ce->name); die("Entry '%s' would be overwritten by merge. Cannot merge.", ce->name);
} }
#define CHECK_OLD(ce) if (old && same(old, ce)) { verify_uptodate(old); old = NULL; } static int merged_entry(struct cache_entry *merge, struct cache_entry *old, struct cache_entry **dst)
static void trivially_merge_cache(struct cache_entry **src, int nr)
{ {
struct cache_entry **dst = src; merge->ce_flags |= htons(CE_UPDATE);
struct cache_entry *old = NULL; if (old) {
while (nr--) {
struct cache_entry *ce, *result;
ce = *src++;
/* We throw away original cache entries except for the stat information */
if (!ce_stage(ce)) {
if (old)
reject_merge(old);
old = ce;
active_nr--;
continue;
}
if (old && !path_matches(old, ce))
reject_merge(old);
if (nr > 1 && (result = merge_entries(ce, src[0], src[1])) != NULL) {
result->ce_flags |= htons(CE_UPDATE);
/* /*
* See if we can re-use the old CE directly? * See if we can re-use the old CE directly?
* That way we get the uptodate stat info. * That way we get the uptodate stat info.
@ -147,57 +113,43 @@ static void trivially_merge_cache(struct cache_entry **src, int nr)
* This also removes the UPDATE flag on * This also removes the UPDATE flag on
* a match. * a match.
*/ */
if (old && same(old, result)) { if (same(old, merge)) {
*result = *old; *merge = *old;
old = NULL; } else {
verify_uptodate(old);
} }
CHECK_OLD(ce);
CHECK_OLD(src[0]);
CHECK_OLD(src[1]);
ce = result;
ce->ce_flags &= ~htons(CE_STAGEMASK);
src += 2;
nr -= 2;
active_nr -= 2;
} }
merge->ce_flags &= ~htons(CE_STAGEMASK);
/* *dst++ = merge;
* If we had an old entry that we now effectively return 1;
* overwrite, make sure it wasn't dirty.
*/
CHECK_OLD(ce);
*dst++ = ce;
}
if (old)
reject_merge(old);
} }
/* static int threeway_merge(struct cache_entry *stages[4], struct cache_entry **dst)
* When we find a "stage2" entry in the two-way merge, that's
* the one that will remain. If we have an exact old match,
* we don't care whether the file is up-to-date or not, we just
* re-use the thing directly.
*
* If we didn't have an exact match, then we want to make sure
* that we've seen a stage1 that matched the old, and that the
* old file was up-to-date. Because it will be gone after this
* merge..
*/
static void twoway_check(struct cache_entry *old, int seen_stage1, struct cache_entry *ce)
{ {
if (path_matches(old, ce)) { struct cache_entry *old = stages[0];
struct cache_entry *a = stages[1], *b = stages[2], *c = stages[3];
struct cache_entry *merge;
int count;
/* /*
* This also removes the UPDATE flag on * If we have an entry in the index cache ("old"), then we want
* a match * to make sure that it matches any entries in stage 2 ("first
* branch", aka "b").
*/ */
if (same(old, ce)) { if (old) {
*ce = *old; if (!b || !same(old, b))
return; return -1;
}
if (!seen_stage1)
reject_merge(old);
} }
merge = merge_entries(a, b, c);
if (merge)
return merged_entry(merge, old, dst);
if (old)
verify_uptodate(old); verify_uptodate(old);
count = 0;
if (a) { *dst++ = a; count++; }
if (b) { *dst++ = b; count++; }
if (c) { *dst++ = c; count++; }
return count;
} }
/* /*
@ -208,79 +160,46 @@ static void twoway_check(struct cache_entry *old, int seen_stage1, struct cache_
* - if the current entry matches the new tree, we leave it * - if the current entry matches the new tree, we leave it
* as-is. Otherwise we require that it be up-to-date. * as-is. Otherwise we require that it be up-to-date.
*/ */
static void twoway_merge(struct cache_entry **src, int nr) static int twoway_merge(struct cache_entry **src, struct cache_entry **dst)
{ {
int seen_stage1 = 0; struct cache_entry *old = src[0];
struct cache_entry *old = NULL; struct cache_entry *a = src[1], *b = src[2];
struct cache_entry **dst = src;
while (nr--) { if (src[3])
struct cache_entry *ce = *src++; return -1;
int stage = ce_stage(ce);
switch (stage) { if (old) {
case 0: if (!a || !same(old, a))
return -1;
}
if (b)
return merged_entry(b, old, dst);
if (old) if (old)
reject_merge(old);
old = ce;
seen_stage1 = 0;
active_nr--;
continue;
case 1:
active_nr--;
if (!old)
continue;
if (!path_matches(old, ce) || !same(old, ce))
reject_merge(old);
seen_stage1 = 1;
continue;
case 2:
ce->ce_flags |= htons(CE_UPDATE);
if (old) {
twoway_check(old, seen_stage1, ce);
old = NULL;
}
ce->ce_flags &= ~htons(CE_STAGEMASK);
*dst++ = ce;
continue;
}
die("impossible two-way stage");
}
/*
* Unmatched with a new entry? Make sure it was
* at least uptodate in the working directory _and_
* the original tree..
*/
if (old) {
if (!seen_stage1)
reject_merge(old);
verify_uptodate(old); verify_uptodate(old);
} return 0;
} }
static void merge_stat_info(struct cache_entry **src, int nr) /*
* One-way merge.
*
* The rule is:
* - take the stat information from stage0, take the data from stage1
*/
static int oneway_merge(struct cache_entry **src, struct cache_entry **dst)
{ {
static struct cache_entry null_entry; struct cache_entry *old = src[0];
struct cache_entry **dst = src; struct cache_entry *a = src[1];
struct cache_entry *stat = &null_entry;
while (nr--) { if (src[2] || src[3])
struct cache_entry *ce = *src++; return -1;
/* We throw away original cache entries except for the stat information */ if (!a)
if (!ce_stage(ce)) { return 0;
stat = ce; if (old && same(old, a))
active_nr--; *a = *old;
continue; a->ce_flags &= ~htons(CE_STAGEMASK);
} *dst++ = a;
if (path_matches(ce, stat) && same(ce, stat)) return 1;
*ce = *stat;
ce->ce_flags &= ~htons(CE_STAGEMASK);
*dst++ = ce;
}
} }
static void check_updates(struct cache_entry **src, int nr) static void check_updates(struct cache_entry **src, int nr)
@ -302,6 +221,35 @@ static void check_updates(struct cache_entry **src, int nr)
} }
} }
static void merge_cache(struct cache_entry **src, int nr, int (*fn)(struct cache_entry **, struct cache_entry **))
{
struct cache_entry **dst = src;
while (nr) {
int entries;
struct cache_entry *name, *ce, *stages[4] = { NULL, };
name = ce = *src;
for (;;) {
int stage = ce_stage(ce);
stages[stage] = ce;
ce = *++src;
active_nr--;
if (!--nr)
break;
if (!path_matches(ce, name))
break;
}
entries = fn(stages, dst);
if (entries < 0)
reject_merge(name);
dst += entries;
active_nr += entries;
}
check_updates(active_cache, active_nr);
}
static char *read_tree_usage = "git-read-tree (<sha> | -m <sha1> [<sha2> [<sha3>]])"; static char *read_tree_usage = "git-read-tree (<sha> | -m <sha1> [<sha2> [<sha3>]])";
static struct cache_file cache_file; static struct cache_file cache_file;
@ -350,15 +298,14 @@ int main(int argc, char **argv)
if (merge) { if (merge) {
switch (stage) { switch (stage) {
case 4: /* Three-way merge */ case 4: /* Three-way merge */
trivially_merge_cache(active_cache, active_nr); merge_cache(active_cache, active_nr, threeway_merge);
check_updates(active_cache, active_nr);
break; break;
case 3: /* Update from one tree to another */ case 3: /* Update from one tree to another */
twoway_merge(active_cache, active_nr); merge_cache(active_cache, active_nr, twoway_merge);
check_updates(active_cache, active_nr); check_updates(active_cache, active_nr);
break; break;
case 2: /* Just read a tree, merge with old cache contents */ case 2: /* Just read a tree, merge with old cache contents */
merge_stat_info(active_cache, active_nr); merge_cache(active_cache, active_nr, oneway_merge);
break; break;
default: default:
die("just how do you expect me to merge %d trees?", stage-1); die("just how do you expect me to merge %d trees?", stage-1);