You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
603 lines
16 KiB
603 lines
16 KiB
/* |
|
* GIT - The information manager from hell |
|
* |
|
* Copyright (C) Linus Torvalds, 2005 |
|
*/ |
|
#include "cache.h" |
|
|
|
static int stage = 0; |
|
static int update = 0; |
|
|
|
static int unpack_tree(unsigned char *sha1) |
|
{ |
|
void *buffer; |
|
unsigned long size; |
|
int ret; |
|
|
|
buffer = read_object_with_reference(sha1, "tree", &size, NULL); |
|
if (!buffer) |
|
return -1; |
|
ret = read_tree(buffer, size, stage); |
|
free(buffer); |
|
return ret; |
|
} |
|
|
|
static int path_matches(struct cache_entry *a, struct cache_entry *b) |
|
{ |
|
int len = ce_namelen(a); |
|
return ce_namelen(b) == len && |
|
!memcmp(a->name, b->name, len); |
|
} |
|
|
|
static int same(struct cache_entry *a, struct cache_entry *b) |
|
{ |
|
return a->ce_mode == b->ce_mode && |
|
!memcmp(a->sha1, b->sha1, 20); |
|
} |
|
|
|
|
|
/* |
|
* This removes all trivial merges that don't change the tree |
|
* and collapses them to state 0. |
|
*/ |
|
static struct cache_entry *merge_entries(struct cache_entry *a, |
|
struct cache_entry *b, |
|
struct cache_entry *c) |
|
{ |
|
/* |
|
* Ok, all three entries describe the same |
|
* filename, but maybe the contents or file |
|
* mode have changed? |
|
* |
|
* The trivial cases end up being the ones where two |
|
* out of three files are the same: |
|
* - both destinations the same, trivially take either |
|
* - one of the destination versions hasn't changed, |
|
* take the other. |
|
* |
|
* The "all entries exactly the same" case falls out as |
|
* a special case of any of the "two same" cases. |
|
* |
|
* Here "a" is "original", and "b" and "c" are the two |
|
* trees we are merging. |
|
*/ |
|
if (a && b && c) { |
|
if (same(b,c)) |
|
return c; |
|
if (same(a,b)) |
|
return c; |
|
if (same(a,c)) |
|
return b; |
|
} |
|
return NULL; |
|
} |
|
|
|
/* |
|
* When a CE gets turned into an unmerged entry, we |
|
* want it to be up-to-date |
|
*/ |
|
static void verify_uptodate(struct cache_entry *ce) |
|
{ |
|
struct stat st; |
|
|
|
if (!lstat(ce->name, &st)) { |
|
unsigned changed = ce_match_stat(ce, &st); |
|
if (!changed) |
|
return; |
|
errno = 0; |
|
} |
|
if (errno == ENOENT) |
|
return; |
|
die("Entry '%s' not uptodate. Cannot merge.", ce->name); |
|
} |
|
|
|
/* |
|
* If the old tree contained a CE that isn't even in the |
|
* result, that's always a problem, regardless of whether |
|
* it's up-to-date or not (ie it can be a file that we |
|
* have updated but not committed yet). |
|
*/ |
|
static void reject_merge(struct cache_entry *ce) |
|
{ |
|
die("Entry '%s' would be overwritten by merge. Cannot merge.", ce->name); |
|
} |
|
|
|
static int merged_entry_internal(struct cache_entry *merge, struct cache_entry *old, struct cache_entry **dst, int allow_dirty) |
|
{ |
|
merge->ce_flags |= htons(CE_UPDATE); |
|
if (old) { |
|
/* |
|
* See if we can re-use the old CE directly? |
|
* That way we get the uptodate stat info. |
|
* |
|
* This also removes the UPDATE flag on |
|
* a match. |
|
*/ |
|
if (same(old, merge)) { |
|
*merge = *old; |
|
} else if (!allow_dirty) { |
|
verify_uptodate(old); |
|
} |
|
} |
|
merge->ce_flags &= ~htons(CE_STAGEMASK); |
|
*dst++ = merge; |
|
return 1; |
|
} |
|
|
|
static int merged_entry_allow_dirty(struct cache_entry *merge, struct cache_entry *old, struct cache_entry **dst) |
|
{ |
|
return merged_entry_internal(merge, old, dst, 1); |
|
} |
|
|
|
static int merged_entry(struct cache_entry *merge, struct cache_entry *old, struct cache_entry **dst) |
|
{ |
|
return merged_entry_internal(merge, old, dst, 0); |
|
} |
|
|
|
static int deleted_entry(struct cache_entry *ce, struct cache_entry *old, struct cache_entry **dst) |
|
{ |
|
if (old) |
|
verify_uptodate(old); |
|
ce->ce_mode = 0; |
|
*dst++ = ce; |
|
return 1; |
|
} |
|
|
|
static int causes_df_conflict(struct cache_entry *ce, int stage, |
|
struct cache_entry **dst_, |
|
struct cache_entry **next_, |
|
int tail) |
|
{ |
|
/* This is called during the merge operation and walking |
|
* the active_cache[] array is messy, because it is in the |
|
* middle of overlapping copy operation. The invariants |
|
* are: |
|
* (1) active_cache points at the first (zeroth) entry. |
|
* (2) up to dst pointer are resolved entries. |
|
* (3) from the next pointer (head-inclusive) to the tail |
|
* of the active_cache array have the remaining paths |
|
* to be processed. There can be a gap between dst |
|
* and next. Note that next is called "src" in the |
|
* merge_cache() function, and tail is the original |
|
* end of active_cache array when merge_cache() started. |
|
* (4) the path corresponding to *ce is not found in (2) |
|
* or (3). It is in the gap. |
|
* |
|
* active_cache -----......+++++++++++++. |
|
* ^dst ^next ^tail |
|
*/ |
|
int i, next, dst; |
|
const char *path = ce->name; |
|
int namelen = ce_namelen(ce); |
|
|
|
next = next_ - active_cache; |
|
dst = dst_ - active_cache; |
|
|
|
for (i = 0; i < tail; i++) { |
|
int entlen, len; |
|
const char *one, *two; |
|
if (dst <= i && i < next) |
|
continue; |
|
ce = active_cache[i]; |
|
if (ce_stage(ce) != stage) |
|
continue; |
|
/* If ce->name is a prefix of path, then path is a file |
|
* that hangs underneath ce->name, which is bad. |
|
* If path is a prefix of ce->name, then it is the |
|
* other way around which also is bad. |
|
*/ |
|
entlen = ce_namelen(ce); |
|
if (namelen == entlen) |
|
continue; |
|
if (namelen < entlen) { |
|
len = namelen; |
|
one = path; |
|
two = ce->name; |
|
} else { |
|
len = entlen; |
|
one = ce->name; |
|
two = path; |
|
} |
|
if (memcmp(one, two, len)) |
|
continue; |
|
if (two[len] == '/') |
|
return 1; |
|
} |
|
return 0; |
|
} |
|
|
|
static int threeway_merge(struct cache_entry *stages[4], |
|
struct cache_entry **dst, |
|
struct cache_entry **next, int tail) |
|
{ |
|
struct cache_entry *old = stages[0]; |
|
struct cache_entry *a = stages[1], *b = stages[2], *c = stages[3]; |
|
struct cache_entry *merge; |
|
int count; |
|
|
|
/* #5ALT */ |
|
if (!a && b && c && same(b, c)) { |
|
if (old && !same(b, old)) |
|
return -1; |
|
return merged_entry_allow_dirty(b, old, dst); |
|
} |
|
/* #2ALT and #3ALT */ |
|
if (!a && (!!b != !!c)) { |
|
/* |
|
* The reason we need to worry about directory/file |
|
* conflicts only in #2ALT and #3ALT case is this: |
|
* |
|
* (1) For all other cases that read-tree internally |
|
* resolves a path, we always have such a path in |
|
* *both* stage2 and stage3 when we begin. |
|
* Traditionally, the behaviour has been even |
|
* stricter and we did not resolve a path without |
|
* initially being in all of stage1, 2, and 3. |
|
* |
|
* (2) When read-tree finishes, all resolved paths (i.e. |
|
* the paths that are in stage0) must have come from |
|
* either stage2 or stage3. It is not possible to |
|
* have a stage0 path as a result of a merge if |
|
* neither stage2 nor stage3 had that path. |
|
* |
|
* (3) It is guaranteed that just after reading the |
|
* stages, each stage cannot have directory/file |
|
* conflicts on its own, because they are populated |
|
* by reading hierarchy of a tree. Combined with |
|
* (1) and (2) above, this means that no matter what |
|
* combination of paths we take from stage2 and |
|
* stage3 as a result of a merge, they cannot cause |
|
* a directory/file conflict situation (otherwise |
|
* the "guilty" path would have already had such a |
|
* conflict in the original stage, either stage2 |
|
* or stage3). Although its stage2 is synthesized |
|
* by overlaying the current index on top of "our |
|
* head" tree, --emu23 case also has this guarantee, |
|
* by calling add_cache_entry() to create such stage2 |
|
* entries. |
|
* |
|
* (4) Only #2ALT and #3ALT lack the guarantee (1). |
|
* They resolve paths that exist only in stage2 |
|
* or stage3. The stage2 tree may have a file DF |
|
* while stage3 tree may have a file DF/DF. If |
|
* #2ALT and #3ALT rules happen to apply to both |
|
* of them, we would end up having DF (coming from |
|
* stage2) and DF/DF (from stage3) in the result. |
|
* When we attempt to resolve a path that exists |
|
* only in stage2, we need to make sure there is |
|
* no path that would conflict with it in stage3 |
|
* and vice versa. |
|
*/ |
|
if (c) { /* #2ALT */ |
|
if (!causes_df_conflict(c, 2, dst, next, tail) && |
|
(!old || same(c, old))) |
|
return merged_entry_allow_dirty(c, old, dst); |
|
} |
|
else { /* #3ALT */ |
|
if (!causes_df_conflict(b, 3, dst, next, tail) && |
|
(!old || same(b, old))) |
|
return merged_entry_allow_dirty(b, old, dst); |
|
} |
|
/* otherwise we will apply the original rule */ |
|
} |
|
/* #14ALT */ |
|
if (a && b && c && same(a, b) && !same(a, c)) { |
|
if (old && same(old, c)) |
|
return merged_entry_allow_dirty(c, old, dst); |
|
/* otherwise the regular rule applies */ |
|
} |
|
/* |
|
* If we have an entry in the index cache ("old"), then we want |
|
* to make sure that it matches any entries in stage 2 ("first |
|
* branch", aka "b"). |
|
*/ |
|
if (old) { |
|
if (!b || !same(old, b)) |
|
return -1; |
|
} |
|
merge = merge_entries(a, b, c); |
|
if (merge) |
|
return merged_entry(merge, old, dst); |
|
if (old) |
|
verify_uptodate(old); |
|
count = 0; |
|
if (a) { *dst++ = a; count++; } |
|
if (b) { *dst++ = b; count++; } |
|
if (c) { *dst++ = c; count++; } |
|
return count; |
|
} |
|
|
|
/* |
|
* Two-way merge. |
|
* |
|
* The rule is to "carry forward" what is in the index without losing |
|
* information across a "fast forward", favoring a successful merge |
|
* over a merge failure when it makes sense. For details of the |
|
* "carry forward" rule, please see <Documentation/git-read-tree.txt>. |
|
* |
|
*/ |
|
static int twoway_merge(struct cache_entry **src, struct cache_entry **dst, |
|
struct cache_entry **next, int tail) |
|
{ |
|
struct cache_entry *current = src[0]; |
|
struct cache_entry *oldtree = src[1], *newtree = src[2]; |
|
|
|
if (src[3]) |
|
return -1; |
|
|
|
if (current) { |
|
if ((!oldtree && !newtree) || /* 4 and 5 */ |
|
(!oldtree && newtree && |
|
same(current, newtree)) || /* 6 and 7 */ |
|
(oldtree && newtree && |
|
same(oldtree, newtree)) || /* 14 and 15 */ |
|
(oldtree && newtree && |
|
!same(oldtree, newtree) && /* 18 and 19*/ |
|
same(current, newtree))) { |
|
*dst++ = current; |
|
return 1; |
|
} |
|
else if (oldtree && !newtree && same(current, oldtree)) { |
|
/* 10 or 11 */ |
|
return deleted_entry(oldtree, current, dst); |
|
} |
|
else if (oldtree && newtree && |
|
same(current, oldtree) && !same(current, newtree)) { |
|
/* 20 or 21 */ |
|
return merged_entry(newtree, current, dst); |
|
} |
|
else |
|
/* all other failures */ |
|
return -1; |
|
} |
|
else if (newtree) |
|
return merged_entry(newtree, current, dst); |
|
else |
|
return deleted_entry(oldtree, current, dst); |
|
} |
|
|
|
/* |
|
* Two-way merge emulated with three-way merge. |
|
* |
|
* This treats "read-tree -m H M" by transforming it internally |
|
* into "read-tree -m H I+H M", where I+H is a tree that would |
|
* contain the contents of the current index file, overlayed on |
|
* top of H. Unlike the traditional two-way merge, this leaves |
|
* the stages in the resulting index file and lets the user resolve |
|
* the merge conflicts using standard tools for three-way merge. |
|
* |
|
* This function is just to set-up such an arrangement, and the |
|
* actual merge uses threeway_merge() function. |
|
*/ |
|
static void setup_emu23(void) |
|
{ |
|
/* stage0 contains I, stage1 H, stage2 M. |
|
* move stage2 to stage3, and create stage2 entries |
|
* by scanning stage0 and stage1 entries. |
|
*/ |
|
int i, namelen, size; |
|
struct cache_entry *ce, *stage2; |
|
|
|
for (i = 0; i < active_nr; i++) { |
|
ce = active_cache[i]; |
|
if (ce_stage(ce) != 2) |
|
continue; |
|
/* hoist them up to stage 3 */ |
|
namelen = ce_namelen(ce); |
|
ce->ce_flags = create_ce_flags(namelen, 3); |
|
} |
|
|
|
for (i = 0; i < active_nr; i++) { |
|
ce = active_cache[i]; |
|
if (ce_stage(ce) > 1) |
|
continue; |
|
namelen = ce_namelen(ce); |
|
size = cache_entry_size(namelen); |
|
stage2 = xmalloc(size); |
|
memcpy(stage2, ce, size); |
|
stage2->ce_flags = create_ce_flags(namelen, 2); |
|
if (add_cache_entry(stage2, ADD_CACHE_OK_TO_ADD) < 0) |
|
die("cannot merge index and our head tree"); |
|
|
|
/* We are done with this name, so skip to next name */ |
|
while (i < active_nr && |
|
ce_namelen(active_cache[i]) == namelen && |
|
!memcmp(active_cache[i]->name, ce->name, namelen)) |
|
i++; |
|
i--; /* compensate for the loop control */ |
|
} |
|
} |
|
|
|
/* |
|
* One-way merge. |
|
* |
|
* The rule is: |
|
* - take the stat information from stage0, take the data from stage1 |
|
*/ |
|
static int oneway_merge(struct cache_entry **src, struct cache_entry **dst, |
|
struct cache_entry **next, int tail) |
|
{ |
|
struct cache_entry *old = src[0]; |
|
struct cache_entry *a = src[1]; |
|
|
|
if (src[2] || src[3]) |
|
return -1; |
|
|
|
if (!a) |
|
return 0; |
|
if (old && same(old, a)) { |
|
*dst++ = old; |
|
return 1; |
|
} |
|
return merged_entry(a, NULL, dst); |
|
} |
|
|
|
static void check_updates(struct cache_entry **src, int nr) |
|
{ |
|
static struct checkout state = { |
|
.base_dir = "", |
|
.force = 1, |
|
.quiet = 1, |
|
.refresh_cache = 1, |
|
}; |
|
unsigned short mask = htons(CE_UPDATE); |
|
while (nr--) { |
|
struct cache_entry *ce = *src++; |
|
if (!ce->ce_mode) { |
|
if (update) |
|
unlink(ce->name); |
|
continue; |
|
} |
|
if (ce->ce_flags & mask) { |
|
ce->ce_flags &= ~mask; |
|
if (update) |
|
checkout_entry(ce, &state); |
|
} |
|
} |
|
} |
|
|
|
typedef int (*merge_fn_t)(struct cache_entry **, struct cache_entry **, struct cache_entry **, int); |
|
|
|
static void merge_cache(struct cache_entry **src, int nr, merge_fn_t fn) |
|
{ |
|
struct cache_entry **dst = src; |
|
int tail = nr; |
|
|
|
while (nr) { |
|
int entries; |
|
struct cache_entry *name, *ce, *stages[4] = { NULL, }; |
|
|
|
name = ce = *src; |
|
for (;;) { |
|
int stage = ce_stage(ce); |
|
stages[stage] = ce; |
|
ce = *++src; |
|
active_nr--; |
|
if (!--nr) |
|
break; |
|
if (!path_matches(ce, name)) |
|
break; |
|
} |
|
|
|
entries = fn(stages, dst, src, tail); |
|
if (entries < 0) |
|
reject_merge(name); |
|
dst += entries; |
|
active_nr += entries; |
|
} |
|
check_updates(active_cache, active_nr); |
|
} |
|
|
|
static int read_cache_unmerged(void) |
|
{ |
|
int i, deleted; |
|
struct cache_entry **dst; |
|
|
|
read_cache(); |
|
dst = active_cache; |
|
deleted = 0; |
|
for (i = 0; i < active_nr; i++) { |
|
struct cache_entry *ce = active_cache[i]; |
|
if (ce_stage(ce)) { |
|
deleted++; |
|
continue; |
|
} |
|
if (deleted) |
|
*dst = ce; |
|
dst++; |
|
} |
|
active_nr -= deleted; |
|
return deleted; |
|
} |
|
|
|
static char *read_tree_usage = "git-read-tree (<sha> | -m [-u] <sha1> [<sha2> [<sha3>]])"; |
|
|
|
static struct cache_file cache_file; |
|
|
|
int main(int argc, char **argv) |
|
{ |
|
int i, newfd, merge, reset, emu23; |
|
unsigned char sha1[20]; |
|
|
|
newfd = hold_index_file_for_update(&cache_file, get_index_file()); |
|
if (newfd < 0) |
|
die("unable to create new cachefile"); |
|
|
|
merge = 0; |
|
reset = 0; |
|
emu23 = 0; |
|
for (i = 1; i < argc; i++) { |
|
const char *arg = argv[i]; |
|
|
|
/* "-u" means "update", meaning that a merge will update the working directory */ |
|
if (!strcmp(arg, "-u")) { |
|
update = 1; |
|
continue; |
|
} |
|
|
|
/* This differs from "-m" in that we'll silently ignore unmerged entries */ |
|
if (!strcmp(arg, "--reset")) { |
|
if (stage || merge || emu23) |
|
usage(read_tree_usage); |
|
reset = 1; |
|
merge = 1; |
|
stage = 1; |
|
read_cache_unmerged(); |
|
continue; |
|
} |
|
|
|
/* "-m" stands for "merge", meaning we start in stage 1 */ |
|
if (!strcmp(arg, "-m")) { |
|
if (stage || merge || emu23) |
|
usage(read_tree_usage); |
|
if (read_cache_unmerged()) |
|
die("you need to resolve your current index first"); |
|
stage = 1; |
|
merge = 1; |
|
continue; |
|
} |
|
|
|
/* "-emu23" uses 3-way merge logic to perform fast-forward */ |
|
if (!strcmp(arg, "--emu23")) { |
|
if (stage || merge || emu23) |
|
usage(read_tree_usage); |
|
if (read_cache_unmerged()) |
|
die("you need to resolve your current index first"); |
|
merge = emu23 = stage = 1; |
|
continue; |
|
} |
|
|
|
if (get_sha1(arg, sha1) < 0) |
|
usage(read_tree_usage); |
|
if (stage > 3) |
|
usage(read_tree_usage); |
|
if (unpack_tree(sha1) < 0) |
|
die("failed to unpack tree object %s", arg); |
|
stage++; |
|
} |
|
if (update && !merge) |
|
usage(read_tree_usage); |
|
if (merge) { |
|
static const merge_fn_t merge_function[] = { |
|
[1] = oneway_merge, |
|
[2] = twoway_merge, |
|
[3] = threeway_merge, |
|
}; |
|
merge_fn_t fn; |
|
|
|
if (stage < 2 || stage > 4) |
|
die("just how do you expect me to merge %d trees?", stage-1); |
|
if (emu23 && stage != 3) |
|
die("--emu23 takes only two trees"); |
|
fn = merge_function[stage-1]; |
|
if (stage == 3 && emu23) { |
|
setup_emu23(); |
|
fn = merge_function[3]; |
|
} |
|
merge_cache(active_cache, active_nr, fn); |
|
} |
|
if (write_cache(newfd, active_cache, active_nr) || |
|
commit_index_file(&cache_file)) |
|
die("unable to write new index file"); |
|
return 0; |
|
}
|
|
|