604 lines
16 KiB
C
604 lines
16 KiB
C
/*
|
|
* GIT - The information manager from hell
|
|
*
|
|
* Copyright (C) Linus Torvalds, 2005
|
|
*/
|
|
#include "cache.h"
|
|
|
|
static int stage = 0;
|
|
static int update = 0;
|
|
|
|
static int unpack_tree(unsigned char *sha1)
|
|
{
|
|
void *buffer;
|
|
unsigned long size;
|
|
int ret;
|
|
|
|
buffer = read_object_with_reference(sha1, "tree", &size, NULL);
|
|
if (!buffer)
|
|
return -1;
|
|
ret = read_tree(buffer, size, stage, NULL);
|
|
free(buffer);
|
|
return ret;
|
|
}
|
|
|
|
static int path_matches(struct cache_entry *a, struct cache_entry *b)
|
|
{
|
|
int len = ce_namelen(a);
|
|
return ce_namelen(b) == len &&
|
|
!memcmp(a->name, b->name, len);
|
|
}
|
|
|
|
static int same(struct cache_entry *a, struct cache_entry *b)
|
|
{
|
|
return a->ce_mode == b->ce_mode &&
|
|
!memcmp(a->sha1, b->sha1, 20);
|
|
}
|
|
|
|
|
|
/*
|
|
* This removes all trivial merges that don't change the tree
|
|
* and collapses them to state 0.
|
|
*/
|
|
static struct cache_entry *merge_entries(struct cache_entry *a,
|
|
struct cache_entry *b,
|
|
struct cache_entry *c)
|
|
{
|
|
/*
|
|
* Ok, all three entries describe the same
|
|
* filename, but maybe the contents or file
|
|
* mode have changed?
|
|
*
|
|
* The trivial cases end up being the ones where two
|
|
* out of three files are the same:
|
|
* - both destinations the same, trivially take either
|
|
* - one of the destination versions hasn't changed,
|
|
* take the other.
|
|
*
|
|
* The "all entries exactly the same" case falls out as
|
|
* a special case of any of the "two same" cases.
|
|
*
|
|
* Here "a" is "original", and "b" and "c" are the two
|
|
* trees we are merging.
|
|
*/
|
|
if (a && b && c) {
|
|
if (same(b,c))
|
|
return c;
|
|
if (same(a,b))
|
|
return c;
|
|
if (same(a,c))
|
|
return b;
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
/*
|
|
* When a CE gets turned into an unmerged entry, we
|
|
* want it to be up-to-date
|
|
*/
|
|
static void verify_uptodate(struct cache_entry *ce)
|
|
{
|
|
struct stat st;
|
|
|
|
if (!lstat(ce->name, &st)) {
|
|
unsigned changed = ce_match_stat(ce, &st);
|
|
if (!changed)
|
|
return;
|
|
errno = 0;
|
|
}
|
|
if (errno == ENOENT)
|
|
return;
|
|
die("Entry '%s' not uptodate. Cannot merge.", ce->name);
|
|
}
|
|
|
|
/*
|
|
* If the old tree contained a CE that isn't even in the
|
|
* result, that's always a problem, regardless of whether
|
|
* it's up-to-date or not (ie it can be a file that we
|
|
* have updated but not committed yet).
|
|
*/
|
|
static void reject_merge(struct cache_entry *ce)
|
|
{
|
|
die("Entry '%s' would be overwritten by merge. Cannot merge.", ce->name);
|
|
}
|
|
|
|
static int merged_entry_internal(struct cache_entry *merge, struct cache_entry *old, struct cache_entry **dst, int allow_dirty)
|
|
{
|
|
merge->ce_flags |= htons(CE_UPDATE);
|
|
if (old) {
|
|
/*
|
|
* See if we can re-use the old CE directly?
|
|
* That way we get the uptodate stat info.
|
|
*
|
|
* This also removes the UPDATE flag on
|
|
* a match.
|
|
*/
|
|
if (same(old, merge)) {
|
|
*merge = *old;
|
|
} else if (!allow_dirty) {
|
|
verify_uptodate(old);
|
|
}
|
|
}
|
|
merge->ce_flags &= ~htons(CE_STAGEMASK);
|
|
*dst++ = merge;
|
|
return 1;
|
|
}
|
|
|
|
static int merged_entry_allow_dirty(struct cache_entry *merge, struct cache_entry *old, struct cache_entry **dst)
|
|
{
|
|
return merged_entry_internal(merge, old, dst, 1);
|
|
}
|
|
|
|
static int merged_entry(struct cache_entry *merge, struct cache_entry *old, struct cache_entry **dst)
|
|
{
|
|
return merged_entry_internal(merge, old, dst, 0);
|
|
}
|
|
|
|
static int deleted_entry(struct cache_entry *ce, struct cache_entry *old, struct cache_entry **dst)
|
|
{
|
|
if (old)
|
|
verify_uptodate(old);
|
|
ce->ce_mode = 0;
|
|
*dst++ = ce;
|
|
return 1;
|
|
}
|
|
|
|
static int causes_df_conflict(struct cache_entry *ce, int stage,
|
|
struct cache_entry **dst_,
|
|
struct cache_entry **next_,
|
|
int tail)
|
|
{
|
|
/* This is called during the merge operation and walking
|
|
* the active_cache[] array is messy, because it is in the
|
|
* middle of overlapping copy operation. The invariants
|
|
* are:
|
|
* (1) active_cache points at the first (zeroth) entry.
|
|
* (2) up to dst pointer are resolved entries.
|
|
* (3) from the next pointer (head-inclusive) to the tail
|
|
* of the active_cache array have the remaining paths
|
|
* to be processed. There can be a gap between dst
|
|
* and next. Note that next is called "src" in the
|
|
* merge_cache() function, and tail is the original
|
|
* end of active_cache array when merge_cache() started.
|
|
* (4) the path corresponding to *ce is not found in (2)
|
|
* or (3). It is in the gap.
|
|
*
|
|
* active_cache -----......+++++++++++++.
|
|
* ^dst ^next ^tail
|
|
*/
|
|
int i, next, dst;
|
|
const char *path = ce->name;
|
|
int namelen = ce_namelen(ce);
|
|
|
|
next = next_ - active_cache;
|
|
dst = dst_ - active_cache;
|
|
|
|
for (i = 0; i < tail; i++) {
|
|
int entlen, len;
|
|
const char *one, *two;
|
|
if (dst <= i && i < next)
|
|
continue;
|
|
ce = active_cache[i];
|
|
if (ce_stage(ce) != stage)
|
|
continue;
|
|
/* If ce->name is a prefix of path, then path is a file
|
|
* that hangs underneath ce->name, which is bad.
|
|
* If path is a prefix of ce->name, then it is the
|
|
* other way around which also is bad.
|
|
*/
|
|
entlen = ce_namelen(ce);
|
|
if (namelen == entlen)
|
|
continue;
|
|
if (namelen < entlen) {
|
|
len = namelen;
|
|
one = path;
|
|
two = ce->name;
|
|
} else {
|
|
len = entlen;
|
|
one = ce->name;
|
|
two = path;
|
|
}
|
|
if (memcmp(one, two, len))
|
|
continue;
|
|
if (two[len] == '/')
|
|
return 1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static int threeway_merge(struct cache_entry *stages[4],
|
|
struct cache_entry **dst,
|
|
struct cache_entry **next, int tail)
|
|
{
|
|
struct cache_entry *old = stages[0];
|
|
struct cache_entry *a = stages[1], *b = stages[2], *c = stages[3];
|
|
struct cache_entry *merge;
|
|
int count;
|
|
|
|
/* #5ALT */
|
|
if (!a && b && c && same(b, c)) {
|
|
if (old && !same(b, old))
|
|
return -1;
|
|
return merged_entry_allow_dirty(b, old, dst);
|
|
}
|
|
/* #2ALT and #3ALT */
|
|
if (!a && (!!b != !!c)) {
|
|
/*
|
|
* The reason we need to worry about directory/file
|
|
* conflicts only in #2ALT and #3ALT case is this:
|
|
*
|
|
* (1) For all other cases that read-tree internally
|
|
* resolves a path, we always have such a path in
|
|
* *both* stage2 and stage3 when we begin.
|
|
* Traditionally, the behaviour has been even
|
|
* stricter and we did not resolve a path without
|
|
* initially being in all of stage1, 2, and 3.
|
|
*
|
|
* (2) When read-tree finishes, all resolved paths (i.e.
|
|
* the paths that are in stage0) must have come from
|
|
* either stage2 or stage3. It is not possible to
|
|
* have a stage0 path as a result of a merge if
|
|
* neither stage2 nor stage3 had that path.
|
|
*
|
|
* (3) It is guaranteed that just after reading the
|
|
* stages, each stage cannot have directory/file
|
|
* conflicts on its own, because they are populated
|
|
* by reading hierarchy of a tree. Combined with
|
|
* (1) and (2) above, this means that no matter what
|
|
* combination of paths we take from stage2 and
|
|
* stage3 as a result of a merge, they cannot cause
|
|
* a directory/file conflict situation (otherwise
|
|
* the "guilty" path would have already had such a
|
|
* conflict in the original stage, either stage2
|
|
* or stage3). Although its stage2 is synthesized
|
|
* by overlaying the current index on top of "our
|
|
* head" tree, --emu23 case also has this guarantee,
|
|
* by calling add_cache_entry() to create such stage2
|
|
* entries.
|
|
*
|
|
* (4) Only #2ALT and #3ALT lack the guarantee (1).
|
|
* They resolve paths that exist only in stage2
|
|
* or stage3. The stage2 tree may have a file DF
|
|
* while stage3 tree may have a file DF/DF. If
|
|
* #2ALT and #3ALT rules happen to apply to both
|
|
* of them, we would end up having DF (coming from
|
|
* stage2) and DF/DF (from stage3) in the result.
|
|
* When we attempt to resolve a path that exists
|
|
* only in stage2, we need to make sure there is
|
|
* no path that would conflict with it in stage3
|
|
* and vice versa.
|
|
*/
|
|
if (c) { /* #2ALT */
|
|
if (!causes_df_conflict(c, 2, dst, next, tail) &&
|
|
(!old || same(c, old)))
|
|
return merged_entry_allow_dirty(c, old, dst);
|
|
}
|
|
else { /* #3ALT */
|
|
if (!causes_df_conflict(b, 3, dst, next, tail) &&
|
|
(!old || same(b, old)))
|
|
return merged_entry_allow_dirty(b, old, dst);
|
|
}
|
|
/* otherwise we will apply the original rule */
|
|
}
|
|
/* #14ALT */
|
|
if (a && b && c && same(a, b) && !same(a, c)) {
|
|
if (old && same(old, c))
|
|
return merged_entry_allow_dirty(c, old, dst);
|
|
/* otherwise the regular rule applies */
|
|
}
|
|
/*
|
|
* If we have an entry in the index cache ("old"), then we want
|
|
* to make sure that it matches any entries in stage 2 ("first
|
|
* branch", aka "b").
|
|
*/
|
|
if (old) {
|
|
if (!b || !same(old, b))
|
|
return -1;
|
|
}
|
|
merge = merge_entries(a, b, c);
|
|
if (merge)
|
|
return merged_entry(merge, old, dst);
|
|
if (old)
|
|
verify_uptodate(old);
|
|
count = 0;
|
|
if (a) { *dst++ = a; count++; }
|
|
if (b) { *dst++ = b; count++; }
|
|
if (c) { *dst++ = c; count++; }
|
|
return count;
|
|
}
|
|
|
|
/*
|
|
* Two-way merge.
|
|
*
|
|
* The rule is to "carry forward" what is in the index without losing
|
|
* information across a "fast forward", favoring a successful merge
|
|
* over a merge failure when it makes sense. For details of the
|
|
* "carry forward" rule, please see <Documentation/git-read-tree.txt>.
|
|
*
|
|
*/
|
|
static int twoway_merge(struct cache_entry **src, struct cache_entry **dst,
|
|
struct cache_entry **next, int tail)
|
|
{
|
|
struct cache_entry *current = src[0];
|
|
struct cache_entry *oldtree = src[1], *newtree = src[2];
|
|
|
|
if (src[3])
|
|
return -1;
|
|
|
|
if (current) {
|
|
if ((!oldtree && !newtree) || /* 4 and 5 */
|
|
(!oldtree && newtree &&
|
|
same(current, newtree)) || /* 6 and 7 */
|
|
(oldtree && newtree &&
|
|
same(oldtree, newtree)) || /* 14 and 15 */
|
|
(oldtree && newtree &&
|
|
!same(oldtree, newtree) && /* 18 and 19*/
|
|
same(current, newtree))) {
|
|
*dst++ = current;
|
|
return 1;
|
|
}
|
|
else if (oldtree && !newtree && same(current, oldtree)) {
|
|
/* 10 or 11 */
|
|
return deleted_entry(oldtree, current, dst);
|
|
}
|
|
else if (oldtree && newtree &&
|
|
same(current, oldtree) && !same(current, newtree)) {
|
|
/* 20 or 21 */
|
|
return merged_entry(newtree, current, dst);
|
|
}
|
|
else
|
|
/* all other failures */
|
|
return -1;
|
|
}
|
|
else if (newtree)
|
|
return merged_entry(newtree, current, dst);
|
|
else
|
|
return deleted_entry(oldtree, current, dst);
|
|
}
|
|
|
|
/*
|
|
* Two-way merge emulated with three-way merge.
|
|
*
|
|
* This treats "read-tree -m H M" by transforming it internally
|
|
* into "read-tree -m H I+H M", where I+H is a tree that would
|
|
* contain the contents of the current index file, overlayed on
|
|
* top of H. Unlike the traditional two-way merge, this leaves
|
|
* the stages in the resulting index file and lets the user resolve
|
|
* the merge conflicts using standard tools for three-way merge.
|
|
*
|
|
* This function is just to set-up such an arrangement, and the
|
|
* actual merge uses threeway_merge() function.
|
|
*/
|
|
static void setup_emu23(void)
|
|
{
|
|
/* stage0 contains I, stage1 H, stage2 M.
|
|
* move stage2 to stage3, and create stage2 entries
|
|
* by scanning stage0 and stage1 entries.
|
|
*/
|
|
int i, namelen, size;
|
|
struct cache_entry *ce, *stage2;
|
|
|
|
for (i = 0; i < active_nr; i++) {
|
|
ce = active_cache[i];
|
|
if (ce_stage(ce) != 2)
|
|
continue;
|
|
/* hoist them up to stage 3 */
|
|
namelen = ce_namelen(ce);
|
|
ce->ce_flags = create_ce_flags(namelen, 3);
|
|
}
|
|
|
|
for (i = 0; i < active_nr; i++) {
|
|
ce = active_cache[i];
|
|
if (ce_stage(ce) > 1)
|
|
continue;
|
|
namelen = ce_namelen(ce);
|
|
size = cache_entry_size(namelen);
|
|
stage2 = xmalloc(size);
|
|
memcpy(stage2, ce, size);
|
|
stage2->ce_flags = create_ce_flags(namelen, 2);
|
|
if (add_cache_entry(stage2, ADD_CACHE_OK_TO_ADD) < 0)
|
|
die("cannot merge index and our head tree");
|
|
|
|
/* We are done with this name, so skip to next name */
|
|
while (i < active_nr &&
|
|
ce_namelen(active_cache[i]) == namelen &&
|
|
!memcmp(active_cache[i]->name, ce->name, namelen))
|
|
i++;
|
|
i--; /* compensate for the loop control */
|
|
}
|
|
}
|
|
|
|
/*
|
|
* One-way merge.
|
|
*
|
|
* The rule is:
|
|
* - take the stat information from stage0, take the data from stage1
|
|
*/
|
|
static int oneway_merge(struct cache_entry **src, struct cache_entry **dst,
|
|
struct cache_entry **next, int tail)
|
|
{
|
|
struct cache_entry *old = src[0];
|
|
struct cache_entry *a = src[1];
|
|
|
|
if (src[2] || src[3])
|
|
return -1;
|
|
|
|
if (!a)
|
|
return 0;
|
|
if (old && same(old, a)) {
|
|
*dst++ = old;
|
|
return 1;
|
|
}
|
|
return merged_entry(a, NULL, dst);
|
|
}
|
|
|
|
static void check_updates(struct cache_entry **src, int nr)
|
|
{
|
|
static struct checkout state = {
|
|
.base_dir = "",
|
|
.force = 1,
|
|
.quiet = 1,
|
|
.refresh_cache = 1,
|
|
};
|
|
unsigned short mask = htons(CE_UPDATE);
|
|
while (nr--) {
|
|
struct cache_entry *ce = *src++;
|
|
if (!ce->ce_mode) {
|
|
if (update)
|
|
unlink(ce->name);
|
|
continue;
|
|
}
|
|
if (ce->ce_flags & mask) {
|
|
ce->ce_flags &= ~mask;
|
|
if (update)
|
|
checkout_entry(ce, &state);
|
|
}
|
|
}
|
|
}
|
|
|
|
typedef int (*merge_fn_t)(struct cache_entry **, struct cache_entry **, struct cache_entry **, int);
|
|
|
|
static void merge_cache(struct cache_entry **src, int nr, merge_fn_t fn)
|
|
{
|
|
struct cache_entry **dst = src;
|
|
int tail = nr;
|
|
|
|
while (nr) {
|
|
int entries;
|
|
struct cache_entry *name, *ce, *stages[4] = { NULL, };
|
|
|
|
name = ce = *src;
|
|
for (;;) {
|
|
int stage = ce_stage(ce);
|
|
stages[stage] = ce;
|
|
ce = *++src;
|
|
active_nr--;
|
|
if (!--nr)
|
|
break;
|
|
if (!path_matches(ce, name))
|
|
break;
|
|
}
|
|
|
|
entries = fn(stages, dst, src, tail);
|
|
if (entries < 0)
|
|
reject_merge(name);
|
|
dst += entries;
|
|
active_nr += entries;
|
|
}
|
|
check_updates(active_cache, active_nr);
|
|
}
|
|
|
|
static int read_cache_unmerged(void)
|
|
{
|
|
int i, deleted;
|
|
struct cache_entry **dst;
|
|
|
|
read_cache();
|
|
dst = active_cache;
|
|
deleted = 0;
|
|
for (i = 0; i < active_nr; i++) {
|
|
struct cache_entry *ce = active_cache[i];
|
|
if (ce_stage(ce)) {
|
|
deleted++;
|
|
continue;
|
|
}
|
|
if (deleted)
|
|
*dst = ce;
|
|
dst++;
|
|
}
|
|
active_nr -= deleted;
|
|
return deleted;
|
|
}
|
|
|
|
static char *read_tree_usage = "git-read-tree (<sha> | -m [-u] <sha1> [<sha2> [<sha3>]])";
|
|
|
|
static struct cache_file cache_file;
|
|
|
|
int main(int argc, char **argv)
|
|
{
|
|
int i, newfd, merge, reset, emu23;
|
|
unsigned char sha1[20];
|
|
|
|
newfd = hold_index_file_for_update(&cache_file, get_index_file());
|
|
if (newfd < 0)
|
|
die("unable to create new cachefile");
|
|
|
|
merge = 0;
|
|
reset = 0;
|
|
emu23 = 0;
|
|
for (i = 1; i < argc; i++) {
|
|
const char *arg = argv[i];
|
|
|
|
/* "-u" means "update", meaning that a merge will update the working directory */
|
|
if (!strcmp(arg, "-u")) {
|
|
update = 1;
|
|
continue;
|
|
}
|
|
|
|
/* This differs from "-m" in that we'll silently ignore unmerged entries */
|
|
if (!strcmp(arg, "--reset")) {
|
|
if (stage || merge || emu23)
|
|
usage(read_tree_usage);
|
|
reset = 1;
|
|
merge = 1;
|
|
stage = 1;
|
|
read_cache_unmerged();
|
|
continue;
|
|
}
|
|
|
|
/* "-m" stands for "merge", meaning we start in stage 1 */
|
|
if (!strcmp(arg, "-m")) {
|
|
if (stage || merge || emu23)
|
|
usage(read_tree_usage);
|
|
if (read_cache_unmerged())
|
|
die("you need to resolve your current index first");
|
|
stage = 1;
|
|
merge = 1;
|
|
continue;
|
|
}
|
|
|
|
/* "-emu23" uses 3-way merge logic to perform fast-forward */
|
|
if (!strcmp(arg, "--emu23")) {
|
|
if (stage || merge || emu23)
|
|
usage(read_tree_usage);
|
|
if (read_cache_unmerged())
|
|
die("you need to resolve your current index first");
|
|
merge = emu23 = stage = 1;
|
|
continue;
|
|
}
|
|
|
|
if (get_sha1(arg, sha1) < 0)
|
|
usage(read_tree_usage);
|
|
if (stage > 3)
|
|
usage(read_tree_usage);
|
|
if (unpack_tree(sha1) < 0)
|
|
die("failed to unpack tree object %s", arg);
|
|
stage++;
|
|
}
|
|
if (update && !merge)
|
|
usage(read_tree_usage);
|
|
if (merge) {
|
|
static const merge_fn_t merge_function[] = {
|
|
[1] = oneway_merge,
|
|
[2] = twoway_merge,
|
|
[3] = threeway_merge,
|
|
};
|
|
merge_fn_t fn;
|
|
|
|
if (stage < 2 || stage > 4)
|
|
die("just how do you expect me to merge %d trees?", stage-1);
|
|
if (emu23 && stage != 3)
|
|
die("--emu23 takes only two trees");
|
|
fn = merge_function[stage-1];
|
|
if (stage == 3 && emu23) {
|
|
setup_emu23();
|
|
fn = merge_function[3];
|
|
}
|
|
merge_cache(active_cache, active_nr, fn);
|
|
}
|
|
if (write_cache(newfd, active_cache, active_nr) ||
|
|
commit_index_file(&cache_file))
|
|
die("unable to write new index file");
|
|
return 0;
|
|
}
|