/* * GIT - The information manager from hell * * Copyright (C) Linus Torvalds, 2005 */ #include "cache.h" static int stage = 0; static int update = 0; static int unpack_tree(unsigned char *sha1) { void *buffer; unsigned long size; int ret; buffer = read_object_with_reference(sha1, "tree", &size, NULL); if (!buffer) return -1; ret = read_tree(buffer, size, stage); free(buffer); return ret; } static int path_matches(struct cache_entry *a, struct cache_entry *b) { int len = ce_namelen(a); return ce_namelen(b) == len && !memcmp(a->name, b->name, len); } static int same(struct cache_entry *a, struct cache_entry *b) { return a->ce_mode == b->ce_mode && !memcmp(a->sha1, b->sha1, 20); } /* * This removes all trivial merges that don't change the tree * and collapses them to state 0. */ static struct cache_entry *merge_entries(struct cache_entry *a, struct cache_entry *b, struct cache_entry *c) { /* * Ok, all three entries describe the same * filename, but maybe the contents or file * mode have changed? * * The trivial cases end up being the ones where two * out of three files are the same: * - both destinations the same, trivially take either * - one of the destination versions hasn't changed, * take the other. * * The "all entries exactly the same" case falls out as * a special case of any of the "two same" cases. * * Here "a" is "original", and "b" and "c" are the two * trees we are merging. */ if (a && b && c) { if (same(b,c)) return c; if (same(a,b)) return c; if (same(a,c)) return b; } return NULL; } /* * When a CE gets turned into an unmerged entry, we * want it to be up-to-date */ static void verify_uptodate(struct cache_entry *ce) { struct stat st; if (!lstat(ce->name, &st)) { unsigned changed = ce_match_stat(ce, &st); if (!changed) return; errno = 0; } if (errno == ENOENT) return; die("Entry '%s' not uptodate. Cannot merge.", ce->name); } /* * If the old tree contained a CE that isn't even in the * result, that's always a problem, regardless of whether * it's up-to-date or not (ie it can be a file that we * have updated but not committed yet). */ static void reject_merge(struct cache_entry *ce) { die("Entry '%s' would be overwritten by merge. Cannot merge.", ce->name); } static int merged_entry_internal(struct cache_entry *merge, struct cache_entry *old, struct cache_entry **dst, int allow_dirty) { merge->ce_flags |= htons(CE_UPDATE); if (old) { /* * See if we can re-use the old CE directly? * That way we get the uptodate stat info. * * This also removes the UPDATE flag on * a match. */ if (same(old, merge)) { *merge = *old; } else if (!allow_dirty) { verify_uptodate(old); } } merge->ce_flags &= ~htons(CE_STAGEMASK); *dst++ = merge; return 1; } static int merged_entry_allow_dirty(struct cache_entry *merge, struct cache_entry *old, struct cache_entry **dst) { return merged_entry_internal(merge, old, dst, 1); } static int merged_entry(struct cache_entry *merge, struct cache_entry *old, struct cache_entry **dst) { return merged_entry_internal(merge, old, dst, 0); } static int deleted_entry(struct cache_entry *ce, struct cache_entry *old, struct cache_entry **dst) { if (old) verify_uptodate(old); ce->ce_mode = 0; *dst++ = ce; return 1; } static int causes_df_conflict(struct cache_entry *ce, int stage, struct cache_entry **dst_, struct cache_entry **next_, int tail) { /* This is called during the merge operation and walking * the active_cache[] array is messy, because it is in the * middle of overlapping copy operation. The invariants * are: * (1) active_cache points at the first (zeroth) entry. * (2) up to dst pointer are resolved entries. * (3) from the next pointer (head-inclusive) to the tail * of the active_cache array have the remaining paths * to be processed. There can be a gap between dst * and next. Note that next is called "src" in the * merge_cache() function, and tail is the original * end of active_cache array when merge_cache() started. * (4) the path corresponding to *ce is not found in (2) * or (3). It is in the gap. * * active_cache -----......+++++++++++++. * ^dst ^next ^tail */ int i, next, dst; const char *path = ce->name; int namelen = ce_namelen(ce); next = next_ - active_cache; dst = dst_ - active_cache; for (i = 0; i < tail; i++) { int entlen, len; const char *one, *two; if (dst <= i && i < next) continue; ce = active_cache[i]; if (ce_stage(ce) != stage) continue; /* If ce->name is a prefix of path, then path is a file * that hangs underneath ce->name, which is bad. * If path is a prefix of ce->name, then it is the * other way around which also is bad. */ entlen = ce_namelen(ce); if (namelen == entlen) continue; if (namelen < entlen) { len = namelen; one = path; two = ce->name; } else { len = entlen; one = ce->name; two = path; } if (memcmp(one, two, len)) continue; if (two[len] == '/') return 1; } return 0; } static int threeway_merge(struct cache_entry *stages[4], struct cache_entry **dst, struct cache_entry **next, int tail) { struct cache_entry *old = stages[0]; struct cache_entry *a = stages[1], *b = stages[2], *c = stages[3]; struct cache_entry *merge; int count; /* #5ALT */ if (!a && b && c && same(b, c)) { if (old && !same(b, old)) return -1; return merged_entry_allow_dirty(b, old, dst); } /* #2ALT and #3ALT */ if (!a && (!!b != !!c)) { /* * The reason we need to worry about directory/file * conflicts only in #2ALT and #3ALT case is this: * * (1) For all other cases that read-tree internally * resolves a path, we always have such a path in * *both* stage2 and stage3 when we begin. * Traditionally, the behaviour has been even * stricter and we did not resolve a path without * initially being in all of stage1, 2, and 3. * * (2) When read-tree finishes, all resolved paths (i.e. * the paths that are in stage0) must have come from * either stage2 or stage3. It is not possible to * have a stage0 path as a result of a merge if * neither stage2 nor stage3 had that path. * * (3) It is guaranteed that just after reading the * stages, each stage cannot have directory/file * conflicts on its own, because they are populated * by reading hierarchy of a tree. Combined with * (1) and (2) above, this means that no matter what * combination of paths we take from stage2 and * stage3 as a result of a merge, they cannot cause * a directory/file conflict situation (otherwise * the "guilty" path would have already had such a * conflict in the original stage, either stage2 * or stage3). Although its stage2 is synthesized * by overlaying the current index on top of "our * head" tree, --emu23 case also has this guarantee, * by calling add_cache_entry() to create such stage2 * entries. * * (4) Only #2ALT and #3ALT lack the guarantee (1). * They resolve paths that exist only in stage2 * or stage3. The stage2 tree may have a file DF * while stage3 tree may have a file DF/DF. If * #2ALT and #3ALT rules happen to apply to both * of them, we would end up having DF (coming from * stage2) and DF/DF (from stage3) in the result. * When we attempt to resolve a path that exists * only in stage2, we need to make sure there is * no path that would conflict with it in stage3 * and vice versa. */ if (c) { /* #2ALT */ if (!causes_df_conflict(c, 2, dst, next, tail) && (!old || same(c, old))) return merged_entry_allow_dirty(c, old, dst); } else { /* #3ALT */ if (!causes_df_conflict(b, 3, dst, next, tail) && (!old || same(b, old))) return merged_entry_allow_dirty(b, old, dst); } /* otherwise we will apply the original rule */ } /* * If we have an entry in the index cache ("old"), then we want * to make sure that it matches any entries in stage 2 ("first * branch", aka "b"). */ if (old) { if (!b || !same(old, b)) return -1; } merge = merge_entries(a, b, c); if (merge) return merged_entry(merge, old, dst); if (old) verify_uptodate(old); count = 0; if (a) { *dst++ = a; count++; } if (b) { *dst++ = b; count++; } if (c) { *dst++ = c; count++; } return count; } /* * Two-way merge. * * The rule is to "carry forward" what is in the index without losing * information across a "fast forward", favoring a successful merge * over a merge failure when it makes sense. For details of the * "carry forward" rule, please see . * */ static int twoway_merge(struct cache_entry **src, struct cache_entry **dst, struct cache_entry **next, int tail) { struct cache_entry *current = src[0]; struct cache_entry *oldtree = src[1], *newtree = src[2]; if (src[3]) return -1; if (current) { if ((!oldtree && !newtree) || /* 4 and 5 */ (!oldtree && newtree && same(current, newtree)) || /* 6 and 7 */ (oldtree && newtree && same(oldtree, newtree)) || /* 14 and 15 */ (oldtree && newtree && !same(oldtree, newtree) && /* 18 and 19*/ same(current, newtree))) { *dst++ = current; return 1; } else if (oldtree && !newtree && same(current, oldtree)) { /* 10 or 11 */ return deleted_entry(oldtree, current, dst); } else if (oldtree && newtree && same(current, oldtree) && !same(current, newtree)) { /* 20 or 21 */ return merged_entry(newtree, current, dst); } else /* all other failures */ return -1; } else if (newtree) return merged_entry(newtree, current, dst); else return deleted_entry(oldtree, current, dst); } /* * Two-way merge emulated with three-way merge. * * This treats "read-tree -m H M" by transforming it internally * into "read-tree -m H I+H M", where I+H is a tree that would * contain the contents of the current index file, overlayed on * top of H. Unlike the traditional two-way merge, this leaves * the stages in the resulting index file and lets the user resolve * the merge conflicts using standard tools for three-way merge. * * This function is just to set-up such an arrangement, and the * actual merge uses threeway_merge() function. */ static void setup_emu23(void) { /* stage0 contains I, stage1 H, stage2 M. * move stage2 to stage3, and create stage2 entries * by scanning stage0 and stage1 entries. */ int i, namelen, size; struct cache_entry *ce, *stage2; for (i = 0; i < active_nr; i++) { ce = active_cache[i]; if (ce_stage(ce) != 2) continue; /* hoist them up to stage 3 */ namelen = ce_namelen(ce); ce->ce_flags = create_ce_flags(namelen, 3); } for (i = 0; i < active_nr; i++) { ce = active_cache[i]; if (ce_stage(ce) > 1) continue; namelen = ce_namelen(ce); size = cache_entry_size(namelen); stage2 = xmalloc(size); memcpy(stage2, ce, size); stage2->ce_flags = create_ce_flags(namelen, 2); if (add_cache_entry(stage2, ADD_CACHE_OK_TO_ADD) < 0) die("cannot merge index and our head tree"); /* We are done with this name, so skip to next name */ while (i < active_nr && ce_namelen(active_cache[i]) == namelen && !memcmp(active_cache[i]->name, ce->name, namelen)) i++; i--; /* compensate for the loop control */ } } /* * One-way merge. * * The rule is: * - take the stat information from stage0, take the data from stage1 */ static int oneway_merge(struct cache_entry **src, struct cache_entry **dst, struct cache_entry **next, int tail) { struct cache_entry *old = src[0]; struct cache_entry *a = src[1]; if (src[2] || src[3]) return -1; if (!a) return 0; if (old && same(old, a)) { *dst++ = old; return 1; } return merged_entry(a, NULL, dst); } static void check_updates(struct cache_entry **src, int nr) { static struct checkout state = { .base_dir = "", .force = 1, .quiet = 1, .refresh_cache = 1, }; unsigned short mask = htons(CE_UPDATE); while (nr--) { struct cache_entry *ce = *src++; if (!ce->ce_mode) { if (update) unlink(ce->name); continue; } if (ce->ce_flags & mask) { ce->ce_flags &= ~mask; if (update) checkout_entry(ce, &state); } } } typedef int (*merge_fn_t)(struct cache_entry **, struct cache_entry **, struct cache_entry **, int); static void merge_cache(struct cache_entry **src, int nr, merge_fn_t fn) { struct cache_entry **dst = src; int tail = nr; while (nr) { int entries; struct cache_entry *name, *ce, *stages[4] = { NULL, }; name = ce = *src; for (;;) { int stage = ce_stage(ce); stages[stage] = ce; ce = *++src; active_nr--; if (!--nr) break; if (!path_matches(ce, name)) break; } entries = fn(stages, dst, src, tail); if (entries < 0) reject_merge(name); dst += entries; active_nr += entries; } check_updates(active_cache, active_nr); } static int read_cache_unmerged(void) { int i, deleted; struct cache_entry **dst; read_cache(); dst = active_cache; deleted = 0; for (i = 0; i < active_nr; i++) { struct cache_entry *ce = active_cache[i]; if (ce_stage(ce)) { deleted++; continue; } if (deleted) *dst = ce; dst++; } active_nr -= deleted; return deleted; } static char *read_tree_usage = "git-read-tree ( | -m [-u] [ []])"; static struct cache_file cache_file; int main(int argc, char **argv) { int i, newfd, merge, reset, emu23; unsigned char sha1[20]; newfd = hold_index_file_for_update(&cache_file, get_index_file()); if (newfd < 0) die("unable to create new cachefile"); merge = 0; reset = 0; emu23 = 0; for (i = 1; i < argc; i++) { const char *arg = argv[i]; /* "-u" means "update", meaning that a merge will update the working directory */ if (!strcmp(arg, "-u")) { update = 1; continue; } /* This differs from "-m" in that we'll silently ignore unmerged entries */ if (!strcmp(arg, "--reset")) { if (stage || merge || emu23) usage(read_tree_usage); reset = 1; merge = 1; stage = 1; read_cache_unmerged(); } /* "-m" stands for "merge", meaning we start in stage 1 */ if (!strcmp(arg, "-m")) { if (stage || merge || emu23) usage(read_tree_usage); if (read_cache_unmerged()) die("you need to resolve your current index first"); stage = 1; merge = 1; continue; } /* "-emu23" uses 3-way merge logic to perform fast-forward */ if (!strcmp(arg, "--emu23")) { if (stage || merge || emu23) usage(read_tree_usage); if (read_cache_unmerged()) die("you need to resolve your current index first"); merge = emu23 = stage = 1; continue; } if (get_sha1(arg, sha1) < 0) usage(read_tree_usage); if (stage > 3) usage(read_tree_usage); if (unpack_tree(sha1) < 0) die("failed to unpack tree object %s", arg); stage++; } if (update && !merge) usage(read_tree_usage); if (merge) { static const merge_fn_t merge_function[] = { [1] = oneway_merge, [2] = twoway_merge, [3] = threeway_merge, }; merge_fn_t fn; if (stage < 2 || stage > 4) die("just how do you expect me to merge %d trees?", stage-1); if (emu23 && stage != 3) die("--emu23 takes only two trees"); fn = merge_function[stage-1]; if (stage == 3 && emu23) { setup_emu23(); fn = merge_function[3]; } merge_cache(active_cache, active_nr, fn); } if (write_cache(newfd, active_cache, active_nr) || commit_index_file(&cache_file)) die("unable to write new index file"); return 0; }