e76b45c2ddcdbd54b944aa72a774b45fa40cbfc3
#!/bin/bash
#
# git-subtree.sh: split/join git repositories in subdirectories of this one
#
# Copyright (C) 2009 Avery Pennarun <apenwarr@gmail.com>
#
# With no arguments at all, behave as if -h had been given.
if [ $# -eq 0 ]; then
	set -- -h
fi
# Option specification consumed by "git rev-parse --parseopt": usage lines,
# a "--" separator, then one option per line.  Lines starting with a space
# are group headers in the generated help text.
OPTS_SPEC="\
git subtree add --prefix=<prefix> <commit>
git subtree merge --prefix=<prefix> <commit>
git subtree pull --prefix=<prefix> <repository> <refspec...>
git subtree split --prefix=<prefix> <commit...>
--
h,help show the help
q quiet
d show debug messages
P,prefix= the name of the subdir to split out
m,message= use the given message as the commit message for the merge commit
 options for 'split'
annotate= add a prefix to commit message of new commits
b,branch= create a new branch from the split subtree
ignore-joins ignore prior --rejoin commits
onto= try connecting new tree to an existing one
rejoin merge the new branch back into HEAD
 options for 'add', 'merge', and 'pull'
squash merge subtree changes as a single commit
"
# The command substitution must be quoted: unquoted, the shell word-splits
# the generated "set -- ..." text before eval sees it, which collapses runs
# of whitespace and line breaks inside option values such as -m messages.
# On a parse error the substitution yields "exit <status>" instead.
eval "$(echo "$OPTS_SPEC" | git rev-parse --parseopt -- "$@" || echo exit $?)"
# Make git's helper programs reachable, then load the shared shell helpers
# and insist on running inside a work tree.
PATH=$(git --exec-path):$PATH
. git-sh-setup
require_work_tree
34
# Option state.  Every variable read by the option parser and the commands is
# reset here so that a value inherited from the caller's environment can never
# be mistaken for a command-line option.  prefix is included for that reason:
# it is only ever assigned by -P / --no-prefix.
quiet=
branch=
debug=
command=
onto=
rejoin=
ignore_joins=
annotate=
squash=
message=
prefix=
45
# Print the arguments, joined by spaces, as one line on stderr.
# Does nothing unless $debug is non-empty.
debug()
{
	if [ -n "$debug" ]; then
		# printf rather than echo: a message consisting of "-n" or "-e"
		# must be printed, not interpreted as an echo option.
		printf '%s\n' "$*" >&2
	fi
}
52
# Echo the arguments to stderr unless $quiet is non-empty.
# The arguments go straight to echo, so a leading -n suppresses the newline.
say()
{
	[ -z "$quiet" ] || return 0
	echo "$@" >&2
}
59
# Run the arguments as a command; if it fails, hand the command line to die
# prefixed with "assertion failed: ".
assert()
{
	"$@" || die "assertion failed: " "$@"
}
68
69
70#echo "Options: $*"
71
# Consume the options at the front of the positional parameters (already
# normalized by the parseopt step) up to and including the "--" separator.
# Options that take a value read it from the next parameter.
while [ $# -gt 0 ]; do
	opt="$1"
	shift
	case "$opt" in
	-q)
		quiet=1
		;;
	-d)
		debug=1
		;;
	--annotate)
		annotate="$1"
		shift
		;;
	--no-annotate)
		annotate=
		;;
	-b)
		branch="$1"
		shift
		;;
	-P)
		prefix="$1"
		shift
		;;
	-m)
		message="$1"
		shift
		;;
	--no-prefix)
		prefix=
		;;
	--onto)
		onto="$1"
		shift
		;;
	--no-onto)
		onto=
		;;
	--rejoin)
		rejoin=1
		;;
	--no-rejoin)
		rejoin=
		;;
	--ignore-joins)
		ignore_joins=1
		;;
	--no-ignore-joins)
		ignore_joins=
		;;
	--squash)
		squash=1
		;;
	--no-squash)
		squash=
		;;
	--)
		# end of options; what is left is the command and its arguments
		break
		;;
	*)
		die "Unexpected option: $opt"
		;;
	esac
done
96
# The first remaining parameter is the subcommand; the rest are its arguments.
command="$1"
shift

# Only 'split' falls back to HEAD when no revision is given.
default=
case "$command" in
add|merge|pull)
	;;
split)
	default="--default HEAD"
	;;
*)
	die "Unknown command '$command'"
	;;
esac

[ -n "$prefix" ] || die "You must provide the --prefix option."

# 'add' needs the prefix to be absent; every other command needs it present.
if [ "$command" = "add" ]; then
	if [ -e "$prefix" ]; then
		die "prefix '$prefix' already exists."
	fi
elif [ ! -e "$prefix" ]; then
	die "'$prefix' does not exist; use 'git subtree add'"
fi

# dirname of "<prefix>/." yields the prefix without trailing slashes.
dir=$(dirname "$prefix/.")

# 'pull' passes its arguments to git fetch instead, so they are not parsed
# as revisions here.
case "$command" in
pull)
	;;
*)
	# $default is deliberately unquoted: it is either empty or two words.
	revs=$(git rev-parse $default --revs-only "$@") || exit $?
	dirs=$(git rev-parse --no-revs --no-flags "$@") || exit $?
	[ -z "$dirs" ] || die "Error: Use --prefix instead of bare filenames."
	;;
esac

debug "command: {$command}"
debug "quiet: {$quiet}"
debug "revs: {$revs}"
debug "dir: {$dir}"
debug "opts: {$*}"
debug
132
# Point $cachedir at a per-process directory under $GIT_DIR/subtree-cache and
# make sure it exists and is empty.  Dies if it cannot be removed or created.
cache_setup()
{
	cachedir="$GIT_DIR/subtree-cache/$$"
	if ! rm -rf "$cachedir"; then
		die "Can't delete old cachedir: $cachedir"
	fi
	if ! mkdir -p "$cachedir"; then
		die "Can't create new cachedir: $cachedir"
	fi
	debug "Using cachedir: $cachedir" >&2
}
140
# For each key given as an argument, print the first line of the cache file
# $cachedir/<key>, one result per line.  Keys without a readable cache file
# are skipped silently.
cache_get()
{
	# locals keep the caller's own oldrev/newrev intact
	local oldrev newrev
	for oldrev in "$@"; do
		if [ -r "$cachedir/$oldrev" ]; then
			read -r newrev <"$cachedir/$oldrev"
			printf '%s\n' "$newrev"
		fi
	done
}
150
# Record the mapping $1 -> $2 by writing $2 into the file $cachedir/$1.
# Overwriting an existing entry is an error (die), except for the special
# keys "latest_old" and "latest_new", which may be rewritten freely.
cache_set()
{
	local oldrev="$1"
	local newrev="$2"
	# separate tests joined with && instead of the obsolescent -a operator
	if [ "$oldrev" != "latest_old" ] &&
	   [ "$oldrev" != "latest_new" ] &&
	   [ -e "$cachedir/$oldrev" ]; then
		die "cache for $oldrev already exists!"
	fi
	printf '%s\n' "$newrev" >"$cachedir/$oldrev"
}
162
# Return 0 if "git rev-parse" accepts $1, 1 otherwise.  All git output is
# discarded.
rev_exists()
{
	git rev-parse "$1" >/dev/null 2>&1 || return 1
}
171
# Return 0 when every commit reachable from branch $2 is also reachable from
# commit $1, i.e. "git rev-list <branch> ^<commit>" lists nothing.
# Return 1 otherwise, including when either git command fails: an empty
# result caused by an error must not be mistaken for "nothing missing".
rev_is_descendant_of_branch()
{
	local newrev="$1"
	local branch="$2"
	local branch_hash match
	branch_hash=$(git rev-parse "$branch") || return 1
	match=$(git rev-list -1 "$branch_hash" "^$newrev") || return 1

	[ -z "$match" ]
}
185
# Print "^<rev>^" (an exclusion of the parent of $1, for use in a rev-list)
# when that parent exists.  A commit without a parent has nothing to exclude,
# so nothing is printed in that case.  Always returns success.
try_remove_previous()
{
	rev_exists "$1^" || return 0
	echo "^$1^"
}
195
# Scan the history of HEAD for commits whose message carries a
# "git-subtree-dir:" trailer for directory $1, and print "<commit> <split>"
# for the first one listed that also has a "git-subtree-split:" trailer.
# If that commit has a "git-subtree-mainline:" trailer as well (a rejoin),
# the split commit is printed in both positions.  Prints nothing when no
# such commit is found.
find_latest_squash()
{
	local dir="$1"
	local sq= main= sub=
	local a b junk
	# log the directory actually being searched (the argument)
	debug "Looking for latest squash ($dir)..."
	git log --grep="^git-subtree-dir: $dir/*\$" \
		--pretty=format:'START %H%n%s%n%n%b%nEND%n' HEAD |
	while read -r a b junk; do
		debug "$a $b $junk"
		debug "{{$sq/$main/$sub}}"
		case "$a" in
		START) sq="$b" ;;
		git-subtree-mainline:) main="$b" ;;
		git-subtree-split:) sub="$b" ;;
		END)
			if [ -n "$sub" ]; then
				if [ -n "$main" ]; then
					# a rejoin commit?
					# Pretend its sub was a squash.
					sq="$sub"
				fi
				debug "Squash found: $sq $sub"
				echo "$sq" "$sub"
				break
			fi
			# no split trailer in this commit; start over for the next
			sq=
			main=
			sub=
			;;
		esac
	done
}
230
# Scan the history of the revisions in $2 for commits whose message carries a
# "git-subtree-dir:" trailer for directory $1 and seed the cache from them:
#   - split trailer only (a squash commit): cache <commit> -> <split>
#   - mainline and split trailers (a rejoin): cache <mainline> -> <split> and
#     print whatever try_remove_previous emits for both, so the caller can
#     exclude history before the rejoin.
find_existing_splits()
{
	local dir="$1"
	local revs="$2"
	local sq= main= sub=
	local a b junk
	debug "Looking for prior splits..."
	# $revs is deliberately unquoted: it may hold several revisions.
	git log --grep="^git-subtree-dir: $dir/*\$" \
		--pretty=format:'START %H%n%s%n%n%b%nEND%n' $revs |
	while read -r a b junk; do
		case "$a" in
		START) sq="$b" ;;
		git-subtree-mainline:) main="$b" ;;
		git-subtree-split:) sub="$b" ;;
		END)
			debug " Main is: '$main'"
			if [ -z "$main" ] && [ -n "$sub" ]; then
				# squash commits refer to a subtree
				debug " Squash: $sq from $sub"
				cache_set "$sq" "$sub"
			fi
			if [ -n "$main" ] && [ -n "$sub" ]; then
				debug " Prior: $main -> $sub"
				cache_set "$main" "$sub"
				try_remove_previous "$main"
				try_remove_previous "$sub"
			fi
			main=
			sub=
			;;
		esac
	done
}
264
# Create a new commit with tree $2 and parent options $3 (a string such as
# "-p <rev> -p <rev>") that reuses the author, committer and message of
# commit $1, with $annotate prepended to the message.  The new commit id is
# whatever "git commit-tree" prints.  Dies if the copy fails.
copy_commit()
{
	# We're going to set some environment vars here, so
	# do it in a subshell to get rid of them safely later
	debug copy_commit "{$1}" "{$2}" "{$3}"
	# %aD/%cD (RFC 2822) rather than %ad/%cd: the latter follow --date and
	# log.date, so a user setting could turn the dates into something
	# commit-tree misreads.
	git log -1 --pretty=format:'%an%n%ae%n%aD%n%cn%n%ce%n%cD%n%s%n%n%b' "$1" |
	(
		# -r keeps backslashes in names and addresses intact
		read -r GIT_AUTHOR_NAME
		read -r GIT_AUTHOR_EMAIL
		read -r GIT_AUTHOR_DATE
		read -r GIT_COMMITTER_NAME
		read -r GIT_COMMITTER_EMAIL
		read -r GIT_COMMITTER_DATE
		export GIT_AUTHOR_NAME \
			GIT_AUTHOR_EMAIL \
			GIT_AUTHOR_DATE \
			GIT_COMMITTER_NAME \
			GIT_COMMITTER_EMAIL \
			GIT_COMMITTER_DATE
		# printf, so an annotation that looks like an echo option is
		# still emitted verbatim.  $3 is deliberately unquoted: it
		# holds zero or more "-p <rev>" pairs.
		(printf '%s' "$annotate"; cat) |
			git commit-tree "$2" $3 # reads the rest of stdin
	) || die "Can't copy commit $1"
}
288
# Print the commit message for a non-squashed 'add': a subject line ($message
# if set, otherwise a default naming directory $1 and commit $3), a blank
# line, then the git-subtree-dir / -mainline ($2) / -split ($3) trailers.
add_msg()
{
	local dir="$1"
	local latest_old="$2"
	local latest_new="$3"
	local commit_message
	if [ -n "$message" ]; then
		commit_message="$message"
	else
		commit_message="Add '$dir/' from commit '$latest_new'"
	fi
	# printf instead of a <<- here-document, which only works while the
	# body and terminator stay indented with tabs.
	printf '%s\n\ngit-subtree-dir: %s\ngit-subtree-mainline: %s\ngit-subtree-split: %s\n' \
		"$commit_message" "$dir" "$latest_old" "$latest_new"
}
307
# Print the commit message for a squashed 'add': $message if set, otherwise
# a default naming commit $1 and directory $2.
add_squashed_msg()
{
	if [ -n "$message" ]; then
		# printf: a user message such as "-e" or "-n" must be printed,
		# not taken as an echo option.
		printf '%s\n' "$message"
	else
		printf '%s\n' "Merge commit '$1' as '$2'"
	fi
}
316
# Print the commit message for a 'split --rejoin' merge: a subject line
# ($message if set, otherwise a default naming directory $1 and commit $3),
# a blank line, then the git-subtree-dir / -mainline ($2) / -split ($3)
# trailers.
rejoin_msg()
{
	local dir="$1"
	local latest_old="$2"
	local latest_new="$3"
	local commit_message
	if [ -n "$message" ]; then
		commit_message="$message"
	else
		commit_message="Split '$dir/' into commit '$latest_new'"
	fi
	# printf instead of a <<- here-document, which only works while the
	# body and terminator stay indented with tabs.
	printf '%s\n\ngit-subtree-dir: %s\ngit-subtree-mainline: %s\ngit-subtree-split: %s\n' \
		"$commit_message" "$dir" "$latest_old" "$latest_new"
}
335
# Print the message for a squash commit of directory $1 that moves the
# subtree from commit $2 (may be empty for the first squash) to commit $3.
# With a previous commit, the message lists the commits gained and, marked
# "REVERT:", the commits only reachable from the old side.  The message ends
# with the git-subtree-dir and git-subtree-split trailers.
squash_msg()
{
	# locals: this function must not overwrite the script-wide $dir
	local dir="$1"
	local oldsub="$2"
	local newsub="$3"
	local newsub_short oldsub_short
	newsub_short=$(git rev-parse --short "$newsub")

	if [ -n "$oldsub" ]; then
		oldsub_short=$(git rev-parse --short "$oldsub")
		echo "Squashed '$dir/' changes from $oldsub_short..$newsub_short"
		echo
		git log --pretty=tformat:'%h %s' "$oldsub..$newsub"
		git log --pretty=tformat:'REVERT: %h %s' "$newsub..$oldsub"
	else
		echo "Squashed '$dir/' content from commit $newsub_short"
	fi

	echo
	echo "git-subtree-dir: $dir"
	echo "git-subtree-split: $newsub"
}
357
# Print the top-level tree id (%T) of commit $1.  Exits with git's status if
# "git log" fails.
toptree_for_commit()
{
	# local: do not overwrite the script-wide $commit
	local commit="$1"
	git log -1 --pretty=format:'%T' "$commit" -- || exit $?
}
363
# Print the tree id that "git ls-tree" reports for path $2 in commit $1.
# Only the first entry is considered; it must be named exactly $2 and be of
# type "tree" (both checked with assert).  Prints nothing when ls-tree
# produces no entry.
subtree_for_commit()
{
	local commit="$1"
	local dir="$2"
	local mode type tree name
	git ls-tree "$commit" -- "$dir" |
	while read -r mode type tree name; do
		assert [ "$name" = "$dir" ]
		assert [ "$type" = "tree" ]
		printf '%s\n' "$tree"
		break
	done
}
376
# Usage: tree_changed <tree> <parent>...
# Return 1 (unchanged) only when exactly one parent is given and its
# top-level tree equals <tree>; return 0 (changed) in every other case.
tree_changed()
{
	tree=$1
	shift
	# weird parents, consider it changed
	[ $# -eq 1 ] || return 0
	ptree=$(toptree_for_commit $1)
	[ "$ptree" != "$tree" ]
}
392
# Create a squash commit whose tree is the top-level tree of commit $3 and
# whose message comes from squash_msg for the script-wide $dir.
#   $1  previous squash commit; becomes the parent when non-empty
#   $2  subtree commit the previous squash referred to
#   $3  subtree commit to squash
# Prints what "git commit-tree" prints; exits on failure.
new_squash_commit()
{
	local old="$1"
	local oldsub="$2"
	local newsub="$3"
	local tree
	tree=$(toptree_for_commit "$newsub") || exit $?
	if [ -n "$old" ]; then
		squash_msg "$dir" "$oldsub" "$newsub" |
			git commit-tree "$tree" -p "$old" || exit $?
	else
		squash_msg "$dir" "" "$newsub" |
			git commit-tree "$tree" || exit $?
	fi
}
407
# Decide what commit represents revision $1 in the split history.
#   $1  revision being processed
#   $2  subtree tree id of that revision (must be non-empty)
#   $3  whitespace-separated list of already-rewritten parents
# If a parent has exactly this tree, that parent is printed and no commit is
# created (when several match, the last one wins).  Otherwise the revision is
# copied with copy_commit onto the de-duplicated parents and the result of
# copy_commit is printed.  Parents whose top-level tree cannot be determined
# are ignored.
copy_or_skip()
{
	local rev="$1"
	local tree="$2"
	local newparents="$3"
	local identical= p= gotparents=
	local parent ptree gp is_new
	assert [ -n "$tree" ]

	for parent in $newparents; do
		ptree=$(toptree_for_commit "$parent") || exit $?
		[ -z "$ptree" ] && continue
		if [ "$ptree" = "$tree" ]; then
			# an identical parent could be used in place of this rev.
			identical="$parent"
		fi

		# sometimes both old parents map to the same newparent;
		# eliminate duplicates
		is_new=1
		for gp in $gotparents; do
			if [ "$gp" = "$parent" ]; then
				is_new=
				break
			fi
		done
		if [ -n "$is_new" ]; then
			gotparents="$gotparents $parent"
			p="$p -p $parent"
		fi
	done

	if [ -n "$identical" ]; then
		printf '%s\n' "$identical"
	else
		copy_commit "$rev" "$tree" "$p" || exit $?
	fi
}
450
# Die unless "git diff-index" reports no difference against HEAD, first
# without and then with --cached.
ensure_clean()
{
	git diff-index HEAD --exit-code --quiet ||
		die "Working tree has modifications. Cannot add."
	git diff-index --cached HEAD --exit-code --quiet ||
		die "Index has modifications. Cannot add."
}
460
# 'add' command: read the tree of the single revision in $revs into the index
# under $dir, check it out, and record the result as a commit on top of HEAD.
# With --squash the subtree history is first collapsed into one squash
# commit, which then becomes the second parent.  HEAD is moved to the new
# commit with "git reset".
cmd_add()
{
	if [ -e "$dir" ]; then
		die "'$dir' already exists. Cannot add."
	fi
	ensure_clean

	# $revs is deliberately unquoted so it can be counted word by word.
	set -- $revs
	if [ $# -ne 1 ]; then
		die "You must provide exactly one revision. Got: '$revs'"
	fi
	rev="$1"

	debug "Adding $dir as '$rev'..."
	git read-tree --prefix="$dir" "$rev" || exit $?
	git checkout -- "$dir" || exit $?
	tree=$(git write-tree) || exit $?

	headrev=$(git rev-parse HEAD) || exit $?
	# HEAD is only recorded as a parent when it differs from the added
	# revision.
	if [ -n "$headrev" ] && [ "$headrev" != "$rev" ]; then
		headp="-p $headrev"
	else
		headp=
	fi

	# $headp is deliberately unquoted below: it is empty or "-p <rev>".
	if [ -n "$squash" ]; then
		rev=$(new_squash_commit "" "" "$rev") || exit $?
		commit=$(add_squashed_msg "$rev" "$dir" |
			git commit-tree "$tree" $headp -p "$rev") || exit $?
	else
		commit=$(add_msg "$dir" "$headrev" "$rev" |
			git commit-tree "$tree" $headp -p "$rev") || exit $?
	fi
	git reset "$commit" || exit $?

	say "Added dir '$dir'"
}
498
# 'split' command: walk the history of $revs oldest-first and build a
# parallel history that contains only the contents of $dir, using the cache
# to map each original commit to its rewritten counterpart.  Prints the id of
# the newest rewritten commit on stdout and exits 0.  Optionally merges the
# result back into HEAD (--rejoin) and/or points a branch at it (--branch).
cmd_split()
{
	local cr
	debug "Splitting $dir..."
	cache_setup || exit $?

	if [ -n "$onto" ]; then
		debug "Reading history for --onto=$onto..."
		git rev-list $onto |
		while read -r rev; do
			# the 'onto' history is already just the subdir, so
			# any parent we find there can be used verbatim
			debug " cache: $rev"
			cache_set "$rev" "$rev"
		done
	fi

	if [ -n "$ignore_joins" ]; then
		unrevs=
	else
		unrevs="$(find_existing_splits "$dir" "$revs")"
	fi

	# We can't restrict rev-list to only $dir here, because some of our
	# parents have the $dir contents the root, and those won't match.
	# (and rev-list --follow doesn't seem to solve this)
	grl='git rev-list --reverse --parents $revs $unrevs'
	revmax=$(eval "$grl" | wc -l)
	# some wc implementations pad the count with blanks; normalize it
	revmax=$((revmax + 0))
	revcount=0
	createcount=0
	# The progress line ends in a carriage return so each update overwrites
	# the previous one.  It is generated here rather than embedded as a raw
	# control character in the source.
	cr=$(printf '\r')
	eval "$grl" |
	while read -r rev parents; do
		revcount=$(($revcount + 1))
		say -n "$revcount/$revmax ($createcount)$cr"
		debug "Processing commit: $rev"
		exists=$(cache_get "$rev")
		if [ -n "$exists" ]; then
			debug " prior: $exists"
			continue
		fi
		createcount=$(($createcount + 1))
		debug " parents: $parents"
		# $parents is deliberately unquoted: one cache lookup per parent
		newparents=$(cache_get $parents)
		debug " newparents: $newparents"

		tree=$(subtree_for_commit "$rev" "$dir")
		debug " tree is: $tree"

		# ugly. is there no better way to tell if this is a subtree
		# vs. a mainline commit? Does it matter?
		if [ -z "$tree" ]; then
			cache_set "$rev" "$rev"
			continue
		fi

		newrev=$(copy_or_skip "$rev" "$tree" "$newparents") || exit $?
		debug " newrev is: $newrev"
		cache_set "$rev" "$newrev"
		cache_set latest_new "$newrev"
		cache_set latest_old "$rev"
	done || exit $?
	latest_new=$(cache_get latest_new)
	if [ -z "$latest_new" ]; then
		die "No new revisions were found"
	fi

	if [ -n "$rejoin" ]; then
		debug "Merging split branch into HEAD..."
		latest_old=$(cache_get latest_old)
		git merge -s ours \
			-m "$(rejoin_msg "$dir" "$latest_old" "$latest_new")" \
			"$latest_new" >&2 || exit $?
	fi
	if [ -n "$branch" ]; then
		if rev_exists "refs/heads/$branch"; then
			if ! rev_is_descendant_of_branch "$latest_new" "$branch"; then
				die "Branch '$branch' is not an ancestor of commit '$latest_new'."
			fi
			action='Updated'
		else
			action='Created'
		fi
		git update-ref -m 'subtree split' "refs/heads/$branch" "$latest_new" || exit $?
		say "$action branch '$branch'"
	fi
	echo "$latest_new"
	exit 0
}
586
# 'merge' command: merge the single revision in $revs into HEAD with the
# subtree strategy.  With --squash, the revision is first turned into a new
# squash commit on top of the latest recorded squash for $dir; if the subtree
# is already at that revision the command exits successfully without merging.
cmd_merge()
{
	ensure_clean

	# $revs is deliberately unquoted so it can be counted word by word.
	set -- $revs
	if [ $# -ne 1 ]; then
		die "You must provide exactly one revision. Got: '$revs'"
	fi
	rev="$1"

	if [ -n "$squash" ]; then
		first_split="$(find_latest_squash "$dir")"
		if [ -z "$first_split" ]; then
			die "Can't squash-merge: '$dir' was never added."
		fi
		# "--" so the words can never be taken for options to set
		set -- $first_split
		old=$1
		sub=$2
		if [ "$sub" = "$rev" ]; then
			say "Subtree is already at commit $rev."
			exit 0
		fi
		new=$(new_squash_commit "$old" "$sub" "$rev") || exit $?
		debug "New squash commit: $new"
		rev="$new"
	fi

	if [ -n "$message" ]; then
		git merge -s subtree --message="$message" "$rev"
	else
		git merge -s subtree "$rev"
	fi
}
620
# 'pull' command: run "git fetch" with the given arguments, then merge
# FETCH_HEAD through cmd_merge.  Exits with fetch's status if the fetch fails.
cmd_pull()
{
	ensure_clean
	if git fetch "$@"; then
		revs=FETCH_HEAD
		cmd_merge
	else
		exit $?
	fi
}
628
# Run the handler for the selected subcommand with the remaining arguments.
"cmd_${command}" "$@"