Code

allow using --branch with existing branches if it makes sense
[git.git] / git-subtree.sh
#!/bin/bash
#
# git-subtree.sh: split/join git repositories in subdirectories of this one
#
# Copyright (C) 2009 Avery Pennarun <apenwarr@gmail.com>
#

# With no arguments at all, behave as if -h had been given.
if [ $# -eq 0 ]; then
    set -- -h
fi

# Usage text and option table handed to `git rev-parse --parseopt` below.
OPTS_SPEC="\
git subtree add   --prefix=<prefix> <commit>
git subtree merge --prefix=<prefix> <commit>
git subtree pull  --prefix=<prefix> <repository> <refspec...>
git subtree split --prefix=<prefix> <commit...>
--
h,help        show the help
q             quiet
d             show debug messages
p,prefix=     the name of the subdir to split out
m,message=    use the given message as the commit message for the merge commit
 options for 'split'
annotate=     add a prefix to commit message of new commits
b,branch=     create a new branch from the split subtree
ignore-joins  ignore prior --rejoin commits
onto=         try connecting new tree to an existing one
rejoin        merge the new branch back into HEAD
 options for 'add', 'merge', and 'pull'
squash        merge subtree changes as a single commit
"

# The substitution is quoted so that the shell code printed by --parseopt is
# evaluated verbatim; left unquoted it is word-split and re-joined first,
# which collapses runs of whitespace inside option values such as -m.
eval "$(echo "$OPTS_SPEC" | git rev-parse --parseopt -- "$@" || echo exit $?)"

PATH=$(git --exec-path):$PATH
. git-sh-setup
require_work_tree

# Option state, filled in by the option-parsing loop further down.
quiet=
branch=
debug=
command=
onto=
rejoin=
ignore_joins=
annotate=
squash=
message=
# Start empty so a stray 'prefix' environment variable cannot stand in for
# a missing --prefix option.
prefix=
# debug ARGS...
# Echo ARGS to stderr, but only when $debug is non-empty (set by -d).
debug()
{
	if [ -n "$debug" ]; then
		echo "$@" >&2
	fi
}
# say ARGS...
# Echo ARGS to stderr unless $quiet is non-empty (set by -q).  The arguments
# go straight to echo, so a leading -n suppresses the trailing newline.
say()
{
	if [ -z "$quiet" ]; then
		echo "$@" >&2
	fi
}
# assert COMMAND [ARGS...]
# Run COMMAND; if it fails, abort through die with the failed command
# included in the message.
assert()
{
	if "$@"; then
		:
	else
		die "assertion failed: " "$@"
	fi
}
#echo "Options: $*"

# Walk the option list and record each setting, stopping once the "--"
# separator has been consumed.
while [ $# -gt 0 ]; do
	opt="$1"
	shift
	case "$opt" in
		-q) quiet=1 ;;
		-d) debug=1 ;;
		--annotate) annotate="$1"; shift ;;
		--no-annotate) annotate= ;;
		-b) branch="$1"; shift ;;
		-p) prefix="$1"; shift ;;
		-m) message="$1"; shift ;;
		--no-prefix) prefix= ;;
		--onto) onto="$1"; shift ;;
		--no-onto) onto= ;;
		--rejoin) rejoin=1 ;;
		--no-rejoin) rejoin= ;;
		--ignore-joins) ignore_joins=1 ;;
		--no-ignore-joins) ignore_joins= ;;
		--squash) squash=1 ;;
		--no-squash) squash= ;;
		--) break ;;
		*) die "Unexpected option: $opt" ;;
	esac
done

# The first remaining word is the subcommand.  Only 'split' falls back to
# HEAD when no revision is named.
command="$1"
shift
case "$command" in
	add|merge|pull) default= ;;
	split) default="--default HEAD" ;;
	*) die "Unknown command '$command'" ;;
esac

if [ -z "$prefix" ]; then
	die "You must provide the --prefix option."
fi
# dirname of "<prefix>/." yields the prefix without trailing slashes.
dir="$(dirname "$prefix/.")"

# 'pull' hands its arguments to git fetch instead, so only the other
# commands have theirs interpreted as revisions here.
if [ "$command" != "pull" ]; then
	# $default is deliberately unquoted: it is either empty or two words.
	revs=$(git rev-parse $default --revs-only "$@") || exit $?
	dirs="$(git rev-parse --no-revs --no-flags "$@")" || exit $?
	if [ -n "$dirs" ]; then
		die "Error: Use --prefix instead of bare filenames."
	fi
fi

debug "command: {$command}"
debug "quiet: {$quiet}"
debug "revs: {$revs}"
debug "dir: {$dir}"
debug "opts: {$*}"
debug
# cache_setup
# Create a fresh, empty cache directory for this process under
# $GIT_DIR/subtree-cache and record its path in the global $cachedir.
# Dies if the directory cannot be removed or created.
cache_setup()
{
	cachedir="$GIT_DIR/subtree-cache/$$"
	rm -rf "$cachedir" || die "Can't delete old cachedir: $cachedir"
	mkdir -p "$cachedir" || die "Can't create new cachedir: $cachedir"
	debug "Using cachedir: $cachedir" >&2
}
# cache_get KEY...
# For each KEY that has a readable entry in $cachedir, print the first line
# stored there.  Keys without an entry are skipped silently.
cache_get()
{
	local oldrev newrev
	# "$@" rather than an unquoted $*, so keys are never glob-expanded.
	for oldrev in "$@"; do
		if [ -r "$cachedir/$oldrev" ]; then
			read -r newrev <"$cachedir/$oldrev"
			echo "$newrev"
		fi
	done
}
# cache_set KEY VALUE
# Store VALUE under KEY in $cachedir.  The keys "latest_old" and
# "latest_new" may be overwritten; for any other key an existing entry is
# an error and aborts through die.
cache_set()
{
	local oldrev="$1"
	local newrev="$2"
	if [ "$oldrev" != "latest_old" ] &&
	   [ "$oldrev" != "latest_new" ] &&
	   [ -e "$cachedir/$oldrev" ]; then
		die "cache for $oldrev already exists!"
	fi
	echo "$newrev" >"$cachedir/$oldrev"
}
# rev_exists REV
# Succeed when git can resolve REV to an object name, fail otherwise.
# All output from git is discarded.
rev_exists()
{
	# --verify makes rev-parse insist on a single resolvable revision
	# instead of also accepting a path in the working tree.
	git rev-parse --verify "$1" >/dev/null 2>&1
}
# rev_is_descendant_of_branch REV BRANCH
# Succeed when the commit BRANCH resolves to appears in the history listed
# by `git rev-list REV`; fail otherwise, including when BRANCH cannot be
# resolved at all.
rev_is_descendant_of_branch()
{
	local newrev="$1"
	local branch="$2"
	local branch_hash

	branch_hash=$(git rev-parse "$branch") || return 1
	# An empty pattern would match every line of the rev-list output.
	[ -n "$branch_hash" ] || return 1

	# -F -x: compare whole lines literally instead of as a regex substring.
	git rev-list "$newrev" | grep -q -F -x -e "$branch_hash"
}
# try_remove_previous REV
# Print "^REV^" (an exclusion of REV's first parent, for use as a rev-list
# argument) when that parent exists.  A commit without a parent has nothing
# to exclude, so nothing is printed in that case.
try_remove_previous()
{
	if rev_exists "$1^"; then
		echo "^$1^"
	fi
}
# find_latest_squash DIR
# Scan the log of HEAD for commits whose message carries a
# "git-subtree-dir: DIR" trailer and print "<commit> <split>" for the first
# one that also has a git-subtree-split trailer.  If that commit has a
# git-subtree-mainline trailer as well (a rejoin), the split commit is
# printed in both positions.  Prints nothing when no such commit is found.
find_latest_squash()
{
	local dir="$1"
	local sq= main= sub= a b junk
	debug "Looking for latest squash ($dir)..."
	git log --grep="^git-subtree-dir: $dir/*\$" \
		--pretty=format:'START %H%n%s%n%n%b%nEND%n' HEAD |
	# -r: a message line ending in a backslash must not be joined with
	# the next line, or an END marker could be swallowed.
	while read -r a b junk; do
		debug "$a $b $junk"
		debug "{{$sq/$main/$sub}}"
		case "$a" in
			START) sq="$b" ;;
			git-subtree-mainline:) main="$b" ;;
			git-subtree-split:) sub="$b" ;;
			END)
				if [ -n "$sub" ]; then
					if [ -n "$main" ]; then
						# a rejoin commit?
						# Pretend its sub was a squash.
						sq="$sub"
					fi
					debug "Squash found: $sq $sub"
					echo "$sq" "$sub"
					break
				fi
				sq=
				main=
				sub=
				;;
		esac
	done
}
# find_existing_splits DIR REVS
# Scan the log of REVS for commits carrying a "git-subtree-dir: DIR"
# trailer and seed the cache from them:
#   - split trailer only (a squash): cache <commit> -> <split>;
#   - mainline and split trailers (a rejoin): cache <mainline> -> <split>
#     and print, via try_remove_previous, exclusions for both commits.
# REVS is expanded unquoted on purpose so it may hold several revisions.
find_existing_splits()
{
	debug "Looking for prior splits..."
	local dir="$1"
	local revs="$2"
	local sq= main= sub= a b junk
	git log --grep="^git-subtree-dir: $dir/*\$" \
		--pretty=format:'START %H%n%s%n%n%b%nEND%n' $revs |
	# -r: keep backslashes in commit messages from joining lines.
	while read -r a b junk; do
		case "$a" in
			START) sq="$b" ;;
			git-subtree-mainline:) main="$b" ;;
			git-subtree-split:) sub="$b" ;;
			END)
				debug "  Main is: '$main'"
				if [ -z "$main" ] && [ -n "$sub" ]; then
					# squash commits refer to a subtree
					debug "  Squash: $sq from $sub"
					cache_set "$sq" "$sub"
				fi
				if [ -n "$main" ] && [ -n "$sub" ]; then
					debug "  Prior: $main -> $sub"
					cache_set "$main" "$sub"
					try_remove_previous "$main"
					try_remove_previous "$sub"
				fi
				main=
				sub=
				;;
		esac
	done
}
# copy_commit REV TREE PARENT_ARGS
# Create a new commit with `git commit-tree TREE PARENT_ARGS`, reusing
# REV's author and committer identity and dates, and REV's message with
# $annotate put in front.  The new commit id is printed by git commit-tree.
# PARENT_ARGS is a string such as "-p <a> -p <b>" and is word-split on
# purpose.  Dies if the commit cannot be created.
copy_commit()
{
	# We're going to set some environment vars here, so
	# do it in a subshell to get rid of them safely later
	debug copy_commit "{$1}" "{$2}" "{$3}"
	git log -1 --pretty=format:'%an%n%ae%n%ad%n%cn%n%ce%n%cd%n%s%n%n%b' "$1" |
	(
		# -r keeps backslashes in names and addresses intact.
		read -r GIT_AUTHOR_NAME
		read -r GIT_AUTHOR_EMAIL
		read -r GIT_AUTHOR_DATE
		read -r GIT_COMMITTER_NAME
		read -r GIT_COMMITTER_EMAIL
		read -r GIT_COMMITTER_DATE
		export  GIT_AUTHOR_NAME \
			GIT_AUTHOR_EMAIL \
			GIT_AUTHOR_DATE \
			GIT_COMMITTER_NAME \
			GIT_COMMITTER_EMAIL \
			GIT_COMMITTER_DATE
		# printf, unlike echo -n, never treats the annotation as an option.
		(printf '%s' "$annotate"; cat) |
		git commit-tree "$2" $3  # reads the rest of stdin
	) || die "Can't copy commit $1"
}
# add_msg DIR LATEST_OLD LATEST_NEW
# Print the commit message for 'add': $message when one was given, else a
# default subject, followed by a blank line and the git-subtree-dir,
# git-subtree-mainline and git-subtree-split trailers.
add_msg()
{
	local dir="$1"
	local latest_old="$2"
	local latest_new="$3"
	local commit_message
	if [ -n "$message" ]; then
		commit_message="$message"
	else
		commit_message="Add '$dir/' from commit '$latest_new'"
	fi
	# printf rather than a <<- here-document, which only works while the
	# body and terminator stay indented with literal tabs.
	printf '%s\n\ngit-subtree-dir: %s\ngit-subtree-mainline: %s\ngit-subtree-split: %s\n' \
		"$commit_message" "$dir" "$latest_old" "$latest_new"
}
# add_squashed_msg COMMIT DIR
# Print the commit message for a squashed 'add': $message when one was
# given, otherwise a default naming COMMIT and DIR.
add_squashed_msg()
{
	if [ -n "$message" ]; then
		echo "$message"
	else
		echo "Merge commit '$1' as '$2'"
	fi
}
# rejoin_msg DIR LATEST_OLD LATEST_NEW
# Print the commit message for the 'split --rejoin' merge: $message when
# one was given, else a default subject, followed by a blank line and the
# git-subtree-dir, git-subtree-mainline and git-subtree-split trailers.
rejoin_msg()
{
	local dir="$1"
	local latest_old="$2"
	local latest_new="$3"
	local commit_message
	if [ -n "$message" ]; then
		commit_message="$message"
	else
		commit_message="Split '$dir/' into commit '$latest_new'"
	fi
	# Emit $commit_message, not $message: otherwise the default subject
	# computed above is dropped and the message starts with a blank line.
	printf '%s\n\ngit-subtree-dir: %s\ngit-subtree-mainline: %s\ngit-subtree-split: %s\n' \
		"$commit_message" "$dir" "$latest_old" "$latest_new"
}
# squash_msg DIR OLDSUB NEWSUB
# Print the message for a squash commit.  With a non-empty OLDSUB the
# subject names the abbreviated OLDSUB..NEWSUB range and is followed by the
# one-line log of OLDSUB..NEWSUB, then the log of NEWSUB..OLDSUB with each
# line prefixed "REVERT: ".  With an empty OLDSUB only the abbreviated
# NEWSUB is named.  Both forms end with git-subtree-dir and
# git-subtree-split trailers.
squash_msg()
{
	local dir="$1"
	local oldsub="$2"
	local newsub="$3"
	local oldsub_short newsub_short
	newsub_short=$(git rev-parse --short "$newsub")

	if [ -n "$oldsub" ]; then
		oldsub_short=$(git rev-parse --short "$oldsub")
		echo "Squashed '$dir/' changes from $oldsub_short..$newsub_short"
		echo
		git log --pretty=tformat:'%h %s' "$oldsub..$newsub"
		git log --pretty=tformat:'REVERT: %h %s' "$newsub..$oldsub"
	else
		echo "Squashed '$dir/' content from commit $newsub_short"
	fi

	echo
	echo "git-subtree-dir: $dir"
	echo "git-subtree-split: $newsub"
}
# toptree_for_commit COMMIT
# Print the tree id of COMMIT as reported by git log's %T format.  If git
# fails, exit the current (sub)shell with git's status.
toptree_for_commit()
{
	local commit="$1"
	git log -1 --pretty=format:'%T' "$commit" -- || exit $?
}
# subtree_for_commit COMMIT DIR
# Print the id of the tree stored at DIR in COMMIT, taken from the first
# line of `git ls-tree COMMIT -- DIR`.  Asserts that the entry is named DIR
# and is a tree.  Prints nothing when ls-tree lists no entry.
subtree_for_commit()
{
	local commit="$1"
	local dir="$2"
	local mode type tree name
	git ls-tree "$commit" -- "$dir" |
	while read -r mode type tree name; do
		assert [ "$name" = "$dir" ]
		assert [ "$type" = "tree" ]
		echo "$tree"
		break
	done
}
# tree_changed TREE PARENT...
# Succeed (0) when TREE counts as changed: either the number of parents is
# not exactly one, or the single parent's top-level tree differs from TREE.
# Fail (1) when the single parent has the same tree.
tree_changed()
{
	local tree="$1"
	local ptree
	shift
	if [ $# -ne 1 ]; then
		return 0   # weird parents, consider it changed
	fi
	ptree=$(toptree_for_commit "$1")
	# status 0 = changed, 1 = not changed
	[ "$ptree" != "$tree" ]
}
# new_squash_commit OLD OLDSUB NEWSUB
# Create a squash commit whose tree is NEWSUB's top-level tree and whose
# message comes from squash_msg for the global $dir.  With a non-empty OLD
# the new commit gets OLD as its parent and the message describes
# OLDSUB..NEWSUB; otherwise it has no parent.  The new commit id is printed
# by git commit-tree.  Exits on any failure.
new_squash_commit()
{
	local old="$1"
	local oldsub="$2"
	local newsub="$3"
	local tree
	tree=$(toptree_for_commit "$newsub") || exit $?
	if [ -n "$old" ]; then
		squash_msg "$dir" "$oldsub" "$newsub" |
			git commit-tree "$tree" -p "$old" || exit $?
	else
		squash_msg "$dir" "" "$newsub" |
			git commit-tree "$tree" || exit $?
	fi
}
# copy_or_skip REV TREE NEWPARENTS
# Decide how REV is represented in the split history.  If one of the
# already-rewritten NEWPARENTS has exactly TREE as its top-level tree, print
# that parent (the last such one) so it stands in for REV.  Otherwise
# create a copy of REV through copy_commit with TREE and the de-duplicated
# parents, which prints the new commit id.
copy_or_skip()
{
	local rev="$1"
	local tree="$2"
	local newparents="$3"
	local identical= p= gotparents= parent ptree is_new gp
	assert [ -n "$tree" ]

	for parent in $newparents; do
		ptree=$(toptree_for_commit "$parent") || exit $?
		[ -z "$ptree" ] && continue
		if [ "$ptree" = "$tree" ]; then
			# an identical parent could be used in place of this rev.
			identical="$parent"
		fi

		# sometimes both old parents map to the same newparent;
		# eliminate duplicates
		is_new=1
		for gp in $gotparents; do
			if [ "$gp" = "$parent" ]; then
				is_new=
				break
			fi
		done
		if [ -n "$is_new" ]; then
			gotparents="$gotparents $parent"
			p="$p -p $parent"
		fi
	done

	if [ -n "$identical" ]; then
		echo "$identical"
	else
		copy_commit "$rev" "$tree" "$p" || exit $?
	fi
}
# ensure_clean
# Die unless `git diff-index` reports no difference from HEAD for both the
# working tree and the index.
ensure_clean()
{
	if ! git diff-index HEAD --exit-code --quiet; then
		die "Working tree has modifications.  Cannot add."
	fi
	if ! git diff-index --cached HEAD --exit-code --quiet; then
		die "Index has modifications.  Cannot add."
	fi
}
# cmd_add
# Implements 'git subtree add'.  Requires that $dir does not exist yet, that
# the tree is clean, and that $revs holds exactly one revision.  Reads that
# revision's tree into the index under $dir, checks it out, and creates a
# commit with HEAD and the revision as parents (the revision is replaced by
# a fresh squash commit when $squash is set), then resets to that commit.
cmd_add()
{
	if [ -e "$dir" ]; then
		die "'$dir' already exists.  Cannot add."
	fi
	ensure_clean

	set -- $revs
	if [ $# -ne 1 ]; then
		die "You must provide exactly one revision.  Got: '$revs'"
	fi
	rev="$1"

	debug "Adding $dir as '$rev'..."
	git read-tree --prefix="$dir" "$rev" || exit $?
	git checkout -- "$dir" || exit $?
	tree=$(git write-tree) || exit $?

	headrev=$(git rev-parse HEAD) || exit $?
	# Leave HEAD out of the parents when it is the added revision itself.
	if [ -n "$headrev" ] && [ "$headrev" != "$rev" ]; then
		headp="-p $headrev"
	else
		headp=
	fi

	# $headp is unquoted on purpose: it is either empty or "-p <rev>".
	if [ -n "$squash" ]; then
		rev=$(new_squash_commit "" "" "$rev") || exit $?
		commit=$(add_squashed_msg "$rev" "$dir" |
			 git commit-tree "$tree" $headp -p "$rev") || exit $?
	else
		commit=$(add_msg "$dir" "$headrev" "$rev" |
			 git commit-tree "$tree" $headp -p "$rev") || exit $?
	fi
	git reset "$commit" || exit $?

	say "Added dir '$dir'"
}
# cmd_split
# Implements 'git subtree split'.  Walks the commits selected by $revs
# (minus history already covered by earlier splits unless $ignore_joins is
# set), and for every commit that has a tree at $dir records a rewritten
# commit in the cache.  Optionally merges the result back into HEAD
# ($rejoin) and creates or updates refs/heads/$branch ($branch).  Prints the
# id of the newest rewritten commit on stdout and exits.
cmd_split()
{
	local cr
	debug "Splitting $dir..."
	cache_setup || exit $?

	if [ -n "$onto" ]; then
		debug "Reading history for --onto=$onto..."
		git rev-list $onto |
		while read rev; do
			# the 'onto' history is already just the subdir, so
			# any parent we find there can be used verbatim
			debug "  cache: $rev"
			cache_set $rev $rev
		done
	fi

	if [ -n "$ignore_joins" ]; then
		unrevs=
	else
		unrevs="$(find_existing_splits "$dir" "$revs")"
	fi

	# We can't restrict rev-list to only $dir here, because some of our
	# parents have the $dir contents the root, and those won't match.
	# (and rev-list --follow doesn't seem to solve this)
	grl='git rev-list --reverse --parents $revs $unrevs'
	revmax=$(eval "$grl" | wc -l)
	revcount=0
	createcount=0
	# Carriage return, so each progress line overwrites the previous one.
	cr=$(printf '\r')
	eval "$grl" |
	while read rev parents; do
		revcount=$(($revcount + 1))
		say -n "$revcount/$revmax ($createcount)$cr"
		debug "Processing commit: $rev"
		exists=$(cache_get $rev)
		if [ -n "$exists" ]; then
			debug "  prior: $exists"
			continue
		fi
		createcount=$(($createcount + 1))
		debug "  parents: $parents"
		newparents=$(cache_get $parents)
		debug "  newparents: $newparents"

		tree=$(subtree_for_commit $rev "$dir")
		debug "  tree is: $tree"

		# ugly.  is there no better way to tell if this is a subtree
		# vs. a mainline commit?  Does it matter?
		[ -z "$tree" ] && continue

		newrev=$(copy_or_skip "$rev" "$tree" "$newparents") || exit $?
		debug "  newrev is: $newrev"
		cache_set $rev $newrev
		cache_set latest_new $newrev
		cache_set latest_old $rev
	done || exit $?
	latest_new=$(cache_get latest_new)
	if [ -z "$latest_new" ]; then
		die "No new revisions were found"
	fi

	if [ -n "$rejoin" ]; then
		debug "Merging split branch into HEAD..."
		latest_old=$(cache_get latest_old)
		git merge -s ours \
			-m "$(rejoin_msg "$dir" "$latest_old" "$latest_new")" \
			$latest_new >&2 || exit $?
	fi
	if [ -n "$branch" ]; then
		if rev_exists "refs/heads/$branch"; then
			# Only move an existing branch forward along its own history.
			if ! rev_is_descendant_of_branch $latest_new $branch; then
				die "Branch '$branch' is not an ancestor of commit '$latest_new'."
			fi
			action='Updated'
		else
			action='Created'
		fi
		git update-ref -m 'subtree split' "refs/heads/$branch" $latest_new || exit $?
		say "$action branch '$branch'"
	fi
	echo $latest_new
	exit 0
}
# cmd_merge
# Implements 'git subtree merge'.  Requires a clean tree and exactly one
# revision in $revs.  With $squash set, the revision is first replaced by a
# new squash commit built on top of the latest squash found for $dir; if
# the subtree is already at the requested revision, say so and exit 0.
# Finally runs `git merge -s subtree` on the result.
cmd_merge()
{
	ensure_clean

	set -- $revs
	if [ $# -ne 1 ]; then
		die "You must provide exactly one revision.  Got: '$revs'"
	fi
	rev="$1"

	if [ -n "$squash" ]; then
		first_split="$(find_latest_squash "$dir")"
		if [ -z "$first_split" ]; then
			die "Can't squash-merge: '$dir' was never added."
		fi
		# "--" keeps the words from ever being parsed as options to set.
		set -- $first_split
		old=$1
		sub=$2
		if [ "$sub" = "$rev" ]; then
			say "Subtree is already at commit $rev."
			exit 0
		fi
		new=$(new_squash_commit "$old" "$sub" "$rev") || exit $?
		debug "New squash commit: $new"
		rev="$new"
	fi

	# Pass --message only when one was supplied; an unconditional
	# --message="" would replace git's own merge message with an empty one.
	if [ -n "$message" ]; then
		git merge -s subtree --message="$message" "$rev"
	else
		git merge -s subtree "$rev"
	fi
}
# cmd_pull REPOSITORY REFSPEC...
# Implements 'git subtree pull': after checking that the tree is clean,
# fetch with the given arguments and merge FETCH_HEAD through cmd_merge.
# Exits with git fetch's status if the fetch fails.
cmd_pull()
{
	ensure_clean
	git fetch "$@" || exit $?
	revs=FETCH_HEAD
	cmd_merge
}
# Run the handler for the selected subcommand, handing it the arguments
# left over after option parsing.
"cmd_$command" "$@"