summaryrefslogtreecommitdiff
path: root/bin/hstow
blob: c7f783edc1b0053ee1f95ec3ff112defccbb8328 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
#!/bin/sh

# hstow -- POSIX sh minimal reimplementation of GNU Stow for dotfiles
#
# Copyright (C) 2022-2023  Sean Whitton <spwhitton@spwhitton.name>
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or (at
# your option) any later version.
#
# This program is distributed in the hope that it will be useful, but
# WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
# General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program.  If not, see <http://www.gnu.org/licenses/>.

# The point of this script is to obtain minimally functional dotfiles
# handling in one's home directory even on machines that lack a Perl
# interpreter.  As such, many of GNU Stow's more advanced features are
# not reimplemented.  Git depends on Perl, for now, but my two methods
# for deploying my dotfiles to remote machines -- my INSINUATE-DOTFILES
# Consfigurator property and 'insinuate-dotfiles' shell script -- do not
# depend on having Git on the remote side.  See also 'bstraph' script.
#
# We completely skip filenames containing control characters, including
# newline and tab, as POSIX find(1) lacks -print0, and it's unlikely
# you'd need to stow any such files.
# Technique from <https://dwheeler.com/essays/filenames-in-shell.html>.

# Exit on unhandled errors (-e), disable pathname expansion (-f) and
# treat expansion of unset variables as an error (-u).
set -efu
# Split words on newline and tab only, never on spaces.
IFS="$(printf '\n\t')"
# Run every utility invoked below in the C locale.
export LC_ALL=C
# Shared helpers.  Presumably the source of fail, mkstemp, dir_contents,
# $tab and $cchars, none of which are defined in this file -- confirm.
. ~/src/dotfiles/lib-src/posix-defuns.sh

# readlink(1) is not POSIX, so we require an alternative.
# For simplicity, always use this even if readlink(1) is installed.
#
# Usage: ... | readlinks RESTC [ASSUME]
#
# Reads lines from stdin, each a path optionally followed by further
# tab-separated fields.  RESTC is the number of such further fields; it
# sizes the sed pattern and the field-count filter at the end.  When
# ASSUME is "true" every path is treated as a symlink without testing;
# it defaults to "false", in which case each path is tested with -h.
#
# Lines for symlinks are written to stdout with the link's target
# appended as one more tab-separated field.  Lines for anything else
# are written to stdout unchanged, as they are read.
#
# Relies on IFS being newline and tab, as set near the top of this
# script, for read to split each line at its first tab.  $tab, mkstemp
# and fail are not defined in this file; presumably they come from
# posix-defuns.sh -- confirm.
readlinks () {
    local restc=$1 assume="${2:-false}" first= rest=
    local fields_temp="$(mkstemp)" targets_temp="$(mkstemp)"
    # This first pipeline involves a safe parse of ls(1) output given
    # its POSIX specification.
    # We want the ninth field onwards in the output of ls(1) in awk's
    # sense -- i.e. collapsing runs of multiple blanks between the first
    # nine fields -- but we mustn't collapse blanks from there onwards.
    #
    # Stage by stage: the loop emits one symlink path per line; awk
    # wraps each path in double quotes, escaping embedded double quotes,
    # so that xargs hands it to ls(1) as a single operand; sed drops the
    # first eight ls(1) fields, leaving "NAME -> TARGET", and deletes
    # any line consisting solely of "." (presumably what ls -ld prints
    # when xargs runs it with no operands -- confirm).
    #
    # Keep the caller's stdout reachable as fd 3: inside the loop below
    # stdout is the pipe feeding awk, xargs and ls(1).
    exec 3>&1
    while read -r first rest; do
	# Restore the tab that read consumed between $first and $rest.
	[ -n "$rest" ] && rest="$tab$rest"
	if $assume || [ -h "$first" ]; then
	    # A symlink: send its path down the pipe for ls(1) and save
	    # the whole input line for the paste(1) step further down.
	    echo "$first"
	    echo "$first$rest" >>"$fields_temp"
	else
	    # Not a symlink: pass the line through untouched.
	    echo "$first$rest" >&3
	fi
    done \
	| awk '{ gsub(/"/, "\"'"'"'\"'"'"'\"")
		 printf "\"%s\"\n", $0 }' | xargs -E '' -- ls -ld \
	| sed -E 's/^([^[:blank:]]+[[:blank:]]+){8}//; /^\.$/d' \
	| sort -o "$targets_temp" # undo how ls(1) sorts non-dirs first
    # Sort the saved input lines too; the intent is that line N of each
    # temporary file then describes the same link.
    sort -t"$tab" -k1 -o "$fields_temp" "$fields_temp"

    # paste(1) pairs the files line by line, so differing line counts
    # mean the pairing cannot be trusted: clean up and give up.
    if [ "$(wc -l <"$fields_temp")" \
	     -ne "$(wc -l <"$targets_temp")" ]; then
	rm "$fields_temp" "$targets_temp"
	fail "line counts unequal; are there newlines in link targets?"
    fi

    # Only BREs have backreferences in POSIX.
    # Join each saved line to its "NAME -> TARGET" line, then use a
    # backreference to the first field to strip the repeated "NAME -> "
    # prefix from the appended field, leaving only TARGET.  The command
    # substitution expands to RESTC copies of a pattern matching one
    # non-empty field and its trailing tab.  The final awk keeps only
    # lines with exactly RESTC + 2 fields whose last field contains no
    # control characters.
    # NOTE(review): "\t" in a sed BRE, especially inside a bracket
    # expression, is not specified by POSIX -- confirm that the sed
    # implementations this must run on read it as a tab.
    paste "$fields_temp" "$targets_temp" \
	| sed 's/^\([^\t]\{1,\}\)\t\('\
"$(printf "%${restc}s" | sed 's/ /[^\\t]\\{1,\\}\\t/g')"\
'\)\1 -> /\1\t\2/' \
	| awk -F'\t' 'NF == '$((2+$restc))' && $NF !~ /[\001-\037\177]/'

    rm "$fields_temp" "$targets_temp"
}

# disjoin_file FILE FORMAT
#
# Join the non-empty lines of $DIR/FILE into one "|"-separated string,
# suitable for use as an alternation inside a regular expression.
# Each line is rendered with printf(1) using FORMAT, which must contain
# exactly one %s conversion, and every "/" in the result is escaped with
# a backslash so the string can sit between awk's /.../ delimiters.
# Prints nothing if the file has no non-empty lines.
disjoin_file () {
    local line=
    # read returns non-zero on a final line that lacks a trailing
    # newline, yet still fills $line; the extra test keeps that line.
    while read -r line || [ -n "$line" ]; do
	if [ -n "$line" ]; then
	    printf "|$2" "$line"
	fi
    done <"$DIR/$1" | sed 's#^.##; s#/#\\/#g' # drop the leading "|"
}

# globs_to_find_args FILE [GLOB...]
#
# Turn ignore globs into find(1) primaries, printed as tab- and
# newline-separated words meant to be expanded unquoted into a find(1)
# command line.  Globs come from the GLOB arguments and then, if it
# exists, from the lines of $DIR/FILE.  Empty lines are skipped.
#
#   - A glob ending in "/*" has that suffix removed and joins a single
#     leading group of the form
#         ( ( -path ./A -o -path ./B ... ) -prune -o -name * )
#   - Any other glob G yields "! -path ./G", in input order.
#
# We want to prevent find(1) recursing into directories of the "dir/*"
# names, but not prevent the remainder of the find(1) expression from
# matching the names themselves.  This is what is correct for globs of
# the form "dir/*".  While it is true that neither of the find(1)
# commands which use globs_to_find_args() match directories, such that
# it would not make sense to add a line to one of .hstow-*-ignore with
# the aim of excluding the contents of a directory but not the directory
# itself, it could be that the name is currently a symlink that we
# should unstow.  (Also note that we do not pass -L to find(1), so we
# will not recurse into symlinks to dirs anyway.)
globs_to_find_args () {
    local file="$DIR/$1"; shift
    {
	printf '%s\n' "$@"
	if [ -e "$file" ]; then
	    cat "$file"
	fi
    } | awk -F'\n' -v OFS='\t' '
	/\/\*$/ { sub(/..$/, ""); prune[++c] = "./" $0; next }
	# Test the length, not the truth of $0: a line such as "0" looks
	# numeric and would count as false, silently dropping that glob.
	length($0) > 0 { notpath[++d] = "./" $0 }
	END {
	    if (c) {
		print "(", "(", "-path", prune[1]
		for (i = 2; i <= c; i++)
		    print "-o", "-path", prune[i]
		print ")", "-prune", "-o", "-name", "*", ")"
	    }
	    for (j = 1; j <= d; j++)
		print "!", "-path", notpath[j]
	}'
}

# Hand the command-line synopsis to fail.  fail is not defined in this
# file; presumably it reports the message and exits -- confirm.
usage () {
    local synopsis='stow|unstow|restow|adopt DIRECTORY'
    fail "usage: hstow $synopsis"
}

# Stow the contents of $DIR into $HOME.
#
# Reads the globals DIR, NAME and HOME.  Changes the working directory
# to $DIR, ensures that $HOME/.STOW exists with a .stow file in it and a
# symlink called $NAME pointing at $DIR, and then runs stow1 to create
# the links.  Whatever stow1 prints is taken to be a list of conflicting
# files, one per line: if there are any they are reported on stderr and
# the script exits with status 127; otherwise stow returns 0.
stow () {
    local conflicts=

    cd "$DIR"
    [ -d "$HOME/.STOW" ] || mkdir "$HOME/.STOW"
    [ -f "$HOME/.STOW/.stow" ] || touch "$HOME/.STOW/.stow"
    [ -h "$HOME/.STOW/$NAME" ] \
	|| ( cd "$HOME/.STOW"; ln -s "$DIR" "$NAME" )

    # Assign separately from the declaration above so that a failure of
    # stow1 is not masked by the exit status of local.
    conflicts="$(stow1)"
    if [ -z "$conflicts" ]; then
	return 0
    fi

    # Indent line by line rather than word-splitting $conflicts, so the
    # report does not depend on the current value of IFS.
    {
	echo "hstow: encountered conflicts:"
	printf '%s\n' "$conflicts" | sed 's/^/  /'
    } >&2
    exit 127
}

# Create or repair the symlinks under $HOME for every file under the
# current directory, which stow() has already changed to $DIR.
#
# Reads the globals always_adopt, NAME and HOME; sets the global adoptp.
# Prints to stdout the path, relative to $DIR, of each file that could
# not be linked because something else already occupies its place under
# $HOME; stow() captures that output as its list of conflicts.
# $cchars is not defined in this file; presumably it is a glob matching
# names that contain control characters -- confirm.
stow1 () {
    # adoptp is an awk expression spliced into the program below, where
    # it decides the value of the fourth output field: the constant 1
    # (adopt everything), the constant 0 (adopt nothing), or a match of
    # rel against the patterns listed in .hstow-always-adopt.
    if $always_adopt; then
	adoptp=1
    elif ! [ -e .hstow-always-adopt ]; then
	adoptp=0
    else
	# EREs matching files that (i) always/often have their symlinks
	# replaced with regular files when applications access them; and
	# (ii) we don't ever want to edit the copy under $DIR directly,
	# but only via the link/copy under $HOME.
	# We might list globs in this file & convert them to EREs here.
	adoptp="$(printf 'rel ~ /^(%s)/' \
			 "$(disjoin_file .hstow-always-adopt "%s")")"
    fi
    # find(1) lists every non-directory that is not ignored and is not
    # one of hstow's own control files.  For each such path the awk
    # program emits five tab-separated fields, which the loop reads as:
    #   link      $HOME/rel, where rel is the path with its leading "./"
    #             removed and each "/dot-" or "/dot." rewritten to "/."
    #   file      the path exactly as find(1) printed it
    #   file_dir  that path with its last component removed
    #   adopt     "true" or "false", as decided by adoptp
    #   target    one "../" per directory component of rel, followed by
    #             .STOW/$NAME/rel
    # readlinks then appends a sixth field, link_target, to the lines
    # whose link is currently a symlink; other lines pass through as
    # they are, leaving link_target empty in the loop.
    # NOTE(review): file_dir is built from the unrewritten path whereas
    # link and target are built from rel; confirm that this is intended
    # for names beginning "dot-" or "dot.".
    find . $(globs_to_find_args .hstow-local-ignore ".git/*") \
	 ! -name . ! -type d ! -name "$cchars" ! -name .gitignore \
	 ! -name .hstow-local-ignore ! -name .hstow-always-adopt \
	 ! -name .hstow-unstow-ignore -print \
	| awk -F'\n' -vOFS='\t' '
{ rel = $1; gsub(/\/dot[-.]/, "/.", rel); gsub(/^\.\//, "", rel)
  dotdotslashes = rel
  sub(/[^\/]*$/, "", dotdotslashes)
  gsub(/[^\/]+/, "..", dotdotslashes)
  $2 = $1
  $3 = $1; sub(/\/[^/]+$/, "", $3)
  $1 = ENVIRON["HOME"] "/" rel
  $4 = '"$adoptp"' ? "true" : "false"
  $5 = dotdotslashes ".STOW/'"$NAME"'/" rel
  print
}' | readlinks 4 \
	| while read -r link file file_dir adopt target link_target; do
	if [ "$target" = "$link_target" ]; then
	    # Already linked to the right place: nothing to do.
	    continue
	elif [ -n "$link_target" ]; then # implies $link is a symlink
	    # With at least GNU ln(1), passing -f, but not also -T, does
	    # not replace an existing link in some cases.
	    # -T is not POSIX, so we remove any existing link first.
	    rm "$link"
	    ln -s "$target" "$link"
	elif $adopt && [ ! -h "$file" -a -f "$link" ]; then
	    # Adopt: move the regular file found under $HOME over the
	    # copy under $DIR, then put the link in its place.
	    mv -f "$link" "$file"
	    ln -s "$target" "$link"
	elif [ -d "$link" ] && rmdir "$link" 2>/dev/null; then
	    # An empty directory was in the way and has been removed.
	    ln -s "$target" "$link"
	elif [ -e "$link" ]; then
	    echo "$file" 	# into $conflicts
	else
	    # Nothing there yet: make the parent directory, then link.
	    mkdir -p "$HOME/$file_dir"
	    ln -s "$target" "$link"
	fi
    done
}

# Remove from $HOME every symlink that points into .STOW/$NAME, try to
# remove the directories those links lived in, and then remove this
# package's entry from $HOME/.STOW.
#
# Reads the globals DIR, NAME and HOME and changes the working directory
# to $HOME.  $cchars and dir_contents are not defined in this file;
# presumably they come from posix-defuns.sh -- confirm.
unstow () {
    cd "$HOME"

    # .hstow-unstow-ignore is a list of globs matching dirs into which
    # we'll never stow anything.  We have this for the sake of speed.
    #
    # awk's close() calls pclose(3), completing all the link deletions.
    # POSIX.1 "Utility Description Defaults", "Consequences of Errors"
    # implies that should rmdir(1) encounter a non-empty directory, it
    # should proceed to attempt to remove the next operand.
    # Thus, here, -p means that we do not need to sort the operands.
    # We don't know the code with which rmdir(1) will exit, and if it is
    # 255 then xargs will give up.  So we wrap in a call to sh -c.
    #
    # Stage by stage: find(1) prunes anything owned by neither the
    # current user nor the current group, does not descend into .STOW,
    # into $DIR (given relative to $HOME) or into the dirs matched by
    # .hstow-unstow-ignore, and prints every remaining symlink.
    # "readlinks 0 true" appends each link's target.  awk selects the
    # links whose target is zero or more "../" followed by .STOW/$NAME/,
    # pipes their quoted paths to xargs for removal, and collects the
    # directory containing each one; at END it closes that pipe and
    # prints the collected directories for the final xargs to pass to
    # rmdir -p.
    # NOTE(review): the awk program sits inside shell single quotes, so
    # the '' after -E in its two xargs command strings is consumed by
    # the shell before awk sees it; awk therefore runs
    # "xargs -E -- rm -f".  Confirm this is the intended command.
    find . ! \( -user "$(id -un)" -o -group "$(id -gn)" \) -prune -o \
	 $(globs_to_find_args \
	       .hstow-unstow-ignore ".STOW/*" \
	       "$(echo "$DIR" \
		      | cut -c$((1 + $(echo "$HOME" | wc -m)))-)/*") \
	 -type l ! -name . ! -name "$cchars" -print \
	| readlinks 0 true \
	| awk -F'\t' -vOFS='\t' '$2 ~ /^(\.\.\/)*\.STOW\/'"$NAME"'\// \
{ gsub(/"/, "\"'"'"'\"'"'"'\"", $1)
  printf "\"%s\"\n", $1 | "xargs -E '' -- rm -f"
  sub(/^.\//, "", $1)
  sub(/\/?[^/]+$/, "", $1)
  if ($1) dirs[++i] = $1
} END { close("xargs -E '' -- rm -f")
	for (d in dirs) printf "\"%s\"\n", dirs[d]
}' | xargs -E '' -- sh -c 'rmdir -p -- "$@" 2>/dev/null ||:' --

    # Drop this package's entry from .STOW.  If dir_contents then
    # reports only ./.stow there, remove that file and the directory.
    [ -e "$HOME/.STOW/$NAME" ] && rm "$HOME/.STOW/$NAME"
    if [ -d "$HOME/.STOW" ] \
	   && [ "$(dir_contents $HOME/.STOW)" = "./.stow" ]; then
	rm "$HOME/.STOW/.stow"
	rmdir "$HOME/.STOW"
    fi
}

# Entry point: hstow stow|unstow|restow|adopt DIRECTORY
#
# Sets the globals read by the functions above:
#   DIR           absolute path of DIRECTORY
#   NAME          DIR with every "/" replaced by "_"; names this
#                 package's entry under $HOME/.STOW
#   always_adopt  "true" only for the adopt subcommand
[ "$#" -eq 2 ] || usage
[ -d "$2" ] || fail "$2 is not an existing directory"
# Clear CDPATH for the cd so that a relative DIRECTORY can only be
# resolved against the current directory and cd prints nothing of its
# own; -- protects a DIRECTORY that begins with "-".
DIR="$(CDPATH= cd -- "$2" && pwd)"
# Require a path separator straight after $HOME.  A bare string-prefix
# comparison would also accept siblings of $HOME, e.g. /home/seanx when
# HOME is /home/sean.  Any trailing slash on $HOME itself is ignored.
case "$DIR" in
    "${HOME%/}"/*) ;;
    *) fail "$DIR is not below $HOME" ;;
esac

# printf, unlike echo, passes backslashes in $DIR through unchanged.
NAME="$(printf '%s\n' "$DIR" | tr / _)"
always_adopt=false
case "$1" in
    'stow')   stow			;;
    'unstow') unstow			;;
    'restow') unstow; stow		;;
    'adopt')  always_adopt=true; stow	;;
    *)        usage                     ;;
esac