X-Git-Url: https://iankelling.org/git/?p=distro-setup;a=blobdiff_plain;f=btrbk-run;h=6908018f61fbafda774339f4f299699e479a388b;hp=c59faf99c9eecb0e976a532bd6e2ef00225c59f7;hb=8a6b446c7e336596af614c853e1c6177e55a7983;hpb=82b146c2299fce1aec68d492e4bd881d81e8e6c9 diff --git a/btrbk-run b/btrbk-run old mode 100755 new mode 100644 index c59faf9..6908018 --- a/btrbk-run +++ b/btrbk-run @@ -1,98 +1,303 @@ #!/bin/bash +# Copyright (C) 2016 Ian Kelling + +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at + +# http://www.apache.org/licenses/LICENSE-2.0 + +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + + +# todo: if we cancel in the middle of a btrfs send, then run again immediately, the received subvolume doesn't get a Received UUID: field, and we won't mount it. Need to figure out a solution that will fix this. set -eE -o pipefail trap 'echo "$0:$LINENO:error: \"$BASH_COMMAND\" returned $?" >&2' ERR [[ $EUID == 0 ]] || exec sudo -E "$BASH_SOURCE" "$@" + usage() { - echo "top of script file:" - sed -n '1,/^[# ]*end command line/{p;b};q' "$0" - exit $1 + cat <<'EOF' +btrbk-run [OPTIONS] +usually -t TARGET_HOST or -s SOURCE_HOST + +Note, at source location, intentionally not executable, run and read +install-my-scripts. + +EOF + echo "top of script file:" + sed -n '1,/^[# ]*end command line/{p;b};q' "$0" + exit $1 +} + +rsync-dirs() { + local host=$1 + local path=$2 + m rsync $dry_run_arg -ahi --relative --delete "$path" "root@$host:/" } -script_dir=$(dirname $(readlink "$BASH_SOURCE")) -# todo: finish figuring out fai / distro-setup -# initial fstab / subvol setup. +m() { if $verbose; then printf "$pre %s\n" "$*"; fi; "$@"; } +die() { printf "$pre %s\n" "$*" >&2; exit 1; } + +# latest $MAIL_HOST +if [[ -e /b/bash_unpublished/source-semi-priv ]]; then + source /b/bash_unpublished/source-semi-priv +fi + +# note q is owned by root:1000 + +mountpoints=() +rsync_mountpoint=/q + +# default options conf_only=false dry_run=false # mostly for testing -resume_arg= +rate_limit=no +verbose=true; verbose_arg=-v +progress_arg="--progress" +pull_reexec=false + +default_args_file=/etc/btrbk-run.conf +if [[ -s $default_args_file ]]; then + set -- $(< $default_args_file) "$@" + # i havent used this feature yet, so warn about it + echo "$0: warning: default btrbk-run options set in $default_args_file (sleeping 5 seconds):" + cat $default_args_file + sleep 5 +fi -temp=$(getopt -l help hcnrt: "$@") || usage 1 +pre="${0##*/}:" +cron=false +orig_args=("$@") +temp=$(getopt -l cron,pull-reexec,help cl:m:npqs:t:vh "$@") || usage 1 eval set -- "$temp" while true; do - case $1 in - -c) conf_only=true; shift ;; - -n) dry_run=true; dry_run_arg=-n; shift ;; - -r) resume_arg=-r; shift ;; - -t) IFS=, targets=($2); shift 2 ;; - -h|--help) usage ;; - --) shift; break ;; - *) echo "$0: Internal error!" ; exit 1 ;; - esac + case $1 in + --cron) + cron=true + pre= + shift + ;; + # only creates the config file, does not run btrbk + -c) conf_only=true; shift ;; + # bytes per second, suffix k m g + -l) rate_limit=$2; shift 2 ;; + # Comma separated mountpoints to backup. This has defaults set below. + -m) IFS=, mountpoints=($2); unset IFS; shift 2 ;; + -n) dry_run=true; dry_run_arg=-n; shift ;; + -p) progress_arg="--progress"; shift ;; + --pull-reexec) pull_reexec=true; shift ;; + -q) verbose=false; verbose_arg=; progress_arg=; shift ;; + # source host to receive a backup from + -s) source=$2; shift 2 ;; + # target hosts to send to. empty is valid for just doing local + # snapshot. we have default hosts we will populate. + -t) IFS=, targets=($2); unset IFS; shift 2 ;; + -v) verbose=true; verbose_arg=-v; shift ;; + -h|--help) usage ;; + --) shift; break ;; + *) die "Internal error!" ;; + esac done -read primary <<<"$@" -##### end command line parsing ######## +# usefull commands are resume and archive +cmd_arg=${1:-run} -target-section() { - local root=$1 - local subvol=$2 - mountpoint $root &>/dev/null || return - cat >>/etc/btrbk.conf </dev/null; then + home=iank.vpn.office.fsf.org + else + home=$HOME_DOMAIN + fi + ;;& + kw) + targets=($home x2) + ;; + x2) + targets=($home kw) + ;; + tp) + targets=(frodo kd) + # might not be connected to the vpn + if timeout -s 9 10 ssh kw :; then + targets+=(kw) + fi + ;; + kd) + targets=(frodo tp) + # might not be connected to the vpn + if timeout -s 9 10 ssh kw :; then + targets+=(kw) + fi + ;; + *) + die "error: no default targets for this host, use -t" + ;; + esac +fi -rsync-dirs() { - local host=$1 - local path=$2 - rsync $dry_run_arg -ahi --relative --delete "$path" "root@$host:/" -} +if [[ -v targets ]]; then + echo "targets: ${targets[*]}" +fi +if [[ $source ]]; then + echo "source: $source" +fi -# note q is owned by root:1000 -# note p is owned 1000:1000 and chmod 700 -mountpoints=(/q) -if awk '{print $2}' /etc/fstab | grep -xF /p &>/dev/null; then - mountpoints+=(/p) + +if [[ $mountpoints ]]; then + for mp in ${mountpoints[@]}; do # default mountpoints to sync + if [[ -e /nocow/btrfs-stale/$mp ]]; then + die "error: $mp is stale, mount-latest-subvol first" + fi + done +else + # set default mountpoints + case $HOSTNAME in + # no remote backups atm. note, if we do enable this, configuration below will need some changes. + # frodo) + # prospective_mps=(/i) + # ;; + *) + prospective_mps=(/a /q) + if [[ $HOSTNAME == "$MAIL_HOST" ]]; then + prospective_mps+=(/o) + fi + ;; + esac + for mp in ${prospective_mps[@]}; do # default mountpoints to sync + if [[ -e /nocow/btrfs-stale/$mp ]]; then + echo "$pre warning: $mp stale, not adding to default mountpoints" + continue + fi + if awk '{print $2}' /etc/fstab | grep -xF $mp &>/dev/null; then + mountpoints+=($mp) + fi + done +fi + +echo "mountpoints: ${mountpoints[*]}" + + + +# pull_reexec stops us from getting into an infinite loop if there is some +# kind of weird problem +pulla=false +for m in "${mountpoints[@]}"; do + if [[ $m == /a ]]; then + pulla=true + break + fi +done +if ! $pull_reexec && [[ $source ]] && $pulla ; then + tmpf=$(mktemp) + scp $source:/a/bin/distro-setup/btrbk-run $tmpf + if ! diff -q $tmpf $BASH_SOURCE; then + echo "$pre found newer version on host $source. reexecing" + install -T $tmpf /usr/local/bin/btrbk-run + m /usr/local/bin/btrbk-run --pull-reexec "${orig_args[@]}" + exit + fi fi + +##### end command line parsing ######## + + + +if ! which btrbk &>/dev/null; then + die "error: no btrbk binary found" +fi # if our mountpoints are from stale snapshots, # it doesn't make sense to do a backup. -check-subvol-stale ${mountpoints[@]} || exit 1 - -if [[ ! $targets ]]; then - case $HOSTNAME in - tp|x2) - if ! timeout -s 9 10 ssh frodo :; then - targets=($HOME_DOMAIN) - fi - ;; - esac - targets=(frodo) +check-subvol-stale ${mountpoints[@]} || die "found stale mountpoints in ${mountpoints[*]}" + +# for an initial run, btrbk requires the dir to exist. +mkdir -p /mnt/root/btrbk +local_zone=$(date +%z) + +if [[ $source ]]; then + if ! zone=$(ssh root@$source date +%z); then + die failed to ssh to root@$source + fi + if [[ $zone != $local_zone ]]; then + die "error: dont confuse yourself with multiple time zones. $h has different timezone than localhost" + fi + +else + + sshable=() + sshfail=() + min_idle_ms=$((1000 * 60 * 15)) + for h in ${targets[@]}; do + if zone=$(ssh root@$h "mkdir -p /mnt/root/btrbk && date +%z"); then + if $cron && DISPLAY=:0 xprintidle; then + # This is a separate ssh because xprintidle can fail and thats ok. + # Ignore this host. i sometimes use a non-main machine for testing or web browsing, knowing that + # everything will be wiped by the next backup, but I dont want it to happen as Im using + # it from cronjob. + continue + fi + sshable+=($h) + if [[ $zone != $local_zone ]]; then + die "error: dont confuse yourself with multiple time zones. $h has different timezone than localhost" + fi + else + sshfail+=($h) + fi + done + if [[ ! $sshable ]] || { ! $cron && [[ $sshfail ]]; }; then + die "failed to ssh to hosts: ${sshfail[*]}" + else + if [[ $sshfail ]]; then + ret=1 + echo "$pre error: failed to ssh to ${sshfail[*]} but continuing with other hosts" + fi + targets=(${sshable[@]}) + fi fi -# todo: make bash shell prompt show something when -# a subvol on current host is not fresh. -# umount first to ensure we don't have any errors -# todo: do some kill fuser stuff to make umount more reliable -# todo: run this on a systemd timer on $primary, once per hour, -# and if primary is, change that timer over to primary, and make -# sure we mount the latest -# todo: setup lock so that if this is already running, we exit out, so -# that manual runs don't interfere with cronjobs. +cat >/etc/btrbk.conf </etc/btrbk.conf <<'EOF' -ssh_identity /root/.ssh/id_rsa -transaction_syslog daemon +# note, i had this because man said 20% speedup, but ran into +# this issue, https://github.com/digint/btrbk/issues/275 +#stream_buffer 512m # so we only run one at a time lockfile /var/lock/btrbk.lock @@ -102,70 +307,100 @@ timestamp_format long-iso # only make a snapshot if things have changed snapshot_create onchange -# much less snapshots because I have less space on the -# local filesystem. -#snapshot_preserve 2h 2d -# for now, keeping them equal for simplicity sake -snapshot_preserve 48h 14d 8w 24m -snapshot_preserve_min 6h +# I could make this different from target_preserve, +# if one disk had less space. +# for now, keeping them equal. +snapshot_preserve 36h 14d 8w 24m +snapshot_preserve_min 4h snapshot_dir btrbk # so, total backups = ~89 -target_preserve 48h 14d 8w 24m -target_preserve_min 6h +target_preserve 36h 14d 8w 24m +target_preserve_min 4h # if something fails and it's not obvious, try doing # btrbk -l debug -v dryrun + +rate_limit $rate_limit EOF - remote_target="target send-receive ssh://${tg}/mnt/root/btrbk" - if [[ $tg == frodo && $HOSTNAME == treetowl ]]; then - target-section /mnt/iroot i - fi - for d in ${mountpoints[@]}; do - target-section /mnt/root ${d##*/} + + + +vol=/mnt/root +for m in ${mountpoints[@]}; do + sub=${m##*/} + if [[ $source ]]; then + cat >>/etc/btrbk.conf <>/etc/btrbk.conf <>/etc/btrbk.conf </dev/null; then + +if $dry_run; then + m btrbk -v -n $cmd_arg + exit 0 +elif [[ $cmd_arg == archive ]]; then + if [[ $source ]]; then + m btrbk $verbose_arg $progress_arg $cmd_arg ssh://$source$vol $vol + else for tg in ${targets[@]}; do - case $tg in - tp|li|lk) - for x in /p/c/machine_specific/*.hosts; do - if grep -qxF $tg $x; then - dir=${x%.hosts} - rsync-dirs $tg $dir - fi - done - ;; - esac + m btrbk $verbose_arg $progress_arg $cmd_arg $vol ssh://$tg$vol done + fi + exit 0 +fi +# -q and just using the syslog option seemed nice, +# but it doesn't show when a send has a parent and when it doesn't. +m btrbk $verbose_arg $progress_arg $cmd_arg + +# if we have it, sync to systems which don't +if mountpoint $rsync_mountpoint >/dev/null; then + for tg in ${targets[@]}; do + case $tg in + li|lk) + for x in /p/c/machine_specific/*.hosts; do + if grep -qxF $tg $x; then + dir=${x%.hosts} + rsync-dirs $tg $dir + fi + done + ;; + esac + done fi -if ! $dry_run; then - for tg in ${targets[@]}; do - scp $script_dir/{mount-latest-subvol,check-subvol-stale} \ - root@$tg:/usr/local/bin - ssh root@$tg bash <<'EOF' -set -e -chmod +x /usr/local/bin/{mount-latest-subvol,check-subvol-stale} -mount-latest-subvol -EOF - done +if [[ $source ]]; then + m mount-latest-subvol $verbose_arg +else + m /a/exe/mount-latest-remote ${targets[@]} fi +exit $ret # todo: move variable data we don't care about backing up # to /nocow and symlink it.