X-Git-Url: https://iankelling.org/git/?a=blobdiff_plain;ds=sidebyside;f=btrbk-run;h=dde230ee85f6b5ece47163eaf2b3448fb595b4d0;hb=HEAD;hp=c33ed66904832bff7ecdcf0b5873413098395ed5;hpb=2632836241e21fb97fa826b64a1886353bacd84f;p=distro-setup diff --git a/btrbk-run b/btrbk-run index c33ed66..9bd6e9b 100644 --- a/btrbk-run +++ b/btrbk-run @@ -1,17 +1,22 @@ #!/bin/bash -# Copyright (C) 2016 Ian Kelling -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at +# Configure & run btrbk & related work on Ian's computers. +# Copyright (C) 2024 Ian Kelling -# http://www.apache.org/licenses/LICENSE-2.0 +# This program is free software: you can redistribute it and/or modify +# it under the terms of the GNU General Public License as published by +# the Free Software Foundation, either version 3 of the License, or +# (at your option) any later version. -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. + +# You should have received a copy of the GNU General Public License +# along with this program. If not, see . + +# SPDX-License-Identifier: GPL-3.0-or-later # todo: if we cancel in the middle of a btrfs send, then run again @@ -22,7 +27,8 @@ [[ $EUID == 0 ]] || exec sudo -E "${BASH_SOURCE[0]}" "$@" -source /usr/local/lib/err +set -e; . /usr/local/lib/bash-bear; set +e +shopt -s nullglob usage() { cat <<'EOF' @@ -40,12 +46,135 @@ EOF +pre=btrbk-run + + + script_name="${BASH_SOURCE[0]}" script_name="${script_name##*/}" -m() { if $verbose; then printf "%s\n" "$*"; fi; "$@"; } -e() { printf "%s\n" "$*"; } -die() { printf "%s\n" "$*" >&2; echo "exiting with status 1" >&2; exit 1; } -mexit() { echo ": exiting with status $1"; exit $1; } + + +log-setup() { + if [[ ! $log_path ]]; then + mkdir -p /var/log/btrbk + log_path=/var/log/btrbk/$(date +%F_%T%:::z).log + fi +} +d() { + if $dry_run || $conf_only; then + printf "$pre dry-run: %s\n" "$*" + else + log-setup + printf "$pre running: %s\n" "$*" |& pee cat 'ts "%F %T" >>'$log_path + "$@" |& pee cat 'ts "%F %T" >>'$log_path + fi +} +m() { if $verbose; then printf "$pre %s\n" "$*"; fi; "$@"; } +e() { printf "$pre %s\n" "$*"; } + +logq() { + local exit_code + exit_code=0 + log-setup + printf "$pre running: %s\n" "$*" | pee cat 'ts "%F %T" >>'$log_path + e logging to $log_path + "$@" |& ts "%F %T" >>$log_path || exit_code=$? + printf "$pre exit code:%s of %s\n" "$exit_code" "$*" | pee cat 'ts "%F %T" >>'$log_path + if (( exit_code > 0 )); then + e "error: command exit code: $exit_code. exiting after tail -n50 $log_path" + tail -n50 $log_path + exit $exit_code + fi +} + +die() { printf "$pre error: %s\n" "$*" >&2; echo "$pre exiting with status 1" >&2; exit 1; } +mexit() { echo "$pre exiting with status $1"; exit $1; } + +uninstalled-file-die() { + die "file $1 is not latest. run install-my-scripts or rerun with -f" +} + +set-location() { + case $HOSTNAME in + kw) + at_work=true + ;; + kd|frodo) + at_home=true + ;; + x2|x3|sy|so) + if [[ $(dig +short @10.2.0.1 -x 10.2.0.2 2>&1 ||:) == kd.b8.nz. ]] \ + && ip n show 10.2.0.1 | grep . &>/dev/null; then + # note: logic duplicated in 11-iank + at_home=true + elif ping -q -c1 -w1 hal.office.fsf.org &>/dev/null \ + && ip n show 192.168.0.26 | grep . &>/dev/null; then + at_work=true + fi + ;; + esac +} + +exit-if-no-default-targets() { + if ! $force && [[ $HOSTNAME != "$MAIL_HOST" ]]; then + echo "MAIL_HOST=$MAIL_HOST, nothing to do" + mexit 0 + fi + case $HOSTNAME in + kw|kd|frodo|x2|x3|sy|so) : ;; + *) + die "error: no default targets for this host, use -t" + ;; + esac +} + +add-x3-target() { + # main work machine + if ping -q -c1 -w1 x3.office.fsf.org &>/dev/null; then + targets+=(x3.office.fsf.org) + elif ping -q -c1 -w1 x3.b8.nz &>/dev/null; then + # in case we took it home + targets+=(x3.b8.nz) + elif ping -q -c1 -w1 x3w.b8.nz &>/dev/null; then + targets+=(x3w.b8.nz) + else + targets+=(x3wg.b8.nz) + fi +} + +add-wireless-target() { + local host + if [[ ! $1 ]]; then + set -- $h + fi + for host; do + # c = cabled, w = wireless + if ping -q -c1 -w1 ${host}c.b8.nz &>/dev/null; then + targets+=(${host}c.b8.nz) + elif ping -q -c1 -w1 $host.b8.nz &>/dev/null; then + targets+=($host.b8.nz) + elif ping -q -c1 -w1 ${host}w.b8.nz &>/dev/null; then + targets+=(${host}w.b8.nz) + fi + done +} + +qconf() { + case $sub in + q) + # q has sensitive data i dont want to backup for so long + cat >>/etc/btrbk$conf_suf.conf < >(sed '/No such file or directory/d'); then + # shellcheck disable=SC2046 # we want word splitting + set -- $(< $once_args_file-tmp) "$@" + # i havent used this feature yet, so warn about it + echo "$0: btrbk-run options set in $once_args_file:" + cat $once_args_file-tmp + rm -f $once_args_file-tmp +fi + + targets=() early=false fast=false kd_spread=false +check_installed=false orig_args=("$@") -temp=$(getopt -l fast,pull-reexec,help 23cefikl:m:npqrs:t:vh "$@") || usage 1 +temp=$(getopt -l check-installed,fast,pull-reexec,help 23acefikl:m:npqrs:t:vh "$@") || usage 1 eval set -- "$temp" while true; do case $1 in # for the rare case we want to run multiple instances at the same time -2) conf_suf=2 ;; -3) conf_suf=3 ;; + -a) + # all moiuntpoints + mountpoints=(/a /o /qr /qd /q) + ;; # only creates the config file, does not run btrbk -c) conf_only=true ;; + --check-installed) + check_installed=true + ;; # quit early, just btrbk, no extra remounting etc. -e) early=true ;; # avoids some default behaviors: @@ -110,7 +258,9 @@ while true; do # switch mail-host, no need to repeat the same checks again. --fast) fast=true ;; -i) incremental_strict=true ;; - # note this implies resume and -p + # note this implies resume and -p because it is just meant to make + # other hosts have the same snapshots, not do any expiry or new + # backups. -k) kd_spread=true ;; # bytes per second, suffix k m g -l) rate_limit=$2; shift ;; @@ -136,7 +286,9 @@ while true; do # snapshot. we have default hosts we will populate. -t) IFS=, targets=($2); unset IFS; shift ;; # verbose. - -v) verbose=true; verbose_arg=-v ;; + -v) + verbose=true; verbose_arg="-l trace" + ;; -h|--help) usage ;; --) shift; break ;; *) die "Internal error!" ;; @@ -146,6 +298,28 @@ done cmd_arg="$1" + + +if ! $force && { $check_installed || [[ ! $source ]]; } ; then + install_bin_files=( + mount-latest-subvol + check-subvol-stale + btrbk-run + ) + for f in ${install_bin_files[@]}; do + if ! diff -q /a/bin/ds/$f /usr/local/bin/$f; then + uninstalled-file-die $f + fi + done + if ! diff -q /a/bin/bash-bear-trap/bash-bear /usr/local/lib/bash-bear; then + uninstalled-file-die bash-bear + fi + if $check_installed; then + exit 0 + fi +fi + + if $kd_spread; then if [[ $cmd_arg && $cmd_arg != resume ]]; then die "dont pass -k without resume or empty run arg" @@ -158,8 +332,7 @@ if $kd_spread; then fi cmd_arg=resume preserve_arg=-p - h=sy - add-wireless-target-h + add-wireless-target sy so fi if [[ ! $cmd_arg ]]; then @@ -211,6 +384,7 @@ if [[ /a/opt/btrbk/btrbk -nt /usr/bin/btrbk ]]; then fi cd /a/opt/btrbk m make install + cd / fi # TODO: i wonder if there should be an option to send to the default @@ -221,60 +395,6 @@ at_work=false at_home=false -set-location() { - case $HOSTNAME in - kw) - at_work=true - ;; - kd|frodo) - at_home=true - ;; - x2|x3|sy) - if [[ $(dig +short @10.2.0.1 -x 10.2.0.2 2>&1 ||:) == kd.b8.nz. ]] \ - && ip n show 10.2.0.1 | grep . &>/dev/null; then - at_home=true - elif ping -q -c1 -w1 hal.office.fsf.org &>/dev/null \ - && ip n show 192.168.0.26 | grep . &>/dev/null; then - at_work=true - fi - ;; - esac -} - -exit-if-no-default-targets() { - if ! $force && [[ $HOSTNAME != "$MAIL_HOST" ]]; then - echo "MAIL_HOST=$MAIL_HOST, nothing to do" - mexit 0 - fi - case $HOSTNAME in - kw|kd|frodo|x2|x3|sy) : ;; - *) - die "error: no default targets for this host, use -t" - ;; - esac -} - -add-x3-target() { - # main work machine - if ping -q -c1 -w1 x3.office.fsf.org &>/dev/null; then - targets+=(x3.office.fsf.org) - elif ping -q -c1 -w1 $h.b8.nz &>/dev/null; then - # in case we took it home - targets+=(x3.b8.nz) - else - targets+=(x3wg.b8.nz) - fi -} - -add-wireless-target-h() { - if ping -q -c1 -w1 $h.b8.nz &>/dev/null; then - targets+=($h.b8.nz) - elif ping -q -c1 -w1 ${h}w.b8.nz &>/dev/null; then - targets+=(${h}w.b8.nz) - fi -} - - # set default targets if [[ ! -v targets && ! $source ]]; then exit-if-no-default-targets @@ -289,14 +409,15 @@ if [[ ! -v targets && ! $source ]]; then wireless_home_hosts=( x2 sy + so ) for h in ${wireless_home_hosts[@]}; do if [[ $HOSTNAME != "$h" ]]; then - add-wireless-target-h + add-wireless-target fi done elif $at_work; then - targets+=(i.b8.nz) + targets+=(b8.nz) for h in x2 x3 kw; do if [[ $HOSTNAME == "$h" ]]; then continue @@ -306,7 +427,7 @@ if [[ ! -v targets && ! $source ]]; then fi done else - targets+=(i.b8.nz) + targets+=(b8.nz) fi fi @@ -325,24 +446,24 @@ else *) prospective_mps=() if [[ $source ]]; then - source_state="$(ssh $source cat /a/bin/bash_unpublished/source-state)" + source_state="$(ssh $source 'cat /a/bin/bash_unpublished/source-state; echo source_host=$HOSTNAME')" eval "$source_state" - source_host="$(ssh $source cat /etc/hostname)" + # shellcheck disable=SC2154 # assigned in the above eval. if [[ $source_host == "$MAIL_HOST" ]]; then prospective_mps+=(/o) fi if [[ $source_host == "$HOST2" ]]; then - prospective_mps+=(/a /ar /qr /qd /q) + prospective_mps+=(/a /qr /qd /q) fi else if [[ $HOSTNAME == "$MAIL_HOST" ]]; then prospective_mps+=(/o) fi if [[ $HOSTNAME == "$HOST2" ]]; then - prospective_mps+=(/a /ar /qr /qd /q) + prospective_mps+=(/a /qr /qd /q) fi if $kd_spread; then - prospective_mps=(/a /ar /o /qr /qd /q) + prospective_mps=(/a /o /qr /qd /q) fi fi # note: put q last just in case its specific retention options were to @@ -361,7 +482,8 @@ else done fi -if (( ! ${#mountpoints[@]} )); then +tmp=$(( ${#mountpoints[@]} == 0 )) +if (( tmp )); then die didnt get mountpoint arg and had no defaults fi @@ -386,34 +508,6 @@ if ! command -v btrbk &>/dev/null; then die "error: no btrbk binary found" fi - -#### end pre-checks ##### - -mkdir -p /var/log/btrbk -# The journal doesnt go back to my oldest backups, and I've found myself -# wanting older logs. Not going to bother expiring old logs, since it is -# fine if they go back years. -log_path=/var/log/btrbk/$(date +%F_%T%:::z).log -echo copying output to $log_path -exec &> >(ts "%F %T" | tee -a $log_path) - - -if $verbose; then - printf " options: conf_only=%s\ndry_run=%s\nrate_limit=%s\nverbose=%s\ncmd_arg=%s" "$conf_only" "$dry_run" "$rate_limit" "$verbose" "$cmd_arg" -fi - -if [[ -v targets ]]; then - echo "targets: ${targets[*]}" -fi - -if [[ $source ]]; then - echo "source: $source" -fi - -echo "mountpoints: ${mountpoints[*]}" - - - # pull_reexec stops us from getting into an infinite loop if there is some # kind of weird problem pulla=false @@ -423,10 +517,50 @@ for m in "${mountpoints[@]}"; do break fi done + +if ! $pull_reexec && [[ $source ]] && $pulla && ! $force ; then + ssh root@$source btrbk-run --check-installed +fi + +#### end pre-checks ##### + + + + +# print some non-default opts +if $verbose; then + opts_show=() + if ! $conf_only; then + opts_show+=(conf_only=true) + fi + if ! $dry_run; then + opts_show+=(dry_run=true) + fi + if [[ $rate_limit != no ]]; then + opts_show+=("rate_limit=$rate_limit") + fi + if [[ $cmd_arg != run ]]; then + opts_show+=(cmd_arg=$cmd_arg) + fi + if (( ${#opts_show[@]} >= 1 )); then + first=true + for opt in ${opts_show[@]}; do + if $first; then + printf "%s" "$opt" + first=false + else + printf " %s" "$opt" + fi + done + echo + fi +fi + + if ! $pull_reexec && [[ $source ]] && $pulla ; then tmpf=$(mktemp) m rsync -ra $source:/usr/local/bin/{mount-latest-subvol,check-subvol-stale} /usr/local/bin - m rsync -ra $source:/usr/local/lib/err /usr/local/lib + m rsync -ra $source:/usr/local/lib/bash-bear /usr/local/lib m scp $source:/a/bin/distro-setup/btrbk-run $tmpf if ! diff -q $tmpf ${BASH_SOURCE[0]}; then e "found different version on host $source. reexecing" @@ -437,6 +571,19 @@ if ! $pull_reexec && [[ $source ]] && $pulla ; then fi +if [[ -v targets ]]; then + echo "targets: ${targets[*]}" +fi +if [[ $source ]]; then + echo "source: $source" +fi +echo "mountpoints: ${mountpoints[*]}" + + +# todo: check if we have no snapshots yet, because I always want to run +# archive instead of run. Likely, I should give an error unless a cli +# override is passed. perhaps check-subvol-stale could give the error. +# see the error message "no snapshots found" in that file. if ! $fast; then # if our mountpoints are from stale snapshots, # it doesn't make sense to do a backup. @@ -466,19 +613,24 @@ else sshable=() sshfail=() + remote_str_cmd="mkdir -p /mnt/root/btrbk /mnt/o/btrbk && \ +date +%z && \ +df --output=size,pcent / | tail -n1" + for h in ${targets[@]}; do if $fast || $conf_only; then # Use some typical values in this case root_size=$(( 1024 * 1024 * 2000 )) #2tb percent_used=10 zone=$(date +%z) - elif remote_str=$(timeout -s 9 6 ssh root@$h "mkdir -p /mnt/root/btrbk /mnt/o/btrbk && date +%z && df --output=size,pcent / | tail -n1"); then + elif remote_str=$(timeout -s 9 6 ssh root@$h "$remote_str_cmd"); then mapfile -t tmp_array <<<"$remote_str" zone="${tmp_array[0]}" IFS=" " read -r root_size percent_used <<<"${tmp_array[1]}" percent_used=${percent_used%%%} - if (( ${#tmp_array[@]} != 2 )); then + tmp=$(( ${#tmp_array[@]} != 2 )) + if (( tmp )); then die "error: didnt get 2 lines in test ssh to target $h. investigate" fi case $percent_used in @@ -494,11 +646,14 @@ else # we may be booted into a bootstrap fs or something min_root_kb=$(( 1024 * 1024 * 200 )) # 200 gb - if (( root_size < min_root_kb )); then + tmp=$(( root_size < min_root_kb )) + if (( tmp )); then + e "warning: $h: root_size=$root_size < 200gb, perhaps it is booted to bootstrap vol. skipping for now" continue fi - if (( percent_used >= 98 )); then + tmp=$(( percent_used >= 98 )) + if (( tmp )); then die "error: filesystem on target $h is $percent_used % full" fi @@ -531,7 +686,7 @@ else fi done if [[ ! ${sshable[*]} ]] || { $force && [[ ${sshfail[*]} ]]; }; then - die "failed to ssh to hosts: ${sshfail[*]}" + die "see skipped host warning above or sshfail hosts: ${sshfail[*]}" else if [[ ${sshfail[*]} ]]; then ret=1 @@ -546,14 +701,6 @@ cat >/etc/btrbk$conf_suf.conf <>/etc/btrbk$conf_suf.conf <>/etc/btrbk$conf_suf.conf <>/etc/btrbk$conf_suf.conf <>/etc/btrbk$conf_suf.conf < 1 && tg_snap_count == orphan_mp_count )) + if (( tmp )) ; then + die "something went wrong checking orphans on $tg: for mountpoint ${mountpoints[$i]}, $orphan_mp_count" + fi + done +} + +if [[ $source ]]; then + for snap in $(ssh root@$source "shopt -s nullglob; ${snap_list_cmds[*]}"); do + source_snaps[$snap]=t + done + get-orphan-tg-snaps + tmp=$(( ${#orphan_tg_snaps[*]} >= 1 )) + if (( tmp )); then + d btrfs sub del ${orphan_tg_snaps[*]} + fi +else # we have targets + for tg in ${targets[@]}; do + tmp_str=$(ssh root@$tg "shopt -s nullglob; ${snap_list_cmds[*]}") + mapfile -t tg_snaps <<<"$tmp_str" + get-orphan-tg-snaps + tmp=$(( ${#orphan_tg_snaps[*]} >= 1 )) + if (( tmp )); then + d ssh root@$tg "btrfs sub del ${orphan_tg_snaps[*]}" + fi + done +fi + # todo: umount first to ensure we don't have any errors # todo: do some kill fuser stuff to make umount more reliable @@ -670,7 +867,7 @@ if $dry_run; then fi # -q and just using the syslog option seemed nice, # but it doesn't show when a send has a parent and when it doesn't. -m btrbk -c /etc/btrbk$conf_suf.conf $preserve_arg $verbose_arg $progress_arg $cmd_arg +logq btrbk -c /etc/btrbk$conf_suf.conf $preserve_arg $verbose_arg $progress_arg $cmd_arg if $early; then exit 0 @@ -699,24 +896,26 @@ for mp in "${mountpoints[@]}"; do subvols+=("${mp##*/}") done if [[ $source ]]; then - m mount-latest-subvol "${subvols[@]}" + d mount-latest-subvol "${subvols[@]}" else for tg in ${targets[@]}; do - m /a/exe/mount-latest-remote "$tg" "${subvols[@]}" || ret=$? + d /a/exe/mount-latest-remote "$tg" "${subvols[@]}" || ret=$? done fi +# todo, we get hostnames earlier, reuse that. if [[ $ret == 0 ]]; then for tg in ${targets[@]}; do h=$(ssh $tg hostname) if [[ $h == kd && $HOSTNAME == x3 && $HOSTNAME == "$MAIL_HOST" ]]; then - ssh root$tg systemctl --no-block start btrbk-spread + d ssh root@$tg 'btrbk-spread-wrap &>/dev/null