#!/bin/sh
# Nico Schottelius
# Initially written for SyGroup (www.sygroup.ch)
# Date: Mon Nov 14 11:45:11 CET 2005
# Last Modified: (See ls -l or git)
#
# where to find our configuration and temporary file
#
CCOLLECT_CONF=${CCOLLECT_CONF:-/etc/ccollect}
CSOURCES="${CCOLLECT_CONF}/sources"
CDEFAULTS="${CCOLLECT_CONF}/defaults"
CPREEXEC="${CDEFAULTS}/pre_exec"
CPOSTEXEC="${CDEFAULTS}/post_exec"

#
# Scratch file used for directory listings further down. Abort right away
# if it cannot be created: an empty ${TMP} would make every later
# redirection ("> ${TMP}", "< ${TMP}") fail.
#
TMP=$(mktemp "/tmp/$(basename "$0").XXXXXX") || {
   echo "$(basename "$0"): creating the temporary file failed, aborting." >&2
   exit 1
}

VERSION=0.6
RELEASE="2007-08-16/17"
HALF_VERSION="ccollect ${VERSION}"
FULL_VERSION="ccollect ${VERSION} (${RELEASE})"

#
# CDATE: how we use it for naming of the archives
# DDATE: how the user should see it in our output (DISPLAY)
# Both hold a command line that is executed via $(${CDATE}) / $(${DDATE}).
#
CDATE="date +%Y%m%d-%H%M"
DDATE="date +%Y-%m-%d-%H:%M:%S"

#
# unset parallel execution
#
PARALLEL=""

#
# catch signals (HUP, INT, TERM): remove the temporary file.
# Single quotes: ${TMP} is expanded when the trap fires, so unusual
# characters in the path cannot break the trap command.
# NOTE(review): the handler does not exit, so the script keeps running
# after the signal - confirm that this is intended.
#
trap 'rm -f "${TMP}"' 1 2 15
#
# Functions
#
# time displaying echo
#
# Print a message prefixed with the current time.
#
# Arguments: the words of the message (joined with single spaces)
# Globals:   DDATE - command line that prints the timestamp
# Output:    "<timestamp>:  <message>" on stdout
#
_techo()
{
   # printf instead of echo: the message is printed verbatim, even if it
   # contains backslashes or starts with something that looks like an option
   printf '%s\n' "$(${DDATE}):  $*"
}
#
# exit on error: print the given message through _techo, remove the
# temporary file ${TMP} and terminate the current (sub)shell with status 1
#
_exit_err()
{
   _techo "$@"
   rm -f "${TMP}"
   exit 1
}
#
# Filter: prefix every line read from stdin with "[<name>] ".
#
# Globals: name - label to put between the brackets
#
# The label is handed to awk through the environment and printed with %s,
# so characters such as ':', '&' or '\' in ${name} are copied literally
# (they used to be interpreted as part of a sed expression).
#
add_name()
{
   CCOLLECT_LABEL="${name}" \
      awk '{ printf "[%s] %s\n", ENVIRON["CCOLLECT_LABEL"], $0 }'
}
#
# Tell how to use us: print the help text to stdout and exit with status 0
#
# Globals: CSOURCES, VERSION, RELEASE (only shown in the text)
#
usage()
{
   cat << eof
$(basename "$0"): <interval name> [args] <sources to backup>

 ccollect creates (pseudo) incremental backups

 -h, --help: Show this help screen
 -p, --parallel: Parallelise backup processes
 -a, --all: Backup all sources specified in ${CSOURCES}
 -v, --verbose: Be very verbose (uses set -x)

 This is version ${VERSION}, released on ${RELEASE}
 (the first version was written on 2005-12-05 by Nico Schottelius).

 Retrieve latest ccollect at http://unix.schottelius.org/ccollect/
eof
   exit 0
}
#
# need at least interval and one source or --all
#
if [ "$#" -lt 2 ]; then
   usage
fi

#
# check for configuration directory
#
if [ ! -d "${CCOLLECT_CONF}" ]; then
   # both strings belong to ONE _exit_err call; they are printed joined
   # by a space
   _exit_err "No configuration found in " \
      "\"${CCOLLECT_CONF}\" (is \$CCOLLECT_CONF properly set?)"
fi
#
# Filter arguments: the first one is always the interval name
#
export INTERVAL="$1"; shift

#
# Create source "array"
#
# Walks over the given arguments. Options set ALL, VERBOSE or PARALLEL
# to 1, -h/--help calls usage, and "--" turns every following argument
# into a source name. Sources are stored in source_0, source_1, ... and
# exported, so that programs started by ccollect can see them; no_sources
# holds their number.
#
_parse_source_args()
{
   no_sources=0
   # start from a known state instead of whatever the environment holds
   NO_MORE_ARGS=""

   while [ "$#" -ge 1 ]; do
      arg="$1"; shift

      if [ "${NO_MORE_ARGS}" = 1 ]; then
         is_source=1
      else
         is_source=0
         case "${arg}" in
            -a|--all)
               ALL=1
               ;;
            -v|--verbose)
               VERBOSE=1
               ;;
            -p|--parallel)
               PARALLEL=1
               ;;
            -h|--help)
               usage
               ;;
            --)
               NO_MORE_ARGS=1
               ;;
            *)
               is_source=1
               ;;
         esac
      fi

      if [ "${is_source}" = 1 ]; then
         # the escaped \${arg} is expanded by eval itself, so the value is
         # assigned verbatim (quotes, '$' and backticks are not re-parsed)
         eval "source_${no_sources}=\"\${arg}\""
         # export BEFORE incrementing: make this very variable available
         # for subscripts
         eval "export source_${no_sources}"
         no_sources=$((${no_sources}+1))
      fi
   done
}

_parse_source_args "$@"

# everything is stored in source_N now; the rsync argument list is built
# on top of "$@" later on, so the positional parameters must be empty
set --

# also export number of sources
export no_sources
#
# be really, really, really verbose: -v/--verbose switches on shell
# tracing for the rest of the run
#
if [ "${VERBOSE}" = 1 ]; then
   set -x
fi
#
# Look, if we should take ALL sources
#
# _collect_all_sources throws away every source given on the command line
# and replaces the list with one entry per name found in ${CSOURCES}
# (source_0 ... source_N, count in no_sources). ${TMP} is used to hold
# the listing.
#
_collect_all_sources()
{
   # reset everything specified before
   no_sources=0

   #
   # get entries from sources; the subshell keeps our working directory
   #
   ( cd "${CSOURCES}" && ls > "${TMP}" ); ret=$?

   [ "${ret}" -eq 0 ] || _exit_err "Listing of sources failed. Aborting."

   # IFS= / -r: keep blanks and backslashes of the names as they are
   while IFS= read -r tmp; do
      # \${tmp} is expanded by eval, so the name is stored verbatim
      eval "source_${no_sources}=\"\${tmp}\""
      no_sources=$((${no_sources}+1))
   done < "${TMP}"
}

if [ "${ALL}" = 1 ]; then
   _collect_all_sources
fi
#
# Need at least ONE source to backup (usage does not return)
#
if [ "${no_sources}" -lt 1 ]; then
   usage
fi
_techo "${HALF_VERSION}: Beginning backup using interval ${INTERVAL}"

#
# Look for pre-exec command (general): run it once before all sources
# and give up completely, if it fails
#
if [ -x "${CPREEXEC}" ]; then
   _techo "Executing ${CPREEXEC} ..."
   "${CPREEXEC}"; ret=$?
   _techo "Finished ${CPREEXEC}."

   if [ "${ret}" -ne 0 ]; then
      # both strings belong to ONE _exit_err call
      _exit_err "${CPREEXEC} exited with return code ${ret}" \
         ", aborting backup."
   fi
fi

#
# check default configuration: the default for the interval may be
# missing (D_INTERVAL is empty then), a source can still define its own
#
D_FILE_INTERVAL="${CDEFAULTS}/intervals/${INTERVAL}"
D_INTERVAL=$(cat "${D_FILE_INTERVAL}" 2>/dev/null)
#
# Back up the single source ${name}.
#
# The function body is a subshell "( ... )": _exit_err only aborts the
# current source, nothing set in here leaks into the next source, and
# stderr can be merged into stdout to produce nice logs.
#
# Globals read: name, CSOURCES, INTERVAL, D_INTERVAL, CDATE, TMP
# Output:       progress and error messages on stdout
# Returns:      1 if the source was skipped via _exit_err
#
_backup_source()
(
   #
   # Stderr to stdout, so we can produce nice logs
   #
   exec 2>&1

   # the rsync argument list is collected in "$@", start with an empty one
   set --

   #
   # Configuration
   #
   backup="${CSOURCES}/${name}"
   c_source="${backup}/source"
   c_dest="${backup}/destination"
   c_exclude="${backup}/exclude"
   c_verbose="${backup}/very_verbose"
   c_verbose="${backup}/verbose"
   c_vverbose="${backup}/very_verbose"
   c_rsync_extra="${backup}/rsync_options"
   c_summary="${backup}/summary"
   c_pre_exec="${backup}/pre_exec"
   c_post_exec="${backup}/post_exec"
   # TODO: nothing reads this path yet, incomplete backups are only reported
   c_incomplete="${backup}/delete_incomplete"

   #
   # Times
   #
   c_marker=".ccollect-$(${CDATE}).$$"
   begin_s=$(date +%s)

   _techo "Beginning to backup"

   #
   # Standard configuration checks
   #
   if [ ! -e "${backup}" ]; then
      _exit_err "Source does not exist."
   fi

   #
   # configuration _must_ be a directory
   #
   if [ ! -d "${backup}" ]; then
      _exit_err "\"${name}\" is not a cconfig-directory. Skipping."
   fi

   #
   # first execute pre_exec, which may generate destination or other
   # parameters
   #
   if [ -x "${c_pre_exec}" ]; then
      _techo "Executing ${c_pre_exec} ..."
      "${c_pre_exec}"; ret="$?"
      _techo "Finished ${c_pre_exec} (return code ${ret})."

      if [ "${ret}" -ne 0 ]; then
         _exit_err "${c_pre_exec} failed. Skipping."
      fi
   fi

   #
   # interval definition: First try source specific, fallback to default
   #
   c_interval="$(cat "${backup}/intervals/${INTERVAL}" 2>/dev/null)"

   if [ -z "${c_interval}" ]; then
      c_interval="${D_INTERVAL}"

      if [ -z "${c_interval}" ]; then
         _exit_err "No definition for interval \"${INTERVAL}\" found. Skipping."
      fi
   fi

   #
   # Source checks
   #
   if [ ! -f "${c_source}" ]; then
      _exit_err "Source description \"${c_source}\" is not a file. Skipping."
   else
      source=$(cat "${c_source}"); ret=$?
      if [ "${ret}" -ne 0 ]; then
         _exit_err "Source ${c_source} is not readable. Skipping."
      fi
   fi

   #
   # destination _must_ be a directory
   #
   if [ ! -d "${c_dest}" ]; then
      _exit_err "Destination ${c_dest} is not a directory. Skipping."
   fi

   #
   # NEW method as of 0.6: collect the rsync arguments in "$@"
   # - insert ccollect default parameters
   # - insert options
   # - insert user options
   #

   #
   # rsync standard options
   #
   set -- "$@" "--archive" "--delete" "--numeric-ids" "--relative" \
      "--delete-excluded" "--sparse"

   #
   # exclude list
   #
   if [ -f "${c_exclude}" ]; then
      set -- "$@" "--exclude-from=${c_exclude}"
   fi

   #
   # Output a summary
   #
   if [ -f "${c_summary}" ]; then
      set -- "$@" "--stats"
   fi

   #
   # Verbosity for rsync
   #
   if [ -f "${c_vverbose}" ]; then
      set -- "$@" "-vv"
   elif [ -f "${c_verbose}" ]; then
      set -- "$@" "-v"
   fi

   #
   # extra options for rsync provided by the user: one parameter per line
   # (a last line without newline is used as well, empty lines are skipped
   # so that rsync never receives an empty argument)
   #
   if [ -f "${c_rsync_extra}" ]; then
      while read -r line || [ -n "${line}" ]; do
         [ -n "${line}" ] || continue
         set -- "$@" "${line}"
      done < "${c_rsync_extra}"
   fi

   #
   # Check for incomplete backups: a backup directory that still contains
   # a .ccollect-* marker was not finished
   #
   for marker in "${c_dest}/${INTERVAL}"*/.ccollect-*; do
      # an unmatched pattern stays as it is and does not exist
      [ -e "${marker}" ] || continue
      echo "${marker%/*} is incomplete"
   done

   #
   # Show the existing backups of this interval
   #
   ( cd "${c_dest}" && ls -dp1 "${INTERVAL}".* > "${TMP}" 2>/dev/null )
   while read -r old; do
      echo "Found ${old}"
   done < "${TMP}"

   #
   # check if maximum number of backups is reached, if so remove
   #
   count=$(cd "${c_dest}" && ls -p1 | grep -c "^${INTERVAL}\..*/\$")
   if [ -z "${count}" ]; then
      _exit_err "Counting backups in ${c_dest} failed. Skipping."
   fi
   _techo "Existing backups: ${count} Total keeping backups: ${c_interval}"

   if [ "${count}" -ge "${c_interval}" ]; then
      # keep (c_interval - 1) old backups, the new one completes the set
      substract=$((${c_interval} - 1))
      remove=$((${count} - ${substract}))
      echo "Removing ${remove} backup(s)..."

      ls -d "${c_dest}/${INTERVAL}."?* | sort -n | head -n "${remove}" > "${TMP}"

      while read -r to_remove; do
         echo "Removing ${to_remove} ..."
         # :? refuses to run rm -rf with an empty path
         rm -rf "${to_remove:?}"
      done < "${TMP}"
   fi

   #
   # the new backup directory
   #
   destination_date=$(${CDATE})
   destination_dir="${c_dest}/${INTERVAL}.${destination_date}.$$"

   #
   # clone the old directory with hardlinks: unchanged files are linked
   # against the newest existing backup of this interval (if there is one)
   #
   # FIXME: In 0.6 add search for the latest available backup!
   #
   last_dir=$(ls -d "${c_dest}/${INTERVAL}."?* 2>/dev/null | sort -n | tail -n 1)

   if [ -n "${last_dir}" ]; then
      # make an absolute path, perhaps $CCOLLECT_CONF is relative!
      abs_last_dir="$(cd "${last_dir}" && pwd -P)"
      if [ -z "${abs_last_dir}" ]; then
         _exit_err "Changing to the last backup directory failed. Skipping."
      fi
      set -- "$@" "--link-dest=${abs_last_dir}"
   fi

   # give some info
   echo "Beginning to backup, this may take some time..."
   echo "Creating ${destination_dir} ..."
   mkdir "${destination_dir}" || \
      _exit_err "Creating ${destination_dir} failed. Skipping."

   #
   # make an absolute path, perhaps $CCOLLECT_CONF is relative!
   #
   abs_destination_dir="$(cd "${destination_dir}" && pwd -P)"
   if [ -z "${abs_destination_dir}" ]; then
      _exit_err "Changing to ${destination_dir} failed. Skipping."
   fi

   #
   # added mark in 0.6: it exists only while the backup is running
   #
   touch "${abs_destination_dir}/${c_marker}"

   #
   # the rsync part
   # options partly stolen from rsnapshot
   #
   _techo "Transferring files..."
   rsync "$@" "${source}" "${abs_destination_dir}"; ret=$?

   if [ "${ret}" -ne 0 ]; then
      echo "Warning: rsync exited non-zero, the backup may be broken (see rsync errors)."
   fi

   #
   # remove marking here
   #
   rm -f "${abs_destination_dir}/${c_marker}"

   _techo "Finished backup (rsync return code: ${ret})."

   #
   # post_exec
   #
   if [ -x "${c_post_exec}" ]; then
      _techo "Executing ${c_post_exec} ..."
      "${c_post_exec}"; ret=$?
      _techo "Finished ${c_post_exec}."

      if [ "${ret}" -ne 0 ]; then
         _exit_err "${c_post_exec} failed."
      fi
   fi

   # Calculation of the duration
   end_s=$(date +%s)

   full_seconds=$((${end_s} - ${begin_s}))
   hours=$((${full_seconds} / 3600))
   seconds=$((${full_seconds} - (${hours} * 3600)))
   minutes=$((${seconds} / 60))
   seconds=$((${seconds} - (${minutes} * 60)))

   _techo "Backup lasted: ${hours}:${minutes}:${seconds} (h:m:s)"
)

#
# Let's do the backup
#
i=0
while [ "${i}" -lt "${no_sources}" ]; do
   #
   # Get current source
   #
   eval name=\"\$source_${i}\"
   i=$((${i}+1))

   export name

   #
   # start ourself, if we want parallel execution
   #
   if [ "${PARALLEL}" ]; then
      "$0" "${INTERVAL}" "${name}" &
      continue
   fi

   #
   # every line of the log is prefixed with the name of the source
   #
   _backup_source | add_name
done
#
# Be a good parent and wait for our children, if they are running wild parallel
#
if [ "${PARALLEL}" ]; then
   _techo "Waiting for child jobs to complete..."
   wait
fi

#
# Look for post-exec command (general): a failure is only reported,
# the backups are already done at this point
#
if [ -x "${CPOSTEXEC}" ]; then
   _techo "Executing ${CPOSTEXEC} ..."
   "${CPOSTEXEC}"; ret=$?
   _techo "Finished ${CPOSTEXEC}."

   if [ "${ret}" -ne 0 ]; then
      echo "${CPOSTEXEC} failed."
   fi
fi

rm -f "${TMP}"

# WE is not assigned anywhere in this script: fall back to our own name,
# so the final message is never just "Finished "
_techo "Finished ${WE:-$(basename "$0")}"