ccollect/ccollect.sh

342 lines
6.7 KiB
Bash
Raw Permalink Normal View History

2005-11-17 11:33:49 +00:00
#!/bin/sh
# Nico Schottelius
# written for SyGroup (www.sygroup.ch)
# Date: Mon Nov 14 11:45:11 CET 2005
# Last Modified: (See ls -l or git)
#

#
# where to find our configuration and temporary file
#
# CCOLLECT_CONF may be preset in the environment; /etc/ccollect is the default.
#
CCOLLECT_CONF=${CCOLLECT_CONF:-/etc/ccollect}
CSOURCES=$CCOLLECT_CONF/sources
CDEFAULTS=$CCOLLECT_CONF/defaults

# our own name, used in messages and as prefix of the temporary file
WE=$(basename "$0")

TMP=$(mktemp "/tmp/$WE.XXXXXX") || {
   echo "$WE: could not create temporary file" >&2
   exit 1
}

#
# unset parallel execution
#
PARALLEL=""

#
# Remove the temporary file on every way out of the script (normal end,
# usage(), error exits) and turn the usual termination signals into a real
# exit, so that the cleanup runs and the script does not continue afterwards.
#
trap 'rm -f "$TMP"' EXIT
trap 'exit 1' HUP INT TERM
2005-11-17 11:33:49 +00:00
#
# Prefix every line read from stdin with "[$name] " and write it to stdout.
#
# Reads: name (global) - the source currently being processed
#
add_name()
{
   # "\", "/" and "&" are special in a sed replacement; escape them so that
   # a source name containing one of them is printed literally instead of
   # breaking the sed command.
   _an_prefix=$(printf '%s\n' "$name" | sed 's|[\\/&]|\\&|g')
   sed "s/^/[$_an_prefix] /"
}
#
# Tell how to use us
#
# Prints the help screen to stdout and ends the script with status 0.
# Reads: WE (program name), CSOURCES (directory named in the --all help line)
#
usage()
{
   cat << eof
$WE: <intervall name> [args] <sources to backup>

 Nico Schottelius (nico-linux-ccollect schottelius.org) - 2005-12-06

 Backup data pseudo incremental

 -h, --help: Show this help screen
 -p, --parallel: Parallelize backup process
 -a, --all: Backup all sources specified in $CSOURCES
 -v, --verbose: Be very verbose.

 Retrieve latest ccollect at http://linux.schottelius.org/ccollect/.

eof
   exit 0
}
#
# We cannot do anything useful with fewer than two arguments: the intervall
# plus either one source or --all. Show the help in that case.
#
[ $# -lt 2 ] && usage

#
# check for configuration directory
#
test -d "$CCOLLECT_CONF" || {
   echo "Configuration \"$CCOLLECT_CONF\" not found."
   exit 1
}
2005-12-06 12:45:37 +00:00
#
# Filter arguments
#
# parse_arguments <intervall> [options and sources ...]
#
# The first argument is the intervall name. Every following argument is
# either one of the options below or the name of a source to back up.
# After "--" everything is taken as a source name, even if it starts
# with a dash.
#
# Sets: INTERVALL            the intervall name
#       share_0 .. share_N   the source names, in the order given
#       no_shares            how many share_* variables are valid
#       ALL, VERBOSE, PARALLEL   set to 1 when the matching option was seen
#
parse_arguments()
{
   INTERVALL=$1
   if [ $# -gt 0 ]; then
      shift
   fi

   no_shares=0
   NO_MORE_ARGS=""

   # Iterating over "$@" (instead of building $1, $2, ... through eval)
   # also works for the tenth and later arguments, where "$10" would be
   # read as "${1}0".
   for arg in "$@"; do
      if [ "$NO_MORE_ARGS" != 1 ]; then
         case "$arg" in
            -a|--all)
               ALL=1
               continue
               ;;
            -v|--verbose)
               VERBOSE=1
               continue
               ;;
            -p|--parallel)
               PARALLEL="1"
               continue
               ;;
            -h|--help)
               usage
               continue
               ;;
            --)
               NO_MORE_ARGS=1
               continue
               ;;
         esac
      fi

      # Only the variable NAME is built by eval; the value is expanded
      # afterwards, so quotes, "$" or backticks in a source name stay
      # literal and are never executed.
      eval "share_${no_shares}=\$arg"
      no_shares=$((no_shares + 1))
   done
}

parse_arguments "$@"
2005-12-08 15:14:46 +00:00
#
# VERBOSE=1 (set by -v/--verbose) switches on shell tracing, so every
# command executed from here on is printed.
#
case "$VERBOSE" in
   1)
      set -x
      ;;
esac
2005-12-06 14:35:29 +00:00
#
# Look, if we should take ALL sources
#

#
# collect_all_sources: use every entry of $CSOURCES as a source.
#
# Reads: CSOURCES
# Sets:  share_0 .. share_N and no_shares; anything collected from the
#        command line before is discarded.
#
# The entries are found with a glob instead of "cd $CSOURCES; ls", so the
# working directory stays untouched (a relative $0 keeps working for the
# parallel re-invocation) and a missing $CSOURCES yields no sources rather
# than the content of whatever directory we happen to be in.
#
collect_all_sources()
{
   # reset everything specified before
   no_shares=0

   for _cas_path in "$CSOURCES"/*; do
      # an unmatched glob stays as the literal pattern: skip it
      # (-L keeps dangling symlinks, which ls would have listed too)
      [ -e "$_cas_path" ] || [ -L "$_cas_path" ] || continue

      _cas_name=${_cas_path##*/}
      # the value is expanded after eval built the variable name, so
      # special characters in a directory name stay literal
      eval "share_${no_shares}=\$_cas_name"
      no_shares=$((no_shares + 1))
   done
}

if [ "$ALL" = 1 ]; then
   collect_all_sources
fi
#
# Without a single source there is nothing to back up: show the help.
# usage() ends the script, so the banner below is only printed when we
# really start.
#
[ "$no_shares" -lt 1 ] && usage
echo "==> $WE: Beginning backup using intervall $INTERVALL <=="
#
# check default configuration
#
# D_INTERVALL holds the content of the default intervall file and stays
# empty when that file is missing or unreadable (the error is discarded).
# The path is quoted so that a configuration directory containing blanks
# is read as one file name.
#
D_FILE_INTERVALL="$CDEFAULTS/intervalls/$INTERVALL"
D_INTERVALL=$(cat "$D_FILE_INTERVALL" 2>/dev/null)
#
# Let's do the backup
#

#
# backup_source: back up the one source named by $name.
#
# Reads:   name, CSOURCES, INTERVALL, D_INTERVALL
# Outputs: progress and error messages on stdout (stderr is merged in)
# Returns: 0 on success, 1 if the source was skipped or the backup failed
#
# The function body is a subshell: "exit" only ends this one backup, and
# nothing that is set in here (variables, positional parameters, set -f,
# the stderr redirection) leaks into the main loop.
#
backup_source()
(
   #
   # Stderr to stdout, so we can produce nice logs
   #
   exec 2>&1

   #
   # Standard locations
   #
   backup="$CSOURCES/$name"
   c_source="$backup/source"
   c_dest="$backup/destination"
   c_exclude="$backup/exclude"
   c_verbose="$backup/verbose"
   c_rsync_extra="$backup/rsync_options"

   echo "Beginning to backup this source ..."

   #
   # Standard configuration checks
   #
   if [ ! -e "$backup" ]; then
      echo "Source does not exist."
      exit 1
   fi
   if [ ! -d "$backup" ]; then
      echo "\"$name\" is not a cconfig-directory. Skipping."
      exit 1
   fi

   #
   # intervall definition: First try source specific, fallback to default
   #
   c_intervall=$(cat "$backup/intervalls/$INTERVALL" 2>/dev/null)
   c_intervall=${c_intervall:-$D_INTERVALL}
   if [ -z "$c_intervall" ]; then
      echo "Default and source specific intervall missing. Skipping."
      exit 1
   fi

   #
   # next configuration checks
   #
   if [ ! -f "$c_source" ]; then
      echo "Source description $c_source is not a file. Skipping."
      exit 1
   fi
   if ! source=$(cat "$c_source"); then
      echo "Skipping: Source $c_source is not readable"
      exit 1
   fi
   if [ ! -d "$c_dest" ]; then
      echo "Destination $c_dest does not link to a directory. Skipping"
      exit 1
   fi

   #
   # optional rsync settings; each one stays empty if its file is missing
   #
   VERBOSE=""
   EXCLUDE=""
   RSYNC_EXTRA=""
   if [ -f "$c_exclude" ]; then
      EXCLUDE="--exclude-from=$c_exclude"
   fi
   if [ -f "$c_rsync_extra" ]; then
      RSYNC_EXTRA=$(cat "$c_rsync_extra")
   fi
   if [ -f "$c_verbose" ]; then
      VERBOSE="-v"
   fi

   #
   # check if maximum number of backups is reached, if so remove
   #
   # The created directories are named $INTERVALL.<date>.<pid>; the glob
   # returns them sorted by name, which puts the oldest date first.
   #
   set -- "$c_dest/${INTERVALL}."?*
   if [ ! -e "$1" ] && [ ! -L "$1" ]; then
      # nothing matched, the pattern itself was returned
      set --
   fi
   count=$#

   echo "Currently $count backup(s) exist, total keeping $c_intervall backup(s)."
   if [ "$count" -ge "$c_intervall" ]; then
      # Remove so many that, together with the backup created below,
      # exactly $c_intervall remain. Counting down with test(1) avoids
      # bc and treats a value like "08" as decimal.
      remove=0
      remaining=$count
      while [ "$remaining" -gt 0 ] && [ "$remaining" -ge "$c_intervall" ]; do
         remove=$((remove + 1))
         remaining=$((remaining - 1))
      done

      echo "Removing $remove backup(s)..."
      for dir in "$@"; do
         [ "$remove" -gt 0 ] || break
         echo "Removing $dir ..."
         rm -rf -- "$dir"
         remove=$((remove - 1))
      done
   fi

   #
   # clone the old directory with hardlinks
   #
   destination_date=$(date +%Y-%m-%d-%H:%M)
   destination_dir="$c_dest/${INTERVALL}.${destination_date}.$$"

   # newest backup that is left after the cleanup above (last in sort order)
   last_dir=""
   for dir in "$c_dest/${INTERVALL}."?*; do
      if [ -e "$dir" ] || [ -L "$dir" ]; then
         last_dir=$dir
      fi
   done

   # give some info
   echo "Beginning to backup, this may take some time..."

   # only copy if a directory exists
   if [ -n "$last_dir" ]; then
      echo "Hard linking..."
      cp -al ${VERBOSE:+"$VERBOSE"} "$last_dir" "$destination_dir"
      clone_status=$?
   else
      echo "Creating $destination_dir"
      mkdir "$destination_dir"
      clone_status=$?
   fi
   if [ "$clone_status" -ne 0 ]; then
      echo "Creating/cloning backup directory failed. Skipping backup."
      exit 1
   fi

   #
   # the rsync part
   # options partly stolen from rsnapshot
   #
   echo "Transferring files..."

   # Build the argument list in the positional parameters. rsync_options is
   # a whitespace separated list and must be split into words, but a
   # pattern in it (e.g. "--exclude *") must reach rsync unexpanded, hence
   # set -f. The exclude option is added as ONE word, whatever its path.
   set -f
   set -- -a
   if [ -n "$VERBOSE" ]; then
      set -- "$@" "$VERBOSE"
   fi
   # shellcheck disable=SC2086 -- word splitting is wanted here
   set -- "$@" $RSYNC_EXTRA
   if [ -n "$EXCLUDE" ]; then
      set -- "$@" "$EXCLUDE"
   fi

   if ! rsync "$@" \
         --delete --numeric-ids --relative --delete-excluded \
         "$source" "$destination_dir"; then
      echo "rsync failed, backup may be broken (see rsync errors)"
      exit 1
   fi

   echo "Successfully finished backup."
)

i=0
while [ "$i" -lt "$no_shares" ]; do
   #
   # Get current share
   #
   eval "name=\$share_${i}"
   i=$((i + 1))
   export name

   #
   # start ourself, if we want parallel execution
   # ("--" makes sure the name is taken as a source, never as an option)
   #
   if [ "$PARALLEL" ]; then
      "$0" "$INTERVALL" -- "$name" &
      continue
   fi

   #
   # every line of the backup log gets the source name in front
   #
   backup_source | add_name
done
2005-12-06 14:55:07 +00:00
2005-12-06 16:08:38 +00:00
#
# In parallel mode the backups run as background jobs of this shell;
# do not finish before all of them have ended.
#
[ -z "$PARALLEL" ] || {
   echo "Waiting for child jobs to complete..."
   wait
}

# the temporary file is not needed any longer
rm -f "$TMP"

echo "==> Finished $WE <=="