Last active
January 13, 2019 04:23
-
-
Save erincerys/3f51119f3b3229168744af0525eaaff8 to your computer and use it in GitHub Desktop.
Backup directories and directory listings to a LUKS container and sync everything to S3
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/bin/bash | |
## Description: | |
# Sync files to and create lists of directory contents in a LUKS container volume and upload it to S3 | |
# Good for periodic backup jobs | |
# Supports rate limiting, encryption in transit and at rest and file path exclusions | |
## Usage: | |
# bash $0 | |
## Dependencies | |
# Packages: | |
# - awscli | |
# - cryptsetup | |
# - gawk | |
# - sha256sum | |
# - grep | |
# - rsync | |
# Setup: | |
# - luks file container | |
# - configuration parameters below set properly | |
# - if this will be used in cron, youll need to set environment variables for awscli in the crontab | |
# WARNING: | |
# If you experience bitrot or otherwise encounter corruption, these is no detecting of this. | |
# You will overwrite the good data with the bad | |
# This can be mitigated by using versioning, either implemented through this script or enabled in the S3 bucket. | |
## --- | |
## Configuration | |
Debug=0 | |
# encrypted container | |
ScriptWorkingPath='/media/data/backups/syncops' | |
ContainerFileName='cloudsync.img' | |
ContainerFile="${ScriptWorkingPath}/${ContainerFileName}" | |
ContainerMapperName='cloudsync' | |
ContainerMountPath='/media/tmpcrypt' | |
ContainerKeyFile='/media/data/personal/keyfiles/cloudsync.pem' | |
RunFailedFile="${ScriptWorkingPath}/last_run_failed" | |
## Escape slashes and use globs in these file path arrays | |
# Path exclusions from objects within SourcePaths | |
ExcludedPaths=( \ | |
'tech/virtualmachines' \ | |
'tech/caches' \ | |
) | |
# Do not leave trailing slash on the end of directory sources | |
SourcePaths=( \ | |
'/media/raid/backups/configuration' \ | |
'/media/raid/backups/drive-order-in-case.txt' \ | |
'/media/raid/misc/papers' \ | |
'/media/raid/personal/text' \ | |
'/media/raid/personal/resumes' \ | |
'/media/raid/personal/keyfiles' \ | |
'/media/raid/personal/finances' \ | |
'/media/raid/personal/health' \ | |
'/media/raid/games/saves' \ | |
'/media/raid/tech' \ | |
'/media/raid/backups/Dropbox/Text/Markdown' \ | |
) | |
DestinationPath="${ContainerMountPath}/" | |
LogFile="${ScriptWorkingPath}/`date '+%Y%m%d'`.log" | |
# Pathes to create file lists for the contents of to be included in backup | |
FileListSources=( \ | |
'/media/raid/backups' \ | |
'/media/raid/misc/applications' \ | |
'/media/raid/misc/ebooks' \ | |
'/media/raid/music' \ | |
'/media/raid/video/anime' \ | |
'/media/raid/video/porn' \ | |
'/media/raid/games' \ | |
) | |
# Files to exclude when syncing to S3 - eg if anything else was uploaded there, we want to exclude it so its not deleted | |
S3ExcludedPaths=( \ | |
'education.tar.gz' \ | |
) | |
# SNS ARN for notifications | |
SnsTopic='arn:aws:sns:us-west-1:183912708525:Ian' | |
# awscli / s3cmd | |
AwsProfile='default' | |
#S3CmdConfigFile='/home/ian/.s3cfg' | |
AwsConfigFile='/home/ian/.aws/config' | |
AwsCredentialFile='/home/ian/.aws/credentials' | |
AwsRegion='us-west-1' | |
#ThrottleLimit=500 # how fast to upload the file to s3 in kilobytes | |
# s3 paths | |
S3BucketName='ians-backups' | |
S3Prefix='personal-workstation' | |
## awscli support rate limiting | |
## set this in ~/.aws/config if desired | |
## s3 = | |
## max_bandwidth = 500KB/s | |
AwsCliOptions="--storage-class=STANDARD_IA --profile=${AwsProfile} --region=${AwsRegion}" | |
#S3CmdOptions="--storage-class=STANDARD_IA --region=${AwsRegion} --config=${S3CmdConfigFile} --limit-rate=${ThrottleLimit}k" | |
## END CONFIGURATION | |
if [ $Debug -eq 1 ] ; then | |
AwsCliOptions="${AwsCliOptions} --debug" | |
#S3CmdOptions="${S3CmdOptions} --debug" | |
#else | |
# AwsCliOptions="${AwsCliOptions} --only-show-errors" | |
fi | |
## Stuf begins | |
# Configure environment vars for Aws CLI | |
#export AWS_DEFAULT_PROFILE=$AwsProfile | |
export AWS_CONFIG_FILE=$AwsConfigFile | |
export AWS_SHARED_CREDENTIALS_FILE=$AwsCredentialFile | |
function SnsPublication () { | |
local ErrorCode=$1 | |
if [ $ErrorCode -gt 0 ] ; then | |
local ScriptResultCode='Failure' | |
else | |
local ScriptResultCode='Success' | |
local ScriptPostMessage="Successfully synchronized file changes to S3. See $LogFile for incremental changes" | |
fi | |
if [ $ErrorCode -eq 1 ] ; then | |
local ScriptPostMessage="Failed to complete rsync operation." | |
elif [ $ErrorCode -eq 2 ] ; then | |
local ScriptPostMessage="Failed to copy to S3." | |
fi | |
# Publish to SNS topic to notify admin | |
aws sns publish \ | |
--region $AwsRegion \ | |
--topic-arn $SnsTopic \ | |
--subject "Workstation backup job notification ($ScriptResultCode)" \ | |
--message "$ScriptPostMessage" \ | |
2>&1 >> $LogFile | |
} | |
function CloseContainer () { | |
# Immediately flush pending cache writes to disk | |
sync -f ${ContainerMountPath} | |
# Unmount container | |
umount $ContainerMountPath | |
# Close container | |
cryptsetup luksClose $ContainerMapperName | |
} | |
# Open the crypted container | |
cryptsetup --key-file $ContainerKeyFile luksOpen $ContainerFile $ContainerMapperName | |
# Mount it | |
mount /dev/mapper/$ContainerMapperName $ContainerMountPath | |
# Assemble the one-liner | |
CommandPrefix="rsync --archive --delete --checksum --verbose --log-file=${LogFile}" | |
if [ $Debug -eq 1 ] ; then | |
CommandPrefix="${CommandPrefix} --msgs2stderr --debug=ALL" | |
fi | |
for e in "${ExcludedPaths[@]}" ; do | |
CommandExclusions="${CommandExclusions} --exclude=$e" | |
done | |
for i in "${SourcePaths[@]}" ; do | |
CommandSources="${CommandSources} $i" | |
done | |
Command="$CommandPrefix $CommandExclusions $CommandSources $DestinationPath" | |
# rsync | |
RsyncTempLog=`mktemp` | |
$Command 2>&1 > $RsyncTempLog | |
if [[ `grep -ic error $RsyncTempLog` -gt 0 ]] ; then | |
echo "There was an error. Check $LogFile for more info. Response is below." | |
echo $RsyncResponse | |
SnsPublication 2 | |
CloseContainer | |
exit 1 | |
fi | |
cat $RsyncTempLog >> $LogFile | |
# Create file list for each source | |
for fl in "${FileListSources[@]}" ; do | |
FlName=`echo $fl | grep -Po '[a-zA-Z_]+$'` | |
ls -Rla $fl 2>&1 > "${ScriptWorkingPath}/${FlName}.filelist" | |
done | |
# Get hash of container contents | |
ContainerFileList=`ls -Rla $ContainerMountPath` | |
ContainerChecksum=`echo $ContainerFileList | sha256sum | awk '{ print $1 }'` | |
ContainerChecksumFile="${ScriptWorkingPath}/${ContainerMapperName}.sha256sum" | |
[ -f ] ; mv $ContainerChecksumFile ${ContainerChecksumFile}.old | |
echo $ContainerChecksum > $ContainerChecksumFile | |
# if the container hash hasnt changed since last time, dont sync anything | |
if [[ \ | |
! -e $RunFailedFile \ | |
&& -e ${ContainerChecksumFile} \ | |
&& "$(cat ${ContainerChecksumFile}.old)" == "$ContainerChecksum" \ | |
]] ; then | |
echo "No changes since last sync!" | |
exit 0 | |
fi | |
# Sync working directory to S3 | |
# Effectively copies file lists but NOT container or logs | |
for el in "${S3ExcludedPaths[@]}" ; do | |
S3ExclusionArgs="${S3ExclusionArgs} --exclude ${el}" | |
done | |
AwsResponse=`aws s3 sync --exclude "*.log" --exclude "$ContainerFileName" ${S3ExclusionArgs} --size-only $AwsCliOptions $ScriptWorkingPath s3://${S3BucketName}/${S3Prefix}/ 2>&1` | |
AwsReturnCode=$? | |
echo $AwsResponse >> $LogFile | |
[ $AwsReturnCode -ne 0 ] && { echo 'Error copying file lists to S3!' >> $LogFile ; Errors=1 ; } | |
# Sync logfile | |
AwsResponse=`aws s3 cp $AwsCliOptions $LogFile s3://${S3BucketName}/${S3Prefix}/ 2>&1` | |
AwsReturnCode=$? | |
echo $AwsResponse >> $LogFile | |
[ $AwsReturnCode -ne 0 ] && { echo 'Error copying log file to S3!' >> $LogFile ; Errors=1 ; } | |
# Copy container, if necessary | |
if [[ \ | |
-e ${RunFailedFile} \ | |
|| ! -e ${ContainerChecksumFile} \ | |
|| "$(cat ${ContainerChecksumFile}.old)" != "$ContainerChecksum" \ | |
]] ; then | |
AwsTempLog=`mktemp` | |
# s3cmd $S3CmdOptions put ${ScriptWorkingPath}/${ContainerFileName} s3://${S3BucketName}/${S3Prefix}/ 2>&1 > $AwsTempLog | |
aws $AwsCliOptions s3 cp ${ScriptWorkingPath}/${ContainerFileName} s3://${S3BucketName}/${S3Prefix}/ 2>&1 > $AwsTempLog | |
AwsReturnCode=$? | |
echo $AwsResponse >> $LogFile | |
# Catch S3 errors | |
if [[ \ | |
$AwsReturnCode -ne 0 \ | |
|| `grep -Pic "(ERROR|(XAmzContentSHA256Mismatch|Error copying|BadDigest|Client error|stacktrace|unable|does not match MD5 checksum|exit status is '1')" $AwsTempLog` -gt 0 \ | |
]] ; then | |
echo 'Error copying container to S3!' >> $LogFile | |
echo "There were errors copying to S3. Review the log at ${LogFile}" | |
SnsPublication 2 | |
Errors=1 | |
fi | |
fi | |
CloseContainer | |
if [ "$Errors" == 1 ] ; then | |
touch ${RunFailedFile} | |
exit 1 | |
else | |
[ -e $RunFailedFile ] && rm $RunFailedFile | |
SnsPublication 0 | |
fi | |
echo 'All done successfully!' | |
exit 0 |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment