1
|
#!/bin/bash
|
2
|
|
3
|
#
|
4
|
# Backup files needed for metacat. This script creates a directory in /var/metacat/backup,
|
5
|
# backs up the postgres database, metacat data files, and certificate and web config files,
|
6
|
# then syncs those files to an Amazon S3 bucket for backup.
|
7
|
#
|
8
|
# To run this file, install it in /usr/sbin or a similar location and add an
|
9
|
# entry in the root user's crontab to run the command periodically. The
|
10
|
# following crontab entry would run it every night at 2:00 am
|
11
|
# 0 2 * * * /usr/sbin/backup-aws.sh >> $HOME/cron-output 2>&1
|
12
|
#
|
13
|
# This is really just an example script and may not work in your environment
|
14
|
# uless you modify it appropriately.
|
15
|
#
|
16
|
# 25 Apr 2017 Matt Jones
|
17
|
|
18
|
# Name of the metacat database in postgres to be backed up
|
19
|
DBNAME=metacat
|
20
|
|
21
|
# Number of days of backups to keep online, anything older is removed
|
22
|
DAYSTOKEEP=7
|
23
|
|
24
|
# AWS S3 bucket to be used for backup
|
25
|
BUCKET=s3://arcticdata.io/backup
|
26
|
|
27
|
# Location of the metacat.properties file
|
28
|
METACATPROPERTIESPATH=/var/lib/tomcat7/webapps/metacat/WEB-INF/metacat.properties
|
29
|
|
30
|
# Location of the apache configuration file
|
31
|
APACHECONF=/etc/apache2/sites-enabled
|
32
|
|
33
|
#Location of the server key
|
34
|
KEYLOCATION=/etc/ssl/private
|
35
|
|
36
|
#Location of the server certificate
|
37
|
CERTLOCATION=/etc/ssl/certs/www_arcticdata_io.crt
|
38
|
|
39
|
# Location of the AWS client utility
|
40
|
AWS=/usr/local/bin/aws
|
41
|
|
42
|
#
|
43
|
# Below here lie demons
|
44
|
#
|
45
|
|
46
|
# Set up our umask to protect files from prying eyes
|
47
|
umask 007
|
48
|
|
49
|
# Make a temp dir for the backed up files
|
50
|
TAG=`date +%F-%H%M%S`
|
51
|
DATADIR="/var/metacat"
|
52
|
ARCHROOT="/var/metacat/metacat-backup"
|
53
|
mkdir -p $ARCHROOT
|
54
|
chgrp postgres $ARCHROOT
|
55
|
chmod g+rwxs $ARCHROOT
|
56
|
|
57
|
ARCHDIR="$ARCHROOT"
|
58
|
mkdir -p $ARCHDIR
|
59
|
|
60
|
# Locations of file lists already archived
|
61
|
DATALIST=${ARCHDIR}/data-list
|
62
|
METALIST=${ARCHDIR}/meta-list
|
63
|
|
64
|
# Shut down the tomcat server so nobody else changes anything while we backup
|
65
|
#/etc/init.d/tomcat7 stop
|
66
|
|
67
|
echo Generate a list of new metadata files since the last backup
|
68
|
if [ ! -e ${METALIST} ];
|
69
|
then
|
70
|
$AWS s3 ls ${BUCKET}/documents/ |awk -F" " '{print $4}' > ${METALIST}
|
71
|
fi
|
72
|
diff --old-line-format="" --unchanged-line-format="" <(sort ${METALIST}) <(ls -1 ${DATADIR}/documents | sort) > ${METALIST}-new
|
73
|
|
74
|
echo Generate a list of new data files since the last backup
|
75
|
if [ ! -e ${DATALIST} ];
|
76
|
then
|
77
|
$AWS s3 ls ${BUCKET}/data/ |awk -F" " '{print $4}' > ${DATALIST}
|
78
|
fi
|
79
|
diff --old-line-format="" --unchanged-line-format="" <(sort ${DATALIST}) <(ls -1 ${DATADIR}/data | sort) > ${DATALIST}-new
|
80
|
|
81
|
echo Copy the metacat.properties file to /var/metacat
|
82
|
cp $METACATPROPERTIESPATH $ARCHDIR
|
83
|
|
84
|
echo Backup postgres
|
85
|
su - postgres -c "pg_dumpall | gzip > $ARCHDIR/metacat-postgres-backup.gz"
|
86
|
|
87
|
echo Copy the apache configuration files
|
88
|
tar czhf $ARCHDIR/apache-config-backup.tgz $APACHECONF $KEYLOCATION $CERTLOCATION
|
89
|
|
90
|
echo Sync the backup directory to Amazon S3
|
91
|
echo Handle each of the subdirectories independently
|
92
|
$AWS s3 sync $DATADIR/certs $BUCKET/certs
|
93
|
$AWS s3 sync $DATADIR/dataone $BUCKET/dataone
|
94
|
$AWS s3 sync $DATADIR/inline-data $BUCKET/inline-data
|
95
|
$AWS s3 sync $DATADIR/logs $BUCKET/logs
|
96
|
$AWS s3 sync $DATADIR/.metacat $BUCKET/.metacat
|
97
|
$AWS s3 sync $DATADIR/metacat-backup $BUCKET/metacat-backup
|
98
|
#$AWS s3 sync $DATADIR/solr-home $BUCKET/solr-home
|
99
|
#$AWS s3 sync $DATADIR/tdb $BUCKET/tdb
|
100
|
#$AWS s3 sync $DATADIR/temporary $BUCKET/temporary
|
101
|
|
102
|
echo Backup metadata files to S3
|
103
|
cat ${METALIST}-new | xargs -n1 -P30 -I {} $AWS s3 cp ${DATADIR}/documents/{} $BUCKET/documents/{}
|
104
|
cat ${METALIST}-new >> ${METALIST}
|
105
|
|
106
|
echo Backup data files to S3
|
107
|
cat ${DATALIST}-new | xargs -n1 -P30 -I {} $AWS s3 cp ${DATADIR}/data/{} $BUCKET/data/{}
|
108
|
cat ${DATALIST}-new >> ${DATALIST}
|
109
|
|
110
|
# Restart tomcat
|
111
|
#/etc/init.d/tomcat7 start
|
112
|
|
113
|
# Clean up the temp files
|
114
|
#rm -rf $ARCHDIR
|
115
|
|
116
|
# clean up any of the backup files that are older than DAYSTOKEEP
|
117
|
#find $ARCHROOT -mtime +$DAYSTOKEEP -exec rm -f {} \;
|
118
|
|
119
|
echo "DONE backup for $TAG"
|
120
|
|