Skip to content

Commit

Permalink
feat: d4g-s3-backup Docker image
Browse files Browse the repository at this point in the history
  • Loading branch information
pagbrl committed Dec 18, 2023
1 parent ccf6762 commit e38a639
Show file tree
Hide file tree
Showing 6 changed files with 301 additions and 53 deletions.
1 change: 1 addition & 0 deletions .dockerignore
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
.DS_Store
38 changes: 38 additions & 0 deletions .github/workflows/main.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,38 @@
name: main

on:
push:
branches:
- main

env:
REGISTRY: ghcr.io
IMAGE_NAME: ${{ github.repository }}

jobs:
main:
runs-on: ubuntu-latest
steps:
- name: Checkout
uses: actions/checkout@v2
- name: Set up QEMU
uses: docker/setup-qemu-action@v1
- name: Set up Docker Buildx
uses: docker/setup-buildx-action@v1
- name: Log in to the Container registry
uses: docker/login-action@65b78e6e13532edd9afa3aa52ac7964289d1a9c1
with:
registry: ${{ env.REGISTRY }}
username: ${{ github.actor }}
password: ${{ secrets.GITHUB_TOKEN }}
- name: Extract metadata (tags, labels) for Docker
id: meta
uses: docker/metadata-action@9ec57ed1fcdbf14dcef7dfbe97b2010124a938b7
with:
images: ${{ env.REGISTRY }}/${{ env.IMAGE_NAME }}
- name: Run Buildx
run: |
docker buildx build \
--push \
--platform=linux/amd64,linux/arm64,linux/armhf \
-t ${{ env.REGISTRY }}/${{ env.IMAGE_NAME }}:latest -f ./Dockerfile ./
53 changes: 1 addition & 52 deletions .gitignore
Original file line number Diff line number Diff line change
@@ -1,52 +1 @@
# Prerequisites
*.d

# Object files
*.o
*.ko
*.obj
*.elf

# Linker output
*.ilk
*.map
*.exp

# Precompiled Headers
*.gch
*.pch

# Libraries
*.lib
*.a
*.la
*.lo

# Shared objects (inc. Windows DLLs)
*.dll
*.so
*.so.*
*.dylib

# Executables
*.exe
*.out
*.app
*.i*86
*.x86_64
*.hex

# Debug files
*.dSYM/
*.su
*.idb
*.pdb

# Kernel Module Compile Results
*.mod*
*.cmd
.tmp_versions/
modules.order
Module.symvers
Mkfile.old
dkms.conf
.DS_Store
10 changes: 10 additions & 0 deletions Dockerfile
Original file line number Diff line number Diff line change
@@ -0,0 +1,10 @@
FROM debian:sid-slim

LABEL org.opencontainers.image.source = "https://github.com/dataforgoodfr/d4g-s3cmd"
LABEL org.opencontainers.image.authors = "Data For Good"

RUN apt update && apt install -y s3cmd && apt clean

ADD ./entrypoint.sh /opt/entrypoint.sh

ENTRYPOINT ["/opt/entrypoint.sh"]
13 changes: 12 additions & 1 deletion README.md
Original file line number Diff line number Diff line change
@@ -1,2 +1,13 @@
# d4g-s3cmd
s3cmd Dockerizing for dataforgood

This repository is an attempt at creating a standard Docker image for our use of `s3cmd` at @dataforgoodfr.

The result is a lightweight image that can be configured fully with environment variables.
We use Scaleway so some configuration is tailored to their platform (notably the `host_base` and `host_bucket` configurations).

## Usage
Usage is documented in-script, to display the help menu use

```
docker run -it --rm ghcr.io/dataforgoodfr/d4g-s3cmd:latest help
```
239 changes: 239 additions & 0 deletions entrypoint.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,239 @@
#!/usr/bin/env bash
set -Eeuo pipefail

trap cleanup SIGINT SIGTERM ERR EXIT

usage() {
cat <<EOF
USAGE docker run -it --rm -v /var/data:/data -v /opt/backups:/backups ghcr.io/dataforgoodfr/d4g-s3-backup \\
[--access-key="<access_key>"] \\
[--secret-key="<secret_key>"] \\
[--bucket-name="backups"] \\
[--host-base="%(bucket)s.s3.fr-par.scw.cloud"] \\
[--data-dir="/data"] \\
[--backups-dir="/backups"] \\
[--service-name="service"] \\
[--retention-days=30] \\
[--bucket-region="fr-par"] \\
[--prom-metrics] \\
[--debug] \\
[--help]
Create backups for a specific dir easily and sync them to an s3 compatible bucket.
This script also supports publishing prometheu-compatible metrics through the Textfile Collector.
Data from <data_dir> will be backed up to <backups-dir>/<service-name>/<service-name>-$(date +%Y-%m-%d).tar.gz
Files will be keps around for <retention-days> days.
Files will be synced to s3 under s3://<bucket-name>/<service-name> using supplied credentials and configuration.
Supported parameters :
-h, --help : display this message
--debug : Print configuration before running (Optional)
--access-key : AWS access key (Required)
--secret-key : AWS secret key (Required)
--bucket-name : name of the bucket to sync backups to (Optional, Default backups)
--data-dir : directory to backup (Optional, Default ./data)
--service-name : name of the service to backup (Optional, Default service)
--backups-dir : backups root directory where will be stored (Optional, Default /opt/backups/)
--host-base : S3 host base (Optional, Default %(bucket)s.s3.fr-par.scw.cloud)
--bucket-region : S3 bucket region (Optional, Default fr-par)
--retention-days : number of days to keep backups (Default 30)
--prom-metrics : enable prometheus metrics (Default false)
EOF
exit 1
}

cleanup() {
trap - SIGINT SIGTERM ERR EXIT
if [ "$PROM_METRICS" == "true" ]; then
write_metrics
fi
exit 0
}

function write_metrics() {
# Write out metrics to a temporary file.
END="$(date +%s)"
# Last successful timestamp is now
TIMESTAMP="$END"
if [ "$FAILURE" != 0 ]; then
TIMESTAMP="0"
fi
cat << EOF > "$TEXTFILE_COLLECTOR_DIR/${SERVICE_NAME}_backup.prom.$$"
# HELP ${SERVICE_NAME}_backup_duration Duration of the planned ${SERVICE_NAME} backup
# TYPE ${SERVICE_NAME}_backup_duration counter
${SERVICE_NAME}_backup_duration $((END - START))
# HELP ${SERVICE_NAME}_backup_failure Result of the planned ${SERVICE_NAME} backup
# TYPE ${SERVICE_NAME}_backup_failure gauge
${SERVICE_NAME}_backup_failure $FAILURE
# HELP ${SERVICE_NAME}_backup_last_time Timestamp of last successful backup
# TYPE ${SERVICE_NAME}_backup_last_time gauge
${SERVICE_NAME}_backup_last_time $TIMESTAMP
EOF

# Rename the temporary file atomically.
# This avoids the node exporter seeing half a file.
mv "$TEXTFILE_COLLECTOR_DIR/${SERVICE_NAME}_backup.prom.$$" \
"$TEXTFILE_COLLECTOR_DIR/${SERVICE_NAME}_backup.prom"
}

setup_colors() {
if [[ -t 2 ]] && [[ -z "${NO_COLOR-}" ]] && [[ "${TERM-}" != "dumb" ]]; then
# shellcheck disable=SC2034
NOCOLOR='\033[0m' RED='\033[0;31m' GREEN='\033[0;32m' ORANGE='\033[0;33m' BLUE='\033[0;34m' PURPLE='\033[0;35m' CYAN='\033[0;36m' YELLOW='\033[1;33m'
else
echo "coucou"
NOCOLOR='' RED='' GREEN='' ORANGE='' BLUE='' PURPLE='' CYAN='' YELLOW=''
fi
}

info() {
echo -e "${GREEN}$*${NOCOLOR}"
}

error() {
echo -e "${RED}$*${NOCOLOR}"
}

debug() {
if [ "$DEBUG" == 'true' ]; then
echo -e "$1"
fi
}

parse_params() {
if [ $# -gt 12 ]; then
echo "Too many parameters provided"
usage
fi

# Internal variables
FAILURE=1
START="$(date +%s)"

# Sane defaults
DEBUG="false"
DATA_DIR="/data"
SERVICE_NAME="app"
BACKUPS_DIR="/backups"
BUCKET_NAME="backups"
HOST_BASE="%(bucket)s.s3.fr_par.scw.cloud"
BUCKET_REGION="fr-par"
RETENTION_DAYS="30"
PROM_METRICS="false"
ACCESS_KEY=""
SECRET_KEY=""

while :; do
case "${1-}" in
-h | --help)
usage
;;
--debug)
DEBUG="true"
;;
--access-key=*)
ACCESS_KEY="${1#*=}"
shift
;;
--secret-key=*)
SECRET_KEY="${1#*=}"
shift
;;
--data-dir=*)
DATA_DIR="${1#*=}"
shift
;;
--service-name=*)
SERVICE_NAME="${1#*=}"
shift
;;
--backups-dir=*)
BACKUPS_DIR="${1#*=}"
shift
;;
--bucket-name=*)
BUCKET_NAME="${1#*=}"
shift
;;
--host-base=*)
HOST_BASE="${1#*=}"
shift
;;
--bucket-region=*)
BUCKET_REGION="${1#*=}"
shift
;;
--retention-days=*)
RETENTION_DAYS="${1#*=}"
shift
;;
--prom-metrics*)
PROM_METRICS="true"
shift
;;
-?*)
echo "Unknown option: $1"
usage
;;
*)
break
;;
esac
shift
done

# Validate required parameters
if [ -z "${ACCESS_KEY}" ]; then
error "Missing required parameter: --access-key"
usage
fi
if [ -z "${SECRET_KEY}" ]; then
error "Missing required parameter: --secret-key"
usage
fi

return 0
}


# Create the s3 configuration
create_s3_config() {
echo "" >> /.s3cfg
echo "use_https = True" >> /.s3cfg
echo "access_key = ${ACCESS_KEY}" >> /.s3cfg
echo "secret_key = ${SECRET_KEY}" >> /.s3cfg
if [ -z "${HOST_BASE}" ]; then
echo "host_base = ${HOST_BASE}" >> /.s3cfg
fi
if [ -z "${HOST_BUCKET}" ]; then
echo "host_bucket = ${HOST_BUCKET}" >> /.s3cfg
fi
if [ -z "${BUCKET_REGION}" ]; then
echo "bucket_location = ${BUCKET_REGION}" >> /.s3cfg
fi

debug "S3 configuration :"
debug "$(cat /.s3cfg)"
}

setup_colors
parse_params "$@"
create_s3_config

# Create backup directory for service if it doesn't exist.
mkdir -p "${BACKUPS_DIR}/${SERVICE_NAME}"

# Cleanup backups that are older than RETENTION_DAYS days
find "$BACKUPS_DIR/${SERVICE_NAME}" -type f -name "${SERVICE_NAME}-*.tar.gz" -mtime +"$RETENTION_DAYS" -exec rm -f {} \;

cd $DATA_DIR
tar -czf "${BACKUPS_DIR}/${SERVICE_NAME}-$(date +%Y-%m-%d).tar.gz" ./

/opt/s3cmd/s3cmd --config=/.s3cfg sync "${BACKUPS_DIR}/${SERVICE_NAME}" "s3://${BUCKET_NAME}/${SERVICE_NAME}"
FAILURE=0

info "Backup completed successfully."
if [ "$PROM_METRICS" == "true" ]; then
write_metrics
fi

0 comments on commit e38a639

Please sign in to comment.