2021-12-10 11:53:00 +03:00
|
|
|
import datetime
|
2020-03-25 06:35:49 +05:30
|
|
|
import os
|
|
|
|
import time
|
|
|
|
from glob import glob
|
2021-12-10 11:53:00 +03:00
|
|
|
|
|
|
|
import boto3
|
2020-07-10 23:15:36 +05:30
|
|
|
from constants import DATE_FORMAT
|
2021-12-10 11:53:00 +03:00
|
|
|
from frappe.utils import get_sites
|
|
|
|
from utils import check_s3_environment_variables, get_s3_config, upload_file_to_s3
|
2020-03-25 22:25:24 +05:30
|
|
|
|
2020-04-29 01:45:59 +05:30
|
|
|
|
2020-03-25 06:35:49 +05:30
|
|
|
def get_file_ext():
    """Return the filename suffix used for each kind of backup artifact.

    Returns:
        dict: A new dict on every call, mapping the artifact type
        (``"database"``, ``"private_files"``, ``"public_files"``,
        ``"site_config"``) to the suffix its backup file name ends with.
    """
    suffix_by_type = (
        ("database", "-database.sql.gz"),
        ("private_files", "-private-files.tar"),
        ("public_files", "-files.tar"),
        ("site_config", "-site_config_backup.json"),
    )
    return dict(suffix_by_type)
|
|
|
|
|
2020-04-29 01:45:59 +05:30
|
|
|
|
2020-03-25 06:35:49 +05:30
|
|
|
def get_backup_details(sitename):
    """Describe the most recent local backup file of each type for a site.

    Searches ``<cwd>/<sitename>/private/backups/`` for regular files named
    ``*-<site_slug><suffix>``, where ``site_slug`` is ``sitename`` with dots
    replaced by underscores and the suffixes come from ``get_file_ext()``.

    Args:
        sitename: Name of the site directory below the current working
            directory.

    Returns:
        dict: One entry per backup type that has at least one matching file.
        Each value holds ``sitename``, ``file_size_in_bytes``, ``file_path``,
        ``filename`` and ``backup_date`` for the file with the highest
        ``st_ctime``. ``backup_date`` is that file's modification time in
        local time, formatted as ``"%Y-%m-%d %H:%M:%S"``. The dict is empty
        when the backup directory does not exist.
    """
    backup_details = {}

    # The trailing "" makes os.path.join end the path with a separator
    # (https://stackoverflow.com/a/15010678) so it can prefix the glob pattern.
    site_backup_path = os.path.join(os.getcwd(), sitename, "private", "backups", "")
    if not os.path.exists(site_backup_path):
        return backup_details

    site_slug = sitename.replace(".", "_")
    for filetype, ext in get_file_ext().items():
        pattern = site_backup_path + "*-" + site_slug + ext
        backup_files = [path for path in glob(pattern) if os.path.isfile(path)]
        if not backup_files:
            continue

        # glob() already returns full paths; order ascending by st_ctime so
        # the last element is the most recent backup.
        backup_files.sort(key=os.path.getctime)
        latest = backup_files[-1]

        # Take the date from the same file that is reported below (not the
        # oldest one) and keep the time of day that the format string expects.
        backup_date = datetime.datetime.fromtimestamp(os.path.getmtime(latest))

        backup_details[filetype] = {
            "sitename": sitename,
            "file_size_in_bytes": os.stat(latest).st_size,
            "file_path": os.path.abspath(latest),
            "filename": os.path.basename(latest),
            "backup_date": backup_date.strftime("%Y-%m-%d %H:%M:%S"),
        }

    return backup_details
|
|
|
|
|
2020-04-29 01:45:59 +05:30
|
|
|
|
2020-03-25 22:25:24 +05:30
|
|
|
def delete_old_backups(limit, bucket, site_name):
    """Delete the oldest S3 backup of a site once more than ``limit`` exist.

    Object keys are expected to look like
    ``<BUCKET_DIR>/<site>/<date_time>/<backup file>``. Every distinct
    ``date_time`` directory belonging to ``site_name`` counts as one backup.
    When there are more than ``limit`` of them, every object below the oldest
    directory is deleted. At most one backup is removed per call.

    Connection settings are read from the ``REGION``, ``ACCESS_KEY_ID``,
    ``SECRET_ACCESS_KEY`` and ``ENDPOINT_URL`` environment variables, and the
    key prefix from ``BUCKET_DIR``.

    Args:
        limit: Maximum number of backups to keep; converted with ``int()``.
        bucket: Name of the S3 bucket.
        site_name: Site whose backups are pruned. It is compared with the
            second path component of each key.

    Raises:
        SystemExit: With status 1 when a key below ``BUCKET_DIR`` does not
            consist of four ``/``-separated parts or its ``date_time`` part
            does not match ``DATE_FORMAT``.
    """
    backup_limit = int(limit)
    # NOTE(review): presumably validates the S3-related environment variables
    # read below; defined in utils, confirm there.
    check_s3_environment_variables()
    bucket_dir = os.environ.get("BUCKET_DIR")
    root_prefix = bucket_dir + "/"

    s3 = boto3.resource(
        "s3",
        region_name=os.environ.get("REGION"),
        aws_access_key_id=os.environ.get("ACCESS_KEY_ID"),
        aws_secret_access_key=os.environ.get("SECRET_ACCESS_KEY"),
        endpoint_url=os.environ.get("ENDPOINT_URL"),
    )
    s3_bucket = s3.Bucket(bucket)
    listing = s3_bucket.meta.client.list_objects_v2(
        Bucket=s3_bucket.name, Delimiter="/"
    )

    # Maps the timestamp of each backup of this site to the key prefix
    # ("directory") that holds its files.
    backup_prefixes = {}

    # "CommonPrefixes" is missing from the response when the bucket has no
    # top-level prefixes, so fall back to an empty list.
    for common_prefix in listing.get("CommonPrefixes") or []:
        prefix = common_prefix.get("Prefix")
        if prefix != root_prefix:
            continue

        for backup_obj in s3_bucket.objects.filter(Prefix=prefix):
            # Skip placeholder objects that only represent a directory.
            if backup_obj.get()["ContentType"] == "application/x-directory":
                continue

            try:
                # backup_obj.key is bucket_dir/site/date_time/backupfile.extension
                _, site_slug, date_time, _ = backup_obj.key.split("/")
                backup_datetime = datetime.datetime.strptime(date_time, DATE_FORMAT)
            except ValueError as error:
                # Both a wrong number of key parts and an unparsable date
                # raise ValueError.
                print(error)
                raise SystemExit(1)

            # Exact match on the site component: a substring test would also
            # pick up sites whose name merely contains site_name.
            if site_slug == site_name:
                backup_prefixes[backup_datetime] = (
                    backup_obj.key.rsplit("/", 1)[0] + "/"
                )

    # Count backups by distinct date_time directory rather than assuming a
    # fixed number of files per backup.
    if len(backup_prefixes) <= backup_limit:
        return

    oldest_prefix = backup_prefixes[min(backup_prefixes)]
    # Filter on the directory prefix so every file of the oldest backup is
    # removed, not just a single key.
    for obj in s3_bucket.objects.filter(Prefix=oldest_prefix):
        if obj.key.startswith(root_prefix):
            print("Deleting " + obj.key)
            s3.Object(s3_bucket.name, obj.key).delete()
|
2020-03-25 06:35:49 +05:30
|
|
|
|
2020-04-29 01:45:59 +05:30
|
|
|
|
2020-03-25 06:35:49 +05:30
|
|
|
def main():
    """Upload the latest backup files of every site to S3, then prune old ones.

    For each site returned by ``get_sites()`` this uploads, in order, the
    database dump, the site config, the public files archive and the private
    files archive (each only if found), and then calls
    ``delete_old_backups`` with the ``BACKUP_LIMIT`` environment variable
    (default ``"3"``). Prints a completion message and exits with status 0.
    """
    sites = get_sites()
    conn, bucket = get_s3_config()

    for site in sites:
        details = get_backup_details(site)

        def latest_path(filetype):
            # Path of the newest backup of this type, or None when absent.
            return details.get(filetype, {}).get("file_path")

        db_file = latest_path("database")
        site_root = os.environ.get("BUCKET_DIR") + "/" + site + "/"

        # The site config is stored next to the database dump when there is
        # one, otherwise directly below the site's root folder.
        folder = site_root
        if db_file:
            # The first 15 characters of the file name select the sub-folder
            # (presumably the backup timestamp -- confirm against the naming
            # scheme of the backup files).
            folder = site_root + os.path.basename(db_file)[:15] + "/"
            upload_file_to_s3(db_file, folder, conn, bucket)

        # Archive site_config.json
        site_config_file = latest_path("site_config") or os.path.join(
            os.getcwd(), site, "site_config.json"
        )
        upload_file_to_s3(site_config_file, folder, conn, bucket)

        for filetype in ("public_files", "private_files"):
            archive = latest_path(filetype)
            if not archive:
                continue
            folder = (
                os.environ.get("BUCKET_DIR")
                + "/"
                + site
                + "/"
                + os.path.basename(archive)[:15]
                + "/"
            )
            upload_file_to_s3(archive, folder, conn, bucket)

        delete_old_backups(os.environ.get("BACKUP_LIMIT", "3"), bucket, site)

    print("push-backup complete")
    exit(0)
|
|
|
|
|
2020-04-29 01:45:59 +05:30
|
|
|
|
2020-03-25 06:35:49 +05:30
|
|
|
# Run the backup push only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()
|