-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathbackup.py
72 lines (62 loc) · 2.4 KB
/
backup.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
import argparse
import logging
import os
from datetime import datetime
import yaml
import pandas as pd
from sqlalchemy import text
from app import app, db
from lib.push import Push
logging.basicConfig(level='INFO')
LOGGER = logging.getLogger(__name__)
# Create argument parser
parser = argparse.ArgumentParser()
parser.add_argument('--config', '-c', default='config', type=str)
parser.add_argument('--folder', '-f', default='tmp', type=str)
# Parse args
args = parser.parse_args()
credentials = yaml.safe_load(open(f'{args.config}/credentials.yaml'))
notifier = Push(**credentials['push'])
config = yaml.safe_load(open(f'{args.config}/backup.yaml'))
table_names = config['tables']
n_days = config['ttl_days']
# Drop old backup folders when they are older than n_days days
for folder in os.listdir(args.folder):
folder_path = os.path.join(args.folder, folder)
if os.path.isdir(folder_path):
try:
folder_date = datetime.strptime(folder, '%Y-%m-%d')
except ValueError:
continue
if (datetime.today() - folder_date).days > n_days:
LOGGER.info(f'Deleting old backup folder: {folder_path}')
# delete directory even if not empty
for root, dirs, files in os.walk(folder_path, topdown=False):
for name in files:
os.remove(os.path.join(root, name))
for name in dirs:
os.rmdir(os.path.join(root, name))
os.rmdir(folder_path)
# Create a dated folder
folder_path = os.path.join(args.folder, datetime.today().strftime('%Y-%m-%d'))
if not os.path.exists(folder_path):
os.makedirs(folder_path)
# Backup each table
fail_list = []
for table_name in table_names:
try:
# Fetch table into a Pandas dataframe
table_ref = f'{credentials["db"]["schema"]}.{table_name}'
df = pd.read_sql_query(text(f'SELECT * FROM {table_ref}'), db.engine.connect())
# Backup table as CSV
backup_path = os.path.join(folder_path, f'{table_name}.csv')
df.to_csv(backup_path, header=True, index=False)
LOGGER.info(f'Successful backup of {table_ref} table to: {backup_path}')
except Exception as e:
fail_list.append(table_name)
LOGGER.error(str(e))
if fail_list:
notifier.send_message(
message=f'Could not backup table{"s" if len(fail_list) > 1 else ""}: {", ".join(fail_list)}',
title='⚠️ Journal Alert'
)