# zsnapper/zsnaplib/__init__.py

import datetime
import logging
import re
import subprocess
import sys
# strftime/strptime layout of the timestamp part of a snapshot name
# (the text after the '@').
time_format='%Y-%m-%d_%H%M'
# Splits '<dataset>@<timestamp>' into the dataset name (group 1) and the
# timestamp (group 2); names whose suffix has another layout do not match.
re_snapshot = re.compile(r'^(.*)@([0-9]{4}-[0-9]{2}-[0-9]{2}_[0-9]{4})$')
# Error text that do_zfs_command tolerates when the exit status is 1.
re_err_ok = re.compile(r"cannot create snapshot '[^']+': dataset already exists")
# Name passed to logging.getLogger() by this module.
logger = 'zsnapper'
class ZFSSnapshotError(Exception):
    """Raised when a zfs command exits with an unexpected error status."""
def do_zfs_command(args, zfs_cmd, pipecmd=None):
    """Run a zfs command, optionally piping its stdout into a second command.

    Args:
        args: Sub-command and arguments appended to ``zfs_cmd``.
        zfs_cmd: Argument vector prefix that invokes zfs.
        pipecmd: Optional argument vector of a command that reads the zfs
            command's stdout on its stdin.

    Returns:
        The bytes written to stdout by the last command in the chain.

    Raises:
        ZFSSnapshotError: If any command in the chain exits with a non-zero
            status other than the tolerated "dataset already exists" error.
    """
    import tempfile

    cmd = list(zfs_cmd) + list(args)

    if not pipecmd:
        proc = subprocess.Popen(
            cmd,
            stdin=subprocess.PIPE,
            stdout=subprocess.PIPE,
            stderr=subprocess.PIPE)
        out, err = proc.communicate()
        results = [(cmd, proc.returncode, err)]
    else:
        # The producer's stderr goes to a temporary file instead of a pipe:
        # nothing reads it while we wait for the consumer, so a filled pipe
        # buffer would stall the whole chain.
        with tempfile.TemporaryFile() as producer_err:
            producer = subprocess.Popen(
                cmd,
                stdin=subprocess.PIPE,
                stdout=subprocess.PIPE,
                stderr=producer_err)
            producer.stdin.close()
            try:
                consumer = subprocess.Popen(
                    pipecmd,
                    stdin=producer.stdout,
                    stdout=subprocess.PIPE,
                    stderr=subprocess.PIPE)
            except Exception:
                # Do not leave the producer running without a reader.
                producer.stdout.close()
                producer.kill()
                producer.wait()
                raise
            # Drop our copy of the read end so the consumer is the only
            # reader of the producer's output.
            producer.stdout.close()
            out, err = consumer.communicate()
            # Reap the producer and collect its status; a failure here used
            # to go unnoticed.
            producer.wait()
            producer_err.seek(0)
            results = [
                (pipecmd, consumer.returncode, err),
                (cmd, producer.returncode, producer_err.read()),
            ]

    failures = []
    for argv, returncode, raw_err in results:
        if returncode == 0:
            continue
        message = raw_err.decode('utf-8', 'replace')
        # Creating a snapshot that already exists is not treated as an
        # error. This can happen if the script is run every minute and it
        # takes more time than that to create all snapshots.
        if returncode == 1 and re_err_ok.match(message):
            continue
        failures.append(
            'Failed to execute {}: {}'.format(argv, message.strip()))

    if failures:
        raise ZFSSnapshotError('; '.join(failures))
    return out
def send_snapshot(
        fs,
        snap,
        remote_zfs_cmd,
        remote_target,
        zfs_cmd,
        send_opts=None,
        recv_opts=None,
        repl_mode='all',
        repl_from=None):
    """Pipe ``zfs send`` of a snapshot into ``zfs receive``.

    Args:
        fs: Name of the source dataset.
        snap: datetime of the snapshot to send; formatted with
            ``time_format`` to build the snapshot name.
        remote_zfs_cmd: Argument vector prefix of the receiving zfs command.
        remote_target: Dataset name handed to ``receive``.
        zfs_cmd: Argument vector prefix of the sending zfs command.
        send_opts: Extra options placed right after ``send``
            (default: none).
        recv_opts: Extra options placed right after ``receive``
            (default: none).
        repl_mode: With ``repl_from`` set, ``'latest'`` selects the ``-i``
            flag; any other value selects ``-I``.
        repl_from: Optional datetime of the snapshot to send incrementally
            from. When falsy, the snapshot is sent without an incremental
            flag.
    """
    # Copy the option sequences so None defaults and non-list sequences work
    # and the callers' objects are never shared.
    send_opts = list(send_opts) if send_opts else []
    recv_opts = list(recv_opts) if recv_opts else []

    args = ['send'] + send_opts
    if repl_from:
        inc_flag = '-i' if repl_mode == 'latest' else '-I'
        args += [inc_flag, '{}@{}'.format(fs, repl_from.strftime(time_format))]
    args.append('{}@{}'.format(fs, snap.strftime(time_format)))

    pipecmd = list(remote_zfs_cmd) + ['receive'] + recv_opts + [remote_target]
    do_zfs_command(args, zfs_cmd, pipecmd=pipecmd)
def create_snapshot(fs, zfs_cmd):
    """Create a snapshot of ``fs`` named after the current time.

    The snapshot name is ``<fs>@<timestamp>``, with the timestamp taken from
    ``datetime.datetime.now()`` and rendered with ``time_format``.
    """
    timestamp = datetime.datetime.now().strftime(time_format)
    snapshot_name = '{}@{}'.format(fs, timestamp)
    do_zfs_command(['snapshot', snapshot_name], zfs_cmd)
def get_filesystems(zfs_cmd):
    """Return the set of names listed by ``list -H``.

    The name is the first tab-separated column of each output row.
    """
    listing = do_zfs_command(['list', '-H'], zfs_cmd)
    return {
        line.decode('UTF-8').split('\t')[0]
        for line in listing.splitlines()
    }
def get_snapshots(zfs_cmd):
    """Return the timestamped snapshots of every dataset.

    Returns:
        A dict mapping each dataset name to a list of datetimes, newest
        first. Snapshots whose name does not match ``re_snapshot`` are
        ignored.
    """
    listing = do_zfs_command(['list', '-H', '-t', 'snapshot'], zfs_cmd)

    by_dataset = {}
    for line in listing.splitlines():
        # The snapshot name is the first tab-separated column.
        name = line.decode('UTF-8').split('\t')[0]
        match = re_snapshot.match(name)
        if not match:
            continue
        dataset, stamp = match.groups()
        taken = datetime.datetime.strptime(stamp, time_format)
        by_dataset.setdefault(dataset, []).append(taken)

    for stamps in by_dataset.values():
        stamps.sort(reverse=True)
    return by_dataset
def remove_snapshot(fs, date, zfs_cmd):
    """Destroy the snapshot of ``fs`` whose timestamp is ``date``."""
    snapshot_name = '{}@{}'.format(fs, date.strftime(time_format))
    do_zfs_command(['destroy', snapshot_name], zfs_cmd)
def _fixed_period_starts(date):
    """Return the start of each fixed retention period containing ``date``."""
    def floored(step):
        # Round down to a multiple of ``step`` minutes within the hour.
        return date - datetime.timedelta(
            minutes=date.minute % step,
            seconds=date.second,
            microseconds=date.microsecond)

    midnight = datetime.datetime.combine(date.date(), datetime.time.min)
    return {
        'year': datetime.datetime(year=date.year, month=1, day=1),
        'month': datetime.datetime(year=date.year, month=date.month, day=1),
        # Weeks start on Monday (weekday() == 0).
        'week': midnight - datetime.timedelta(days=date.weekday()),
        'day': midnight,
        'hour': floored(60),
        'min30': floored(30),
        'min15': floored(15),
        'min5': floored(5),
        'min1': floored(1),
    }


def _custom_period_start(date, interval):
    """Return the start of the custom period containing ``date``.

    Periods of length ``interval`` are laid end to end starting at
    1 January of ``date``'s year.
    """
    start = datetime.datetime(year=date.year, month=1, day=1)
    while start + interval < date:
        start += interval
    return start


def weed_snapshots(
        fs,
        dates,
        zfs_cmd,
        remote=None,
        custom_keep_interval=None,
        keep_custom=0,
        keep_yearly=0,
        keep_monthly=0,
        keep_weekly=0,
        keep_daily=0,
        keep_hourly=0,
        keep_30min=0,
        keep_15min=0,
        keep_5min=0,
        keep_1min=0):
    """Destroy the snapshots of ``fs`` that no retention rule keeps.

    For every period type (year, month, ..., minute, custom) the earliest
    snapshot of each period is a candidate, and the candidates of the most
    recent ``keep_*`` periods are kept. A snapshot kept by no rule is
    destroyed; with every ``keep_*`` left at 0 that is all of them.

    Args:
        fs: Dataset name, optionally followed by ``@<suffix>``. Only the
            part before the first ``@`` is used to build the snapshot name
            to destroy; the full value appears in log messages.
        dates: datetimes of the existing snapshots of ``fs``.
        zfs_cmd: Argument vector prefix that invokes zfs.
        remote: Accepted for interface compatibility; not used here.
        custom_keep_interval: Length of the custom period (added to
            datetimes); the custom rule is inactive when falsy.
        keep_custom, keep_yearly, keep_monthly, keep_weekly, keep_daily,
        keep_hourly, keep_30min, keep_15min, keep_5min, keep_1min:
            Number of most recent periods of each type to keep a snapshot
            for; a falsy value disables that rule.

    A ZFSSnapshotError raised while destroying a snapshot is logged and the
    remaining snapshots are still processed.
    """
    source_fs = fs.split('@', 1)[0]

    limits = {
        'custom': keep_custom if custom_keep_interval else 0,
        'year': keep_yearly,
        'month': keep_monthly,
        'week': keep_weekly,
        'day': keep_daily,
        'hour': keep_hourly,
        'min30': keep_30min,
        'min15': keep_15min,
        'min5': keep_5min,
        'min1': keep_1min,
    }
    # Rules with a falsy limit keep nothing, so they need no bookkeeping.
    active = [name for name, limit in limits.items() if limit]
    seen = {name: set() for name in active}
    candidates = {name: [] for name in active}

    # Walk oldest to newest so the first snapshot seen in a period is the
    # earliest one.
    for date in sorted(dates):
        starts = _fixed_period_starts(date)
        if 'custom' in seen:
            starts['custom'] = _custom_period_start(date, custom_keep_interval)
        for name in active:
            start = starts[name]
            if start not in seen[name]:
                seen[name].add(start)
                candidates[name].append(date)

    all_keep = set()
    for name in active:
        all_keep.update(candidates[name][-limits[name]:])

    to_remove = [date for date in dates if date not in all_keep]
    if not to_remove:
        return

    log = logging.getLogger(logger)
    for date in to_remove:
        log.info('{}: removing snapshot from {}'.format(fs, date))
        try:
            remove_snapshot(source_fs, date, zfs_cmd)
        except ZFSSnapshotError as e:
            log.error(str(e))