Compare commits

...

17 Commits

Author SHA1 Message Date
a4155f970e completed --no-thinning option. fixes #54 2021-03-01 00:04:10 +01:00
0c9d14bf32 splitting up more stuff 2021-02-27 21:36:03 +01:00
1f5955ccec splitting up more stuff 2021-02-27 14:35:47 +01:00
1b94a849db splitting up more stuff 2021-02-26 20:10:39 +01:00
98c40c6df5 splitting up more stuff 2021-02-26 20:10:20 +01:00
b479ab9c98 more clear name 2021-02-21 22:25:42 +01:00
a0fb205e75 cleaning up code 2021-02-21 22:08:35 +01:00
d3ce222921 some more refactoring. splitting of smaller cleaner functions. started work on --no-thinning 2021-02-19 00:27:37 +01:00
36e134eb75 Update README.md 2021-02-16 12:28:00 +01:00
628cd75941 fix 2021-02-07 21:17:40 +01:00
1da14c5c3b forgot to document child 2021-02-07 21:09:03 +01:00
c83d0fcff2 explain inheritance 2021-02-07 20:59:19 +01:00
573af341b8 fixes 2021-02-07 18:04:00 +01:00
a64168bee2 fixes 2021-02-07 18:00:58 +01:00
c678ae5f9a fixed --ignore-transfer-errors 2021-02-07 16:57:12 +01:00
e95967db53 update version 2021-02-07 16:23:09 +01:00
29e6c056d1 p2 fix pythonpackages 2021-02-07 16:03:26 +01:00
10 changed files with 354 additions and 213 deletions

View File

@ -28,12 +28,12 @@ jobs:
- name: Install dependencies 3.x - name: Install dependencies 3.x
run: | run: |
python -m pip install --upgrade pip python -m pip install --upgrade pip
pip install setuptools wheel twine pip3 install setuptools wheel twine
- name: Install dependencies 2.x - name: Install dependencies 2.x
run: | run: |
python2 -m pip install --upgrade pip python2 -m pip install --upgrade pip
pip2 install setuptools pip2 install setuptools wheel twine
- name: Build and publish - name: Build and publish
env: env:

1
.gitignore vendored
View File

@ -11,4 +11,3 @@ __pycache__
python2.env python2.env
venv venv
.idea .idea
OQ

View File

@ -148,6 +148,8 @@ rpool/swap autobackup:offsite1 true
... ...
``` ```
ZFS properties are ```inherited``` by child datasets. Since we've set the property on the highest dataset, we're essentially backupping the whole pool.
Because we don't want to backup everything, we can exclude certain filesystem by setting the property to false: Because we don't want to backup everything, we can exclude certain filesystem by setting the property to false:
```console ```console
@ -163,6 +165,13 @@ rpool/swap autobackup:offsite1 false
... ...
``` ```
The autobackup-property can have 3 values:
* ```true```: Backup the dataset and all its children
* ```false```: Dont backup the dataset and all its children. (used to exclude certain datasets)
* ```child```: Only backup the children off the dataset, not the dataset itself.
Only use the zfs-command to set these properties, not the zpool command.
### Running zfs-autobackup ### Running zfs-autobackup
Run the script on the backup server and pull the data from the server specified by --ssh-source. Run the script on the backup server and pull the data from the server specified by --ssh-source.
@ -654,10 +663,10 @@ for HOST in $HOSTS; do
done done
``` ```
This script will also send the backup status to Zabbix. (if you've installed my zabbix-job-status script) This script will also send the backup status to Zabbix. (if you've installed my zabbix-job-status script https://github.com/psy0rz/stuff/tree/master/zabbix-jobs)
# Sponsor list # Sponsor list
This project was sponsorred by: This project was sponsorred by:
* (None so far) * JetBrains (Provided me with a license for their whole professional product line, https://www.jetbrains.com/pycharm/ )

View File

@ -96,7 +96,7 @@ class TestZfsNode(unittest2.TestCase):
#now tries to destroy our own last snapshot (before the final destroy of the dataset) #now tries to destroy our own last snapshot (before the final destroy of the dataset)
self.assertIn("fs1@test-20101111000000: Destroying", buf.getvalue()) self.assertIn("fs1@test-20101111000000: Destroying", buf.getvalue())
#but cant finish because still in use: #but cant finish because still in use:
self.assertIn("fs1: Error during destoy missing", buf.getvalue()) self.assertIn("fs1: Error during --destroy-missing", buf.getvalue())
shelltest("zfs destroy test_target1/clone1") shelltest("zfs destroy test_target1/clone1")

View File

@ -1,7 +1,7 @@
from basetest import * from basetest import *
class TestZfsNode(unittest2.TestCase): class TestExternalFailures(unittest2.TestCase):
def setUp(self): def setUp(self):
prepare_zpools() prepare_zpools()
@ -259,8 +259,28 @@ test_target1/test_source2/fs2/sub@test-20101111000002
with patch('time.strftime', return_value="20101111000001"): with patch('time.strftime', return_value="20101111000001"):
self.assertTrue(ZfsAutobackup("test test_target1 --verbose --allow-empty".split(" ")).run()) self.assertTrue(ZfsAutobackup("test test_target1 --verbose --allow-empty".split(" ")).run())
############# TODO: #UPDATE: offcourse the one thing that wasn't tested had a bug :( (in ExecuteNode.run()).
def test_ignoretransfererrors(self): def test_ignoretransfererrors(self):
self.skipTest( self.skipTest("Not sure how to implement a test for this without some serious hacking and patching.")
"todo: create some kind of situation where zfs recv exits with an error but transfer is still ok (happens in practice with acltype)")
# #recreate target pool without any features
# # shelltest("zfs set compress=on test_source1; zpool destroy test_target1; zpool create test_target1 -o feature@project_quota=disabled /dev/ram2")
#
# with patch('time.strftime', return_value="20101111000000"):
# self.assertFalse(ZfsAutobackup("test test_target1 --verbose --allow-empty --no-progress".split(" ")).run())
#
# r = shelltest("zfs list -H -o name -r -t all test_target1")
#
# self.assertMultiLineEqual(r, """
# test_target1
# test_target1/test_source1
# test_target1/test_source1/fs1
# test_target1/test_source1/fs1@test-20101111000002
# test_target1/test_source1/fs1/sub
# test_target1/test_source1/fs1/sub@test-20101111000002
# test_target1/test_source2
# test_target1/test_source2/fs2
# test_target1/test_source2/fs2/sub
# test_target1/test_source2/fs2/sub@test-20101111000002
# """)

View File

@ -0,0 +1,49 @@
from basetest import *
import time
class TestZfsAutobackup31(unittest2.TestCase):
def setUp(self):
prepare_zpools()
self.longMessage=True
def test_no_thinning(self):
with patch('time.strftime', return_value="20101111000000"):
self.assertFalse(ZfsAutobackup("test test_target1 --verbose --allow-empty".split(" ")).run())
with patch('time.strftime', return_value="20101111000001"):
self.assertFalse(ZfsAutobackup("test test_target1 --verbose --allow-empty --keep-target=0 --keep-source=0 --no-thinning".split(" ")).run())
r=shelltest("zfs list -H -o name -r -t all "+TEST_POOLS)
self.assertMultiLineEqual(r,"""
test_source1
test_source1/fs1
test_source1/fs1@test-20101111000000
test_source1/fs1@test-20101111000001
test_source1/fs1/sub
test_source1/fs1/sub@test-20101111000000
test_source1/fs1/sub@test-20101111000001
test_source2
test_source2/fs2
test_source2/fs2/sub
test_source2/fs2/sub@test-20101111000000
test_source2/fs2/sub@test-20101111000001
test_source2/fs3
test_source2/fs3/sub
test_target1
test_target1/test_source1
test_target1/test_source1/fs1
test_target1/test_source1/fs1@test-20101111000000
test_target1/test_source1/fs1@test-20101111000001
test_target1/test_source1/fs1/sub
test_target1/test_source1/fs1/sub@test-20101111000000
test_target1/test_source1/fs1/sub@test-20101111000001
test_target1/test_source2
test_target1/test_source2/fs2
test_target1/test_source2/fs2/sub
test_target1/test_source2/fs2/sub@test-20101111000000
test_target1/test_source2/fs2/sub@test-20101111000001
""")

View File

@ -115,7 +115,7 @@ test_target1
def test_supportedrecvoptions(self): def test_supportedrecvoptions(self):
logger=LogStub() logger=LogStub()
description="[Source]" description="[Source]"
#NOTE: this couldnt hang via ssh if we dont close filehandles properly. (which was a previous bug) #NOTE: this could hang via ssh if we dont close filehandles properly. (which was a previous bug)
node=ZfsNode("test", logger, description=description, ssh_to='localhost') node=ZfsNode("test", logger, description=description, ssh_to='localhost')
self.assertIsInstance(node.supported_recv_options, list) self.assertIsInstance(node.supported_recv_options, list)

View File

@ -4,6 +4,7 @@ import subprocess
from zfs_autobackup.LogStub import LogStub from zfs_autobackup.LogStub import LogStub
class ExecuteNode(LogStub): class ExecuteNode(LogStub):
"""an endpoint to execute local or remote commands via ssh""" """an endpoint to execute local or remote commands via ssh"""
@ -46,17 +47,23 @@ class ExecuteNode(LogStub):
def run(self, cmd, inp=None, tab_split=False, valid_exitcodes=None, readonly=False, hide_errors=False, pipe=False, def run(self, cmd, inp=None, tab_split=False, valid_exitcodes=None, readonly=False, hide_errors=False, pipe=False,
return_stderr=False): return_stderr=False):
"""run a command on the node cmd: the actual command, should be a list, where the first item is the command """run a command on the node.
and the rest are parameters. input: Can be None, a string or a pipe-handle you got from another run()
tab_split: split tabbed files in output into a list valid_exitcodes: list of valid exit codes for this :param cmd: the actual command, should be a list, where the first item is the command
command (checks exit code of both sides of a pipe) readonly: make this True if the command doesn't make any and the rest are parameters.
changes and is safe to execute in testmode hide_errors: don't show stderr output as error, instead show it as :param inp: Can be None, a string or a pipe-handle you got from another run()
debugging output (use to hide expected errors) pipe: Instead of executing, return a pipe-handle to be used to :param tab_split: split tabbed files in output into a list
input to another run() command. (just like a | in linux) return_stderr: return both stdout and stderr as a :param valid_exitcodes: list of valid exit codes for this command (checks exit code of both sides of a pipe)
tuple. (only returns stderr from this side of the pipe) Use [] to accept all exit codes.
:param readonly: make this True if the command doesn't make any changes and is safe to execute in testmode
:param hide_errors: don't show stderr output as error, instead show it as debugging output (use to hide expected errors)
:param pipe: Instead of executing, return a pipe-handle to be used to
input to another run() command. (just like a | in linux)
:param return_stderr: return both stdout and stderr as a tuple. (normally only returns stdout)
""" """
if not valid_exitcodes: if valid_exitcodes is None:
valid_exitcodes = [0] valid_exitcodes = [0]
encoded_cmd = [] encoded_cmd = []
@ -196,4 +203,4 @@ class ExecuteNode(LogStub):
if return_stderr: if return_stderr:
return output_lines, error_lines return output_lines, error_lines
else: else:
return output_lines return output_lines

View File

@ -12,7 +12,7 @@ from zfs_autobackup.ThinnerRule import ThinnerRule
class ZfsAutobackup: class ZfsAutobackup:
"""main class""" """main class"""
VERSION = "3.0.1-beta4" VERSION = "3.1-beta1"
HEADER = "zfs-autobackup v{} - Copyright 2020 E.H.Eefting (edwin@datux.nl)".format(VERSION) HEADER = "zfs-autobackup v{} - Copyright 2020 E.H.Eefting (edwin@datux.nl)".format(VERSION)
def __init__(self, argv, print_arguments=True): def __init__(self, argv, print_arguments=True):
@ -23,8 +23,7 @@ class ZfsAutobackup:
parser = argparse.ArgumentParser( parser = argparse.ArgumentParser(
description=self.HEADER, description=self.HEADER,
epilog='When a filesystem fails, zfs_backup will continue and report the number of failures at that end. ' epilog='Full manual at: https://github.com/psy0rz/zfs_autobackup')
'Also the exit code will indicate the number of failures. Full manual at: https://github.com/psy0rz/zfs_autobackup')
parser.add_argument('--ssh-config', default=None, help='Custom ssh client config') parser.add_argument('--ssh-config', default=None, help='Custom ssh client config')
parser.add_argument('--ssh-source', default=None, parser.add_argument('--ssh-source', default=None,
help='Source host to get backup from. (user@hostname) Default %(default)s.') help='Source host to get backup from. (user@hostname) Default %(default)s.')
@ -48,7 +47,9 @@ class ZfsAutobackup:
help='Don\'t create new snapshots (useful for finishing uncompleted backups, or cleanups)') help='Don\'t create new snapshots (useful for finishing uncompleted backups, or cleanups)')
parser.add_argument('--no-send', action='store_true', parser.add_argument('--no-send', action='store_true',
help='Don\'t send snapshots (useful for cleanups, or if you want a serperate send-cronjob)') help='Don\'t send snapshots (useful for cleanups, or if you want a serperate send-cronjob)')
# parser.add_argument('--no-thinning', action='store_true', help='Don\'t run the thinner.') parser.add_argument('--no-thinning', action='store_true', help="Do not destroy any snapshots.")
parser.add_argument('--no-holds', action='store_true',
help='Don\'t hold snapshots. (Faster. Allows you to destroy common snapshot.)')
parser.add_argument('--min-change', type=int, default=1, parser.add_argument('--min-change', type=int, default=1,
help='Number of bytes written after which we consider a dataset changed (default %(' help='Number of bytes written after which we consider a dataset changed (default %('
'default)s)') 'default)s)')
@ -57,8 +58,6 @@ class ZfsAutobackup:
parser.add_argument('--ignore-replicated', action='store_true', parser.add_argument('--ignore-replicated', action='store_true',
help='Ignore datasets that seem to be replicated some other way. (No changes since ' help='Ignore datasets that seem to be replicated some other way. (No changes since '
'lastest snapshot. Useful for proxmox HA replication)') 'lastest snapshot. Useful for proxmox HA replication)')
parser.add_argument('--no-holds', action='store_true',
help='Don\'t hold snapshots. (Faster)')
parser.add_argument('--resume', action='store_true', help=argparse.SUPPRESS) parser.add_argument('--resume', action='store_true', help=argparse.SUPPRESS)
parser.add_argument('--strip-path', default=0, type=int, parser.add_argument('--strip-path', default=0, type=int,
@ -103,14 +102,15 @@ class ZfsAutobackup:
help='Show zfs commands and their output/exit codes. (noisy)') help='Show zfs commands and their output/exit codes. (noisy)')
parser.add_argument('--progress', action='store_true', parser.add_argument('--progress', action='store_true',
help='show zfs progress output. Enabled automaticly on ttys. (use --no-progress to disable)') help='show zfs progress output. Enabled automaticly on ttys. (use --no-progress to disable)')
parser.add_argument('--no-progress', action='store_true', help=argparse.SUPPRESS) #needed to workaround a zfs recv -v bug parser.add_argument('--no-progress', action='store_true', help=argparse.SUPPRESS) # needed to workaround a zfs recv -v bug
# note args is the only global variable we use, since its a global readonly setting anyway # note args is the only global variable we use, since its a global readonly setting anyway
args = parser.parse_args(argv) args = parser.parse_args(argv)
self.args = args self.args = args
#auto enable progress? # auto enable progress?
if sys.stderr.isatty() and not args.no_progress: if sys.stderr.isatty() and not args.no_progress:
args.progress = True args.progress = True
@ -148,48 +148,77 @@ class ZfsAutobackup:
self.log.verbose("") self.log.verbose("")
self.log.verbose("#### " + title) self.log.verbose("#### " + title)
# sync datasets, or thin-only on both sides # NOTE: this method also uses self.args. args that need extra processing are passed as function parameters:
# target is needed for this. def thin_missing_targets(self, target_dataset, used_target_datasets):
def sync_datasets(self, source_node, source_datasets): """thin target datasets that are missing on the source."""
description = "[Target]" self.debug("Thinning obsolete datasets")
self.set_title("Target settings") for dataset in target_dataset.recursive_datasets:
try:
if dataset not in used_target_datasets:
dataset.debug("Missing on source, thinning")
dataset.thin()
target_thinner = Thinner(self.args.keep_target) except Exception as e:
target_node = ZfsNode(self.args.backup_name, self, ssh_config=self.args.ssh_config, ssh_to=self.args.ssh_target, dataset.error("Error during thinning of missing datasets ({})".format(str(e)))
readonly=self.args.test, debug_output=self.args.debug_output, description=description,
thinner=target_thinner)
target_node.verbose("Receive datasets under: {}".format(self.args.target_path))
if self.args.no_send: # NOTE: this method also uses self.args. args that need extra processing are passed as function parameters:
self.set_title("Thinning source and target") def destroy_missing_targets(self, target_dataset, used_target_datasets):
else: """destroy target datasets that are missing on the source and that meet the requirements"""
self.set_title("Sending and thinning")
# check if exists, to prevent vague errors self.debug("Destroying obsolete datasets")
target_dataset = ZfsDataset(target_node, self.args.target_path)
if not target_dataset.exists:
self.error("Target path '{}' does not exist. Please create this dataset first.".format(target_dataset))
return 255
if self.args.filter_properties: for dataset in target_dataset.recursive_datasets:
filter_properties = self.args.filter_properties.split(",") try:
else: if dataset not in used_target_datasets:
filter_properties = []
if self.args.set_properties: # cant do anything without our own snapshots
set_properties = self.args.set_properties.split(",") if not dataset.our_snapshots:
else: if dataset.datasets:
set_properties = [] # its not a leaf, just ignore
dataset.debug("Destroy missing: ignoring")
else:
dataset.verbose(
"Destroy missing: has no snapshots made by us. (please destroy manually)")
else:
# past the deadline?
deadline_ttl = ThinnerRule("0s" + self.args.destroy_missing).ttl
now = int(time.time())
if dataset.our_snapshots[-1].timestamp + deadline_ttl > now:
dataset.verbose("Destroy missing: Waiting for deadline.")
else:
if self.args.clear_refreservation: dataset.debug("Destroy missing: Removing our snapshots.")
filter_properties.append("refreservation")
if self.args.clear_mountpoint: # remove all our snaphots, except last, to safe space in case we fail later on
set_properties.append("canmount=noauto") for snapshot in dataset.our_snapshots[:-1]:
snapshot.destroy(fail_exception=True)
# does it have other snapshots?
has_others = False
for snapshot in dataset.snapshots:
if not snapshot.is_ours():
has_others = True
break
if has_others:
dataset.verbose("Destroy missing: Still in use by other snapshots")
else:
if dataset.datasets:
dataset.verbose("Destroy missing: Still has children here.")
else:
dataset.verbose("Destroy missing.")
dataset.our_snapshots[-1].destroy(fail_exception=True)
dataset.destroy(fail_exception=True)
except Exception as e:
dataset.error("Error during --destroy-missing: {}".format(str(e)))
# NOTE: this method also uses self.args. args that need extra processing are passed as function parameters:
def sync_datasets(self, source_node, source_datasets, target_node):
"""Sync datasets, or thin-only on both sides"""
# sync datasets
fail_count = 0 fail_count = 0
target_datasets = [] target_datasets = []
for source_dataset in source_datasets: for source_dataset in source_datasets:
@ -207,86 +236,36 @@ class ZfsAutobackup:
and not target_dataset.parent.exists: and not target_dataset.parent.exists:
target_dataset.parent.create_filesystem(parents=True) target_dataset.parent.create_filesystem(parents=True)
# determine common zpool features # determine common zpool features (cached, so no problem we call it often)
source_features = source_node.get_zfs_pool(source_dataset.split_path()[0]).features source_features = source_node.get_zfs_pool(source_dataset.split_path()[0]).features
target_features = target_node.get_zfs_pool(target_dataset.split_path()[0]).features target_features = target_node.get_zfs_pool(target_dataset.split_path()[0]).features
common_features = source_features and target_features common_features = source_features and target_features
# source_dataset.debug("Common features: {}".format(common_features))
# sync the snapshots of this dataset
source_dataset.sync_snapshots(target_dataset, show_progress=self.args.progress, source_dataset.sync_snapshots(target_dataset, show_progress=self.args.progress,
features=common_features, filter_properties=filter_properties, features=common_features, filter_properties=self.filter_properties_list(),
set_properties=set_properties, set_properties=self.set_properties_list(),
ignore_recv_exit_code=self.args.ignore_transfer_errors, ignore_recv_exit_code=self.args.ignore_transfer_errors,
holds=not self.args.no_holds, rollback=self.args.rollback, holds=not self.args.no_holds, rollback=self.args.rollback,
raw=self.args.raw, other_snapshots=self.args.other_snapshots, raw=self.args.raw, also_other_snapshots=self.args.other_snapshots,
no_send=self.args.no_send, no_send=self.args.no_send,
destroy_incompatible=self.args.destroy_incompatible) destroy_incompatible=self.args.destroy_incompatible,
no_thinning=self.args.no_thinning)
except Exception as e: except Exception as e:
fail_count = fail_count + 1 fail_count = fail_count + 1
source_dataset.error("FAILED: " + str(e)) source_dataset.error("FAILED: " + str(e))
if self.args.debug: if self.args.debug:
raise raise
# if not self.args.no_thinning: target_path_dataset=ZfsDataset(target_node, self.args.target_path)
self.thin_missing_targets(ZfsDataset(target_node, self.args.target_path), target_datasets) if not self.args.no_thinning:
self.thin_missing_targets(target_dataset=target_path_dataset, used_target_datasets=target_datasets)
if self.args.destroy_missing is not None:
self.destroy_missing_targets(target_dataset=target_path_dataset, used_target_datasets=target_datasets)
return fail_count return fail_count
def thin_missing_targets(self, target_dataset, used_target_datasets):
"""thin/destroy target datasets that are missing on the source."""
self.debug("Thinning obsolete datasets")
for dataset in target_dataset.recursive_datasets:
try:
if dataset not in used_target_datasets:
dataset.debug("Missing on source, thinning")
dataset.thin()
# destroy_missing enabled?
if self.args.destroy_missing is not None:
# cant do anything without our own snapshots
if not dataset.our_snapshots:
if dataset.datasets:
dataset.debug("Destroy missing: ignoring")
else:
dataset.verbose(
"Destroy missing: has no snapshots made by us. (please destroy manually)")
else:
# past the deadline?
deadline_ttl = ThinnerRule("0s" + self.args.destroy_missing).ttl
now = int(time.time())
if dataset.our_snapshots[-1].timestamp + deadline_ttl > now:
dataset.verbose("Destroy missing: Waiting for deadline.")
else:
dataset.debug("Destroy missing: Removing our snapshots.")
# remove all our snaphots, except last, to safe space in case we fail later on
for snapshot in dataset.our_snapshots[:-1]:
snapshot.destroy(fail_exception=True)
# does it have other snapshots?
has_others = False
for snapshot in dataset.snapshots:
if not snapshot.is_ours():
has_others = True
break
if has_others:
dataset.verbose("Destroy missing: Still in use by other snapshots")
else:
if dataset.datasets:
dataset.verbose("Destroy missing: Still has children here.")
else:
dataset.verbose("Destroy missing.")
dataset.our_snapshots[-1].destroy(fail_exception=True)
dataset.destroy(fail_exception=True)
except Exception as e:
dataset.error("Error during destoy missing ({})".format(str(e)))
def thin_source(self, source_datasets): def thin_source(self, source_datasets):
self.set_title("Thinning source") self.set_title("Thinning source")
@ -294,6 +273,44 @@ class ZfsAutobackup:
for source_dataset in source_datasets: for source_dataset in source_datasets:
source_dataset.thin(skip_holds=True) source_dataset.thin(skip_holds=True)
def filter_replicated(self, datasets):
if not self.args.ignore_replicated:
return datasets
else:
self.set_title("Filtering already replicated filesystems")
ret = []
for dataset in datasets:
if dataset.is_changed(self.args.min_change):
ret.append(dataset)
else:
dataset.verbose("Ignoring, already replicated")
return(ret)
def filter_properties_list(self):
if self.args.filter_properties:
filter_properties = self.args.filter_properties.split(",")
else:
filter_properties = []
if self.args.clear_refreservation:
filter_properties.append("refreservation")
return filter_properties
def set_properties_list(self):
if self.args.set_properties:
set_properties = self.args.set_properties.split(",")
else:
set_properties = []
if self.args.clear_mountpoint:
set_properties.append("canmount=noauto")
return set_properties
def run(self): def run(self):
try: try:
@ -323,18 +340,8 @@ class ZfsAutobackup:
self.args.backup_name)) self.args.backup_name))
return 255 return 255
source_datasets = []
# filter out already replicated stuff? # filter out already replicated stuff?
if not self.args.ignore_replicated: source_datasets = self.filter_replicated(selected_source_datasets)
source_datasets = selected_source_datasets
else:
self.set_title("Filtering already replicated filesystems")
for selected_source_dataset in selected_source_datasets:
if selected_source_dataset.is_changed(self.args.min_change):
source_datasets.append(selected_source_dataset)
else:
selected_source_dataset.verbose("Ignoring, already replicated")
if not self.args.no_snapshot: if not self.args.no_snapshot:
self.set_title("Snapshotting") self.set_title("Snapshotting")
@ -343,9 +350,37 @@ class ZfsAutobackup:
# if target is specified, we sync the datasets, otherwise we just thin the source. (e.g. snapshot mode) # if target is specified, we sync the datasets, otherwise we just thin the source. (e.g. snapshot mode)
if self.args.target_path: if self.args.target_path:
fail_count = self.sync_datasets(source_node, source_datasets)
# create target_node
self.set_title("Target settings")
target_thinner = Thinner(self.args.keep_target)
target_node = ZfsNode(self.args.backup_name, self, ssh_config=self.args.ssh_config,
ssh_to=self.args.ssh_target,
readonly=self.args.test, debug_output=self.args.debug_output,
description="[Target]",
thinner=target_thinner)
target_node.verbose("Receive datasets under: {}".format(self.args.target_path))
if self.args.no_send:
self.set_title("Thinning source and target")
else:
self.set_title("Sending and thinning")
# check if exists, to prevent vague errors
target_dataset = ZfsDataset(target_node, self.args.target_path)
if not target_dataset.exists:
raise(Exception(
"Target path '{}' does not exist. Please create this dataset first.".format(target_dataset)))
# do the actual sync
fail_count = self.sync_datasets(
source_node=source_node,
source_datasets=source_datasets,
target_node=target_node)
else: else:
self.thin_source(source_datasets) if not self.args.no_thinning:
self.thin_source(source_datasets)
fail_count = 0 fail_count = 0
if not fail_count: if not fail_count:

View File

@ -102,10 +102,10 @@ class ZfsDataset:
else: else:
return ZfsDataset(self.zfs_node, self.rstrip_path(1)) return ZfsDataset(self.zfs_node, self.rstrip_path(1))
def find_prev_snapshot(self, snapshot, other_snapshots=False): def find_prev_snapshot(self, snapshot, also_other_snapshots=False):
"""find previous snapshot in this dataset. None if it doesn't exist. """find previous snapshot in this dataset. None if it doesn't exist.
other_snapshots: set to true to also return snapshots that where not created by us. (is_ours) also_other_snapshots: set to true to also return snapshots that where not created by us. (is_ours)
""" """
if self.is_snapshot: if self.is_snapshot:
@ -114,11 +114,11 @@ class ZfsDataset:
index = self.find_snapshot_index(snapshot) index = self.find_snapshot_index(snapshot)
while index: while index:
index = index - 1 index = index - 1
if other_snapshots or self.snapshots[index].is_ours(): if also_other_snapshots or self.snapshots[index].is_ours():
return self.snapshots[index] return self.snapshots[index]
return None return None
def find_next_snapshot(self, snapshot, other_snapshots=False): def find_next_snapshot(self, snapshot, also_other_snapshots=False):
"""find next snapshot in this dataset. None if it doesn't exist""" """find next snapshot in this dataset. None if it doesn't exist"""
if self.is_snapshot: if self.is_snapshot:
@ -127,7 +127,7 @@ class ZfsDataset:
index = self.find_snapshot_index(snapshot) index = self.find_snapshot_index(snapshot)
while index is not None and index < len(self.snapshots) - 1: while index is not None and index < len(self.snapshots) - 1:
index = index + 1 index = index + 1
if other_snapshots or self.snapshots[index].is_ours(): if also_other_snapshots or self.snapshots[index].is_ours():
return self.snapshots[index] return self.snapshots[index]
return None return None
@ -277,7 +277,6 @@ class ZfsDataset:
def snapshots(self): def snapshots(self):
"""get all snapshots of this dataset""" """get all snapshots of this dataset"""
if not self.exists: if not self.exists:
return [] return []
@ -414,7 +413,7 @@ class ZfsDataset:
# progress output # progress output
if show_progress: if show_progress:
cmd.append("-v") # cmd.append("-v")
cmd.append("-P") cmd.append("-P")
# resume a previous send? (don't need more parameters in that case) # resume a previous send? (don't need more parameters in that case)
@ -431,9 +430,6 @@ class ZfsDataset:
cmd.append(self.name) cmd.append(self.name)
# if args.buffer and args.ssh_source!="local":
# cmd.append("|mbuffer -m {}".format(args.buffer))
# NOTE: this doesn't start the send yet, it only returns a subprocess.Pipe # NOTE: this doesn't start the send yet, it only returns a subprocess.Pipe
return self.zfs_node.run(cmd, pipe=True) return self.zfs_node.run(cmd, pipe=True)
@ -489,15 +485,12 @@ class ZfsDataset:
if self.zfs_node.readonly: if self.zfs_node.readonly:
self.force_exists = True self.force_exists = True
# check if transfer was really ok (exit codes have been wrong before due to bugs in zfs-utils and can be # check if transfer was really ok (exit codes have been wrong before due to bugs in zfs-utils and some
# ignored by some parameters) # errors should be ignored, thats where the ignore_exitcodes is for.)
if not self.exists: if not self.exists:
self.error("error during transfer") self.error("error during transfer")
raise (Exception("Target doesn't exist after transfer, something went wrong.")) raise (Exception("Target doesn't exist after transfer, something went wrong."))
# if args.buffer and args.ssh_target!="local":
# cmd.append("|mbuffer -m {}".format(args.buffer))
def transfer_snapshot(self, target_snapshot, features, prev_snapshot=None, show_progress=False, def transfer_snapshot(self, target_snapshot, features, prev_snapshot=None, show_progress=False,
filter_properties=None, set_properties=None, ignore_recv_exit_code=False, resume_token=None, filter_properties=None, set_properties=None, ignore_recv_exit_code=False, resume_token=None,
raw=False): raw=False):
@ -609,21 +602,24 @@ class ZfsDataset:
target_dataset.error("Cant find common snapshot with source.") target_dataset.error("Cant find common snapshot with source.")
raise (Exception("You probably need to delete the target dataset to fix this.")) raise (Exception("You probably need to delete the target dataset to fix this."))
def find_start_snapshot(self, common_snapshot, other_snapshots): def find_start_snapshot(self, common_snapshot, also_other_snapshots):
"""finds first snapshot to send""" """finds first snapshot to send
:rtype: ZfsDataset or None if we cant find it.
"""
if not common_snapshot: if not common_snapshot:
if not self.snapshots: if not self.snapshots:
start_snapshot = None start_snapshot = None
else: else:
# start from beginning # no common snapshot, start from beginning
start_snapshot = self.snapshots[0] start_snapshot = self.snapshots[0]
if not start_snapshot.is_ours() and not other_snapshots: if not start_snapshot.is_ours() and not also_other_snapshots:
# try to start at a snapshot thats ours # try to start at a snapshot thats ours
start_snapshot = self.find_next_snapshot(start_snapshot, other_snapshots) start_snapshot = self.find_next_snapshot(start_snapshot, also_other_snapshots)
else: else:
start_snapshot = self.find_next_snapshot(common_snapshot, other_snapshots) # normal situation: start_snapshot is the one after the common snapshot
start_snapshot = self.find_next_snapshot(common_snapshot, also_other_snapshots)
return start_snapshot return start_snapshot
@ -659,50 +655,25 @@ class ZfsDataset:
return allowed_filter_properties, allowed_set_properties return allowed_filter_properties, allowed_set_properties
def sync_snapshots(self, target_dataset, features, show_progress=False, filter_properties=None, set_properties=None, def _add_virtual_snapshots(self, source_dataset, source_start_snapshot, also_other_snapshots):
ignore_recv_exit_code=False, holds=True, rollback=False, raw=False, other_snapshots=False, """add snapshots from source to our snapshot list. (just the in memory list, no disk operations)"""
no_send=False, destroy_incompatible=False):
"""sync this dataset's snapshots to target_dataset, while also thinning out old snapshots along the way."""
if set_properties is None: self.debug("Creating virtual target snapshots")
set_properties = [] snapshot = source_start_snapshot
if filter_properties is None: while snapshot:
filter_properties = [] # create virtual target snapsho
# NOTE: with force_exist we're telling the dataset it doesnt exist yet. (e.g. its virtual)
# determine common and start snapshot virtual_snapshot = ZfsDataset(self.zfs_node,
target_dataset.debug("Determining start snapshot") self.filesystem_name + "@" + snapshot.snapshot_name,
common_snapshot = self.find_common_snapshot(target_dataset)
start_snapshot = self.find_start_snapshot(common_snapshot, other_snapshots)
# should be destroyed before attempting zfs recv:
incompatible_target_snapshots = target_dataset.find_incompatible_snapshots(common_snapshot)
# make target snapshot list the same as source, by adding virtual non-existing ones to the list.
target_dataset.debug("Creating virtual target snapshots")
source_snapshot = start_snapshot
while source_snapshot:
# create virtual target snapshot
virtual_snapshot = ZfsDataset(target_dataset.zfs_node,
target_dataset.filesystem_name + "@" + source_snapshot.snapshot_name,
force_exists=False) force_exists=False)
target_dataset.snapshots.append(virtual_snapshot) self.snapshots.append(virtual_snapshot)
source_snapshot = self.find_next_snapshot(source_snapshot, other_snapshots) snapshot = source_dataset.find_next_snapshot(snapshot, also_other_snapshots)
# now let thinner decide what we want on both sides as final state (after all transfers are done) def _pre_clean(self, common_snapshot, target_dataset, source_obsoletes, target_obsoletes, target_keeps):
if self.our_snapshots: """cleanup old stuff before starting snapshot syncing"""
self.debug("Create thinning list")
(source_keeps, source_obsoletes) = self.thin_list(keeps=[self.our_snapshots[-1]])
else:
source_obsoletes = []
if target_dataset.our_snapshots: # on source: destroy all obsoletes before common.
(target_keeps, target_obsoletes) = target_dataset.thin_list(keeps=[target_dataset.our_snapshots[-1]], # But after common, only delete snapshots that target also doesn't want
ignores=incompatible_target_snapshots)
else:
target_keeps = []
target_obsoletes = []
# on source: destroy all obsoletes before common. but after common, only delete snapshots that target also
# doesn't want to explicitly keep
before_common = True before_common = True
for source_snapshot in self.snapshots: for source_snapshot in self.snapshots:
if common_snapshot and source_snapshot.snapshot_name == common_snapshot.snapshot_name: if common_snapshot and source_snapshot.snapshot_name == common_snapshot.snapshot_name:
@ -720,12 +691,9 @@ class ZfsDataset:
if target_snapshot.exists: if target_snapshot.exists:
target_snapshot.destroy() target_snapshot.destroy()
# now actually transfer the snapshots, if we want def _validate_resume_token(self, target_dataset, start_snapshot):
if no_send: """validate and get (or destory) resume token"""
return
# resume?
resume_token = None
if 'receive_resume_token' in target_dataset.properties: if 'receive_resume_token' in target_dataset.properties:
resume_token = target_dataset.properties['receive_resume_token'] resume_token = target_dataset.properties['receive_resume_token']
# not valid anymore? # not valid anymore?
@ -733,9 +701,36 @@ class ZfsDataset:
if not resume_snapshot or start_snapshot.snapshot_name != resume_snapshot.snapshot_name: if not resume_snapshot or start_snapshot.snapshot_name != resume_snapshot.snapshot_name:
target_dataset.verbose("Cant resume, resume token no longer valid.") target_dataset.verbose("Cant resume, resume token no longer valid.")
target_dataset.abort_resume() target_dataset.abort_resume()
resume_token = None else:
return resume_token
def _plan_sync(self, target_dataset, also_other_snapshots):
"""plan where to start syncing and what to sync and what to keep"""
# determine common and start snapshot
target_dataset.debug("Determining start snapshot")
common_snapshot = self.find_common_snapshot(target_dataset)
start_snapshot = self.find_start_snapshot(common_snapshot, also_other_snapshots)
incompatible_target_snapshots = target_dataset.find_incompatible_snapshots(common_snapshot)
# let thinner decide whats obsolete on source
source_obsoletes = []
if self.our_snapshots:
source_obsoletes = self.thin_list(keeps=[self.our_snapshots[-1]])[1]
# let thinner decide keeps/obsoletes on target, AFTER the transfer would be done (by using virtual snapshots)
target_dataset._add_virtual_snapshots(self, start_snapshot, also_other_snapshots)
target_keeps = []
target_obsoletes = []
if target_dataset.our_snapshots:
(target_keeps, target_obsoletes) = target_dataset.thin_list(keeps=[target_dataset.our_snapshots[-1]],
ignores=incompatible_target_snapshots)
return common_snapshot, start_snapshot, source_obsoletes, target_obsoletes, target_keeps, incompatible_target_snapshots
def handle_incompatible_snapshots(self, incompatible_target_snapshots, destroy_incompatible):
"""destroy incompatbile snapshots on target before sync, or inform user what to do"""
# incompatible target snapshots?
if incompatible_target_snapshots: if incompatible_target_snapshots:
if not destroy_incompatible: if not destroy_incompatible:
for snapshot in incompatible_target_snapshots: for snapshot in incompatible_target_snapshots:
@ -745,7 +740,33 @@ class ZfsDataset:
for snapshot in incompatible_target_snapshots: for snapshot in incompatible_target_snapshots:
snapshot.verbose("Incompatible snapshot") snapshot.verbose("Incompatible snapshot")
snapshot.destroy() snapshot.destroy()
target_dataset.snapshots.remove(snapshot) self.snapshots.remove(snapshot)
def sync_snapshots(self, target_dataset, features, show_progress, filter_properties, set_properties,
ignore_recv_exit_code, holds, rollback, raw, also_other_snapshots,
no_send, destroy_incompatible, no_thinning):
"""sync this dataset's snapshots to target_dataset, while also thinning out old snapshots along the way."""
(common_snapshot, start_snapshot, source_obsoletes, target_obsoletes, target_keeps,
incompatible_target_snapshots) = \
self._plan_sync(target_dataset=target_dataset, also_other_snapshots=also_other_snapshots)
# NOTE: we do this because we dont want filesystems to fillup when backups keep failing.
# Also usefull with no_send to still cleanup stuff.
if not no_thinning:
self._pre_clean(
common_snapshot=common_snapshot, target_dataset=target_dataset,
target_keeps=target_keeps, target_obsoletes=target_obsoletes, source_obsoletes=source_obsoletes)
# now actually transfer the snapshots, if we want
if no_send:
return
# check if we can resume
resume_token = self._validate_resume_token(target_dataset, start_snapshot)
# handle incompatible stuff on target
target_dataset.handle_incompatible_snapshots(incompatible_target_snapshots, destroy_incompatible)
# rollback target to latest? # rollback target to latest?
if rollback: if rollback:
@ -780,15 +801,16 @@ class ZfsDataset:
prev_source_snapshot.release() prev_source_snapshot.release()
target_dataset.find_snapshot(prev_source_snapshot).release() target_dataset.find_snapshot(prev_source_snapshot).release()
# we may now destroy the previous source snapshot if its obsolete if not no_thinning:
if prev_source_snapshot in source_obsoletes: # we may now destroy the previous source snapshot if its obsolete
prev_source_snapshot.destroy() if prev_source_snapshot in source_obsoletes:
prev_source_snapshot.destroy()
# destroy the previous target snapshot if obsolete (usually this is only the common_snapshot, # destroy the previous target snapshot if obsolete (usually this is only the common_snapshot,
# the rest was already destroyed or will not be send) # the rest was already destroyed or will not be send)
prev_target_snapshot = target_dataset.find_snapshot(prev_source_snapshot) prev_target_snapshot = target_dataset.find_snapshot(prev_source_snapshot)
if prev_target_snapshot in target_obsoletes: if prev_target_snapshot in target_obsoletes:
prev_target_snapshot.destroy() prev_target_snapshot.destroy()
prev_source_snapshot = source_snapshot prev_source_snapshot = source_snapshot
else: else:
@ -799,4 +821,4 @@ class ZfsDataset:
target_dataset.abort_resume() target_dataset.abort_resume()
resume_token = None resume_token = None
source_snapshot = self.find_next_snapshot(source_snapshot, other_snapshots) source_snapshot = self.find_next_snapshot(source_snapshot, also_other_snapshots)