import re
from datetime import datetime
import sys
import time

from .CachedProperty import CachedProperty
from .ExecuteNode import ExecuteError

class ZfsDataset:
    """A ZFS dataset (filesystem/volume/snapshot/clone). Note that a dataset
    doesn't have to actually exist (yet/anymore). Also, most properties are cached
    for performance reasons, but also to allow --test to function correctly.
    """

    # illegal properties per dataset type. these will be removed from --set-properties and --filter-properties
    ILLEGAL_PROPERTIES = {
        'filesystem': [],
        'volume': ["canmount"],
    }

    def __init__(self, zfs_node, name, force_exists=None):
        """
        Args:
            :type zfs_node: ZfsNode.ZfsNode
            :type name: str
            :type force_exists: bool
        """
        self.zfs_node = zfs_node
        self.name = name  # full name
        self._virtual_snapshots = []
        self.invalidate()
        self.force_exists = force_exists

    def __repr__(self):
        return "{}: {}".format(self.zfs_node, self.name)

    def __str__(self):
        return self.name

    def __eq__(self, obj):
        if not isinstance(obj, ZfsDataset):
            return False

        return self.name == obj.name

    def verbose(self, txt):
        """
        Args:
            :type txt: str
        """
        self.zfs_node.verbose("{}: {}".format(self.name, txt))

    def error(self, txt):
        """
        Args:
            :type txt: str
        """
        self.zfs_node.error("{}: {}".format(self.name, txt))

    def debug(self, txt):
        """
        Args:
            :type txt: str
        """
        self.zfs_node.debug("{}: {}".format(self.name, txt))

    def invalidate(self):
        """clear caches"""
        CachedProperty.clear(self)
        self.force_exists = None
        self._virtual_snapshots = []

    def split_path(self):
        """return the path elements as an array"""
        return self.name.split("/")

    def lstrip_path(self, count):
        """return name with first count components stripped

        Args:
            :type count: int
        """
        components = self.split_path()
        if count > len(components):
            raise Exception("Trying to strip too much from path ({} items from {})".format(count, self.name))

        return "/".join(components[count:])

    def rstrip_path(self, count):
        """return name with last count components stripped

        Args:
            :type count: int
        """
        return "/".join(self.split_path()[:-count])
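
    # Illustrative sketch (not part of the original code): how the path helpers
    # above behave for a hypothetical dataset name "rpool/data/home":
    #   split_path()   -> ["rpool", "data", "home"]
    #   lstrip_path(1) -> "data/home"
    #   rstrip_path(1) -> "rpool/data"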

    @property
    def filesystem_name(self):
        """filesystem part of the name (before the @)"""
        if self.is_snapshot:
            (filesystem, snapshot) = self.name.split("@")
            return filesystem
        else:
            return self.name

    @property
    def snapshot_name(self):
        """snapshot part of the name"""
        if not self.is_snapshot:
            raise (Exception("This is not a snapshot"))

        (filesystem, snapshot_name) = self.name.split("@")
        return snapshot_name

    @property
    def is_snapshot(self):
        """true if this dataset is a snapshot"""
        return self.name.find("@") != -1

    def is_selected(self, value, source, inherited, exclude_received, exclude_paths, exclude_unchanged):
        """determine if dataset should be selected for backup (called from
        ZfsNode)

        Args:
            :type exclude_paths: list of str
            :type value: str
            :type source: str
            :type inherited: bool
            :type exclude_received: bool
            :type exclude_unchanged: int

            :param value: Value of the zfs property ("false"/"true"/"child"/"parent"/"-")
            :param source: Source of the zfs property ("local"/"received"/"-")
            :param inherited: True if the value/source was inherited from a higher dataset.

        Returns: True : Selected
                 False: Excluded
                 None : No property found
        """

        # sanity checks
        if source not in ["local", "received", "-"]:
            # probably a program error in zfs-autobackup or new feature in zfs
            raise (Exception(
                "{} autobackup-property has illegal source: '{}' (possible BUG)".format(self.name, source)))

        if value not in ["false", "true", "child", "parent", "-"]:
            # user error
            raise (Exception(
                "{} autobackup-property has illegal value: '{}'".format(self.name, value)))

        # not specified, ignore
        if value == "-":
            return None

        # only select children of this dataset, ignore
        if value == "child" and not inherited:
            return False

        # only select the parent, no children, ignore
        if value == "parent" and inherited:
            return False

        # manually excluded by property
        if value == "false":
            self.verbose("Excluded")
            return False

        # from here on the dataset is selected by property, now do additional exclusion checks

        # our path starts with one of the excluded paths?
        for exclude_path in exclude_paths:
            # if self.name.startswith(exclude_path):
            if (self.name + "/").startswith(exclude_path + "/"):
                # too noisy for verbose
                self.debug("Excluded (path in exclude list)")
                return False

        if source == "received":
            if exclude_received:
                self.verbose("Excluded (dataset already received)")
                return False

        if not self.is_changed(exclude_unchanged):
            self.verbose("Excluded (by --exclude-unchanged)")
            return False

        self.verbose("Selected")
        return True
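
    # Usage sketch (hypothetical values, not part of the original code): ZfsNode
    # reads the autobackup property and calls is_selected() with its value and
    # source. For a dataset with the property set locally to "true", no exclude
    # paths and --exclude-unchanged disabled, the dataset is selected:
    #   ds.is_selected(value="true", source="local", inherited=False,
    #                  exclude_received=False, exclude_paths=[], exclude_unchanged=0)
    #   -> True   (exclude_unchanged=0 makes is_changed() return True immediately)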

    @CachedProperty
    def parent(self):
        """get zfs-parent of this dataset. For snapshots this means it will get
        the filesystem/volume that it belongs to. Otherwise it will return the
        parent according to path.

        We cache this so everything in the parent that is cached also stays.

        Returns None if there is no parent.
        """
        if self.is_snapshot:
            return self.zfs_node.get_dataset(self.filesystem_name)
        else:
            stripped = self.rstrip_path(1)
            if stripped:
                return self.zfs_node.get_dataset(stripped)
            else:
                return None

    # NOTE: unused for now
    # def find_prev_snapshot(self, snapshot, also_other_snapshots=False):
    #     """find previous snapshot in this dataset. None if it doesn't exist.
    #
    #     also_other_snapshots: set to true to also return snapshots that were
    #     not created by us. (is_ours)
    #
    #     Args:
    #         :type snapshot: str or ZfsDataset.ZfsDataset
    #         :type also_other_snapshots: bool
    #     """
    #
    #     if self.is_snapshot:
    #         raise (Exception("Please call this on a dataset."))
    #
    #     index = self.find_snapshot_index(snapshot)
    #     while index:
    #         index = index - 1
    #         if also_other_snapshots or self.snapshots[index].is_ours():
    #             return self.snapshots[index]
    #     return None

    def find_next_snapshot(self, snapshot, also_other_snapshots=False):
        """find next snapshot in this dataset. None if it doesn't exist

        Args:
            :type snapshot: ZfsDataset
            :type also_other_snapshots: bool
        """

        if self.is_snapshot:
            raise (Exception("Please call this on a dataset."))

        index = self.find_snapshot_index(snapshot)
        while index is not None and index < len(self.snapshots) - 1:
            index = index + 1
            if also_other_snapshots or self.snapshots[index].is_ours():
                return self.snapshots[index]
        return None

    @CachedProperty
    def exists(self):
        """check if dataset exists. Use force to force a specific value to be
        cached, if you already know. Useful for performance reasons
        """

        if self.force_exists is not None:
            self.debug("Checking if filesystem exists: was forced to {}".format(self.force_exists))
            return self.force_exists
        else:
            self.debug("Checking if filesystem exists")

        return (self.zfs_node.run(tab_split=True, cmd=["zfs", "list", self.name], readonly=True, valid_exitcodes=[0, 1],
                                  hide_errors=True) and True)

    def create_filesystem(self, parents=False):
        """create a filesystem

        Args:
            :type parents: bool
        """
        if parents:
            self.verbose("Creating filesystem and parents")
            self.zfs_node.run(["zfs", "create", "-p", self.name])
        else:
            self.verbose("Creating filesystem")
            self.zfs_node.run(["zfs", "create", self.name])

        self.force_exists = True

    def destroy(self, fail_exception=False, deferred=False, verbose=True):
        """destroy the dataset. by default failures are not an exception, so we
        can continue making backups

        Args:
            :type fail_exception: bool
        """

        if verbose:
            self.verbose("Destroying")
        else:
            self.debug("Destroying")

        if self.is_snapshot:
            self.release()

        try:
            if deferred and self.is_snapshot:
                self.zfs_node.run(["zfs", "destroy", "-d", self.name])
            else:
                self.zfs_node.run(["zfs", "destroy", self.name])

            self.invalidate()
            self.force_exists = False
            return True
        except ExecuteError:
            if not fail_exception:
                return False
            else:
                raise

    @CachedProperty
    def properties(self):
        """all zfs properties"""

        cmd = [
            "zfs", "get", "-H", "-o", "property,value", "-p", "all", self.name
        ]

        if not self.exists:
            return {}

        self.debug("Getting zfs properties")

        ret = {}
        for pair in self.zfs_node.run(tab_split=True, cmd=cmd, readonly=True, valid_exitcodes=[0]):
            if len(pair) == 2:
                ret[pair[0]] = pair[1]

        return ret

    def is_changed(self, min_changed_bytes=1):
        """dataset is changed since ANY latest snapshot?

        Args:
            :type min_changed_bytes: int
        """
        self.debug("Checking if dataset is changed")

        if min_changed_bytes == 0:
            return True

        if int(self.properties['written']) < min_changed_bytes:
            return False
        else:
            return True

    def is_ours(self):
        """return true if this snapshot name has the correct format"""
        try:
            test = self.timestamp
        except ValueError:
            return False

        return True

    @property
    def holds(self):
        """get list of holds for dataset"""

        output = self.zfs_node.run(["zfs", "holds", "-H", self.name], valid_exitcodes=[0], tab_split=True,
                                   readonly=True)
        return map(lambda fields: fields[1], output)

    def is_hold(self):
        """did we hold this snapshot?"""
        return self.zfs_node.hold_name in self.holds

    def hold(self):
        """hold dataset"""
        self.debug("holding")
        self.zfs_node.run(["zfs", "hold", self.zfs_node.hold_name, self.name], valid_exitcodes=[0, 1])

    def release(self):
        """release dataset"""
        if self.zfs_node.readonly or self.is_hold():
            self.debug("releasing")
            self.zfs_node.run(["zfs", "release", self.zfs_node.hold_name, self.name], valid_exitcodes=[0, 1])

    @property
    def timestamp(self):
        """get timestamp from snapshot name. Only works for our own snapshots
        with the correct format.
        """
        dt = datetime.strptime(self.snapshot_name, self.zfs_node.snapshot_time_format)
        if sys.version_info[0] >= 3:
            from datetime import timezone
            if self.zfs_node.utc:
                dt = dt.replace(tzinfo=timezone.utc)
            seconds = dt.timestamp()
        else:
            # python2 has no good functions to deal with UTC. Yet the unix timestamp
            # must be in UTC to allow comparison against `time.time()` in other parts
            # of this project (e.g. Thinner.py). If we are handling UTC timestamps,
            # we must adjust for that here.
            if self.zfs_node.utc:
                seconds = (dt - datetime(1970, 1, 1)).total_seconds()
            else:
                seconds = time.mktime(dt.timetuple())
        return seconds
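
    # Illustrative sketch (not part of the original code): with a hypothetical
    # snapshot_time_format of "test-%Y%m%d%H%M%S" and utc enabled, a snapshot
    # named "rpool/data@test-20240101120000" parses as 2024-01-01 12:00:00 UTC,
    # so `timestamp` returns the corresponding unix time (1704110400.0).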

    def from_names(self, names):
        """convert a list of names to a list of ZfsDatasets for this zfs_node

        Args:
            :type names: list of str
        """
        ret = []
        for name in names:
            ret.append(self.zfs_node.get_dataset(name))

        return ret

    # def add_virtual_snapshot(self, snapshot):
    #     """pretend a snapshot exists (useful in test mode)"""
    #
    #     # NOTE: we could just call self.snapshots.append() but this would trigger a zfs list which is not always needed.
    #     if CachedProperty.is_cached(self, 'snapshots'):
    #         # already cached so add it
    #         print ("ADDED")
    #         self.snapshots.append(snapshot)
    #     else:
    #         # self.snapshots will add it when requested
    #         print ("ADDED VIRT")
    #         self._virtual_snapshots.append(snapshot)

    @CachedProperty
    def snapshots(self):
        """get all snapshots of this dataset"""

        if not self.exists:
            return []

        self.debug("Getting snapshots")

        cmd = [
            "zfs", "list", "-d", "1", "-r", "-t", "snapshot", "-H", "-o", "name", self.name
        ]

        return self.from_names(self.zfs_node.run(cmd=cmd, readonly=True))

    @property
    def our_snapshots(self):
        """get list of snapshots created by us of this dataset"""
        ret = []
        for snapshot in self.snapshots:
            if snapshot.is_ours():
                ret.append(snapshot)

        return ret

    def find_snapshot(self, snapshot):
        """find snapshot by snapshot (can be a snapshot_name or a different
        ZfsDataset)

        Args:
            :rtype: ZfsDataset
            :type snapshot: str or ZfsDataset
        """

        if not isinstance(snapshot, ZfsDataset):
            snapshot_name = snapshot
        else:
            snapshot_name = snapshot.snapshot_name

        for snapshot in self.snapshots:
            if snapshot.snapshot_name == snapshot_name:
                return snapshot

        return None

    def find_snapshot_index(self, snapshot):
        """find snapshot index by snapshot (can be a snapshot_name or
        ZfsDataset)

        Args:
            :type snapshot: str or ZfsDataset
        """

        if not isinstance(snapshot, ZfsDataset):
            snapshot_name = snapshot
        else:
            snapshot_name = snapshot.snapshot_name

        index = 0
        for snapshot in self.snapshots:
            if snapshot.snapshot_name == snapshot_name:
                return index
            index = index + 1

        return None

    @CachedProperty
    def written_since_ours(self):
        """get number of bytes written since our last snapshot"""

        latest_snapshot = self.our_snapshots[-1]

        self.debug("Getting bytes written since our last snapshot")
        cmd = ["zfs", "get", "-H", "-ovalue", "-p", "written@" + str(latest_snapshot), self.name]

        output = self.zfs_node.run(readonly=True, tab_split=False, cmd=cmd, valid_exitcodes=[0])

        return int(output[0])

    def is_changed_ours(self, min_changed_bytes=1):
        """dataset is changed since OUR latest snapshot?

        Args:
            :type min_changed_bytes: int
        """

        if min_changed_bytes == 0:
            return True

        if not self.our_snapshots:
            return True

        # NOTE: filesystems can have a very small amount written without actual changes in some cases
        if self.written_since_ours < min_changed_bytes:
            return False

        return True
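
    # Note (illustrative, not part of the original code): a sketch of how this
    # check behaves, assuming our last snapshot exists and `written_since_ours`
    # reports 0 bytes written since then:
    #   ds.is_changed_ours(min_changed_bytes=1) -> False  (nothing changed since our snapshot)
    #   ds.is_changed_ours(min_changed_bytes=0) -> True   (a value of 0 disables the check)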

    @CachedProperty
    def recursive_datasets(self, types="filesystem,volume"):
        """get all (non-snapshot) datasets recursively under us

        Args:
            :type types: str
        """

        self.debug("Getting all recursive datasets under us")

        names = self.zfs_node.run(tab_split=False, readonly=True, valid_exitcodes=[0], cmd=[
            "zfs", "list", "-r", "-t", types, "-o", "name", "-H", self.name
        ])

        return self.from_names(names[1:])

    @CachedProperty
    def datasets(self, types="filesystem,volume"):
        """get all (non-snapshot) datasets directly under us

        Args:
            :type types: str
        """

        self.debug("Getting all datasets under us")

        names = self.zfs_node.run(tab_split=False, readonly=True, valid_exitcodes=[0], cmd=[
            "zfs", "list", "-r", "-t", types, "-o", "name", "-H", "-d", "1", self.name
        ])

        return self.from_names(names[1:])

    def send_pipe(self, features, prev_snapshot, resume_token, show_progress, raw, send_properties, write_embedded, send_pipes, zfs_compressed):
        """returns a pipe with zfs send output for this snapshot

        resume_token: resume sending from this token. (in that case we don't
        need to know snapshot names)

        Args:
            :param send_pipes: output cmd array that will be added to actual zfs send command. (e.g. mbuffer or compression program)
            :type send_pipes: list of str
            :type features: list of str
            :type prev_snapshot: ZfsDataset
            :type resume_token: str
            :type show_progress: bool
            :type raw: bool
        """
        # build source command
        cmd = []

        cmd.extend(["zfs", "send", ])

        # all kinds of performance options:
        if 'large_blocks' in features and "-L" in self.zfs_node.supported_send_options:
            # large block support (only if recordsize>128k, which is seldom used)
            cmd.append("-L")  # --large-block

        if write_embedded and 'embedded_data' in features and "-e" in self.zfs_node.supported_send_options:
            cmd.append("-e")  # --embed; WRITE_EMBEDDED, more compact stream

        if zfs_compressed and "-c" in self.zfs_node.supported_send_options:
            cmd.append("-c")  # --compressed; use compressed WRITE records

        # raw? (send over encrypted data in its original encrypted form without decrypting)
        if raw:
            cmd.append("--raw")

        # progress output
        if show_progress:
            cmd.append("-v")  # --verbose
            cmd.append("-P")  # --parsable

        # resume a previous send? (don't need more parameters in that case)
        if resume_token:
            cmd.extend(["-t", resume_token])

        else:
            # send properties
            if send_properties:
                cmd.append("-p")  # --props

            # incremental?
            if prev_snapshot:
                cmd.extend(["-i", "@" + prev_snapshot.snapshot_name])

            cmd.append(self.name)

        cmd.extend(send_pipes)

        output_pipe = self.zfs_node.run(cmd, pipe=True, readonly=True)

        return output_pipe

    def recv_pipe(self, pipe, features, recv_pipes, filter_properties=None, set_properties=None, ignore_exit_code=False, force=False):
        """starts a zfs recv for this snapshot and uses pipe as input

        note: you can call this on both a snapshot and a filesystem object. The
        resulting zfs command is the same, only our object cache is invalidated
        differently.

        Args:
            :param recv_pipes: input cmd array that will be prepended to actual zfs recv command. (e.g. mbuffer or decompression program)
            :type pipe: subprocess.Popen
            :type features: list of str
            :type filter_properties: list of str
            :type set_properties: list of str
            :type ignore_exit_code: bool
        """

        if set_properties is None:
            set_properties = []

        if filter_properties is None:
            filter_properties = []

        # build target command
        cmd = []

        cmd.extend(recv_pipes)

        cmd.extend(["zfs", "recv"])

        # don't mount filesystem that is received
        cmd.append("-u")

        for property_ in filter_properties:
            cmd.extend(["-x", property_])

        for property_ in set_properties:
            cmd.extend(["-o", property_])

        # verbose output
        cmd.append("-v")

        if force:
            cmd.append("-F")

        if 'extensible_dataset' in features and "-s" in self.zfs_node.supported_recv_options:
            # support resuming
            self.debug("Enabled resume support")
            cmd.append("-s")

        cmd.append(self.filesystem_name)

        if ignore_exit_code:
            valid_exitcodes = []
        else:
            valid_exitcodes = [0]

        # self.zfs_node.reset_progress()
        self.zfs_node.run(cmd, inp=pipe, valid_exitcodes=valid_exitcodes)

        # invalidate cache, but we at least know we exist now
        self.invalidate()

        # in test mode we assume everything was ok and it exists
        if self.zfs_node.readonly:
            self.force_exists = True

        # check if transfer was really ok (exit codes have been wrong before due to bugs in zfs-utils and some
        # errors should be ignored, that's what ignore_exit_code is for.)
        if not self.exists:
            self.error("error during transfer")
            raise (Exception("Target doesn't exist after transfer, something went wrong."))

    def transfer_snapshot(self, target_snapshot, features, prev_snapshot, show_progress,
                          filter_properties, set_properties, ignore_recv_exit_code, resume_token,
                          raw, send_properties, write_embedded, send_pipes, recv_pipes, zfs_compressed, force):
        """transfer this snapshot to target_snapshot. specify prev_snapshot for
        incremental transfer

        connects a send_pipe() to recv_pipe()

        Args:
            :type send_pipes: list of str
            :type recv_pipes: list of str
            :type target_snapshot: ZfsDataset
            :type features: list of str
            :type prev_snapshot: ZfsDataset
            :type show_progress: bool
            :type filter_properties: list of str
            :type set_properties: list of str
            :type ignore_recv_exit_code: bool
            :type resume_token: str
            :type raw: bool
        """

        if set_properties is None:
            set_properties = []
        if filter_properties is None:
            filter_properties = []

        self.debug("Transfer snapshot to {}".format(target_snapshot.filesystem_name))

        if resume_token:
            target_snapshot.verbose("resuming")

        # initial or incremental transfer?
        if not prev_snapshot:
            target_snapshot.verbose("receiving full".format(self.snapshot_name))
        else:
            # incremental
            target_snapshot.verbose("receiving incremental".format(self.snapshot_name))

        # do it
        pipe = self.send_pipe(features=features, show_progress=show_progress, prev_snapshot=prev_snapshot,
                              resume_token=resume_token, raw=raw, send_properties=send_properties, write_embedded=write_embedded, send_pipes=send_pipes, zfs_compressed=zfs_compressed)
        target_snapshot.recv_pipe(pipe, features=features, filter_properties=filter_properties,
                                  set_properties=set_properties, ignore_exit_code=ignore_recv_exit_code, recv_pipes=recv_pipes, force=force)

    def abort_resume(self):
        """abort current resume state"""
        self.debug("Aborting resume")
        self.zfs_node.run(["zfs", "recv", "-A", self.name])

    def rollback(self):
        """rollback to latest existing snapshot on this dataset"""

        for snapshot in reversed(self.snapshots):
            if snapshot.exists:
                self.debug("Rolling back")
                self.zfs_node.run(["zfs", "rollback", snapshot.name])
                return

    def get_resume_snapshot(self, resume_token):
        """returns snapshot that will be resumed by this resume token (run this
        on source with target-token)

        Args:
            :type resume_token: str
        """
        # use zfs send -n option to determine this
        # NOTE: on smartos stderr, on linux stdout
        (stdout, stderr) = self.zfs_node.run(["zfs", "send", "-t", resume_token, "-n", "-v"], valid_exitcodes=[0, 255],
                                             readonly=True, return_stderr=True)
        if stdout:
            lines = stdout
        else:
            lines = stderr
        for line in lines:
            matches = re.findall("toname = .*@(.*)", line)
            if matches:
                snapshot_name = matches[0]
                snapshot = self.zfs_node.get_dataset(self.filesystem_name + "@" + snapshot_name)
                snapshot.debug("resume token belongs to this snapshot")
                return snapshot

        return None

    def thin_list(self, keeps=None, ignores=None):
        """determines list of snapshots that should be kept or deleted based on
        the thinning schedule. cull the herd!

        returns: ( keeps, obsoletes )

        Args:
            :param keeps: list of snapshots to always keep (usually the last)
            :param ignores: snapshots to completely ignore (usually incompatible target snapshots that are going to be destroyed anyway)
            :type keeps: list of ZfsDataset
            :type ignores: list of ZfsDataset
        """

        if ignores is None:
            ignores = []
        if keeps is None:
            keeps = []

        snapshots = [snapshot for snapshot in self.our_snapshots if snapshot not in ignores]

        return self.zfs_node.thin(snapshots, keep_objects=keeps)

    def thin(self, skip_holds=False):
        """destroys snapshots according to thin_list, except last snapshot

        Args:
            :type skip_holds: bool
        """

        (keeps, obsoletes) = self.thin_list(keeps=self.our_snapshots[-1:])
        for obsolete in obsoletes:
            if skip_holds and obsolete.is_hold():
                obsolete.verbose("Keeping (common snapshot)")
            else:
                obsolete.destroy()
                self.snapshots.remove(obsolete)
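
    # Illustrative sketch (not part of the original code): thin_list() delegates the
    # actual keep/expire decision to the node's thinner via self.zfs_node.thin().
    # For example, if our_snapshots is [s1, s2, s3] and the thinning schedule only
    # wants the newest snapshot, thin_list(keeps=[s3]) would return something like
    # ([s3], [s1, s2]), and thin() would then destroy s1 and s2.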

    def find_common_snapshot(self, target_dataset):
        """find latest common snapshot between us and target. Returns None if
        it's an initial transfer

        Args:
            :type target_dataset: ZfsDataset
        """
        if not target_dataset.snapshots:
            # target has nothing yet
            return None
        else:
            for source_snapshot in reversed(self.snapshots):
                if target_dataset.find_snapshot(source_snapshot):
                    source_snapshot.debug("common snapshot")
                    return source_snapshot
            target_dataset.error("Cant find common snapshot with source.")
            raise (Exception("You probably need to delete the target dataset to fix this."))

    def find_start_snapshot(self, common_snapshot, also_other_snapshots):
        """finds first snapshot to send. :rtype: ZfsDataset or None if we can't
        find it.

        Args:
            :type common_snapshot: ZfsDataset
            :type also_other_snapshots: bool
        """

        if not common_snapshot:
            if not self.snapshots:
                start_snapshot = None
            else:
                # no common snapshot, start from beginning
                start_snapshot = self.snapshots[0]

                if not start_snapshot.is_ours() and not also_other_snapshots:
                    # try to start at a snapshot that's ours
                    start_snapshot = self.find_next_snapshot(start_snapshot, also_other_snapshots)
        else:
            # normal situation: start_snapshot is the one after the common snapshot
            start_snapshot = self.find_next_snapshot(common_snapshot, also_other_snapshots)

        return start_snapshot

    def find_incompatible_snapshots(self, common_snapshot):
        """returns a list of snapshots that are incompatible for a zfs recv onto
        the common_snapshot. all direct followup snapshots with written=0 are
        compatible.

        Args:
            :type common_snapshot: ZfsDataset
        """

        ret = []

        if common_snapshot and self.snapshots:
            followup = True
            for snapshot in self.snapshots[self.find_snapshot_index(common_snapshot) + 1:]:
                if not followup or int(snapshot.properties['written']) != 0:
                    followup = False
                    ret.append(snapshot)

        return ret
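
    # Illustrative sketch (not part of the original code): suppose the target has
    # snapshots [c, t1, t2] where c is the common snapshot, t1 has written=0 and
    # t2 has written>0. Then find_incompatible_snapshots(c) returns [t2]: t1 is a
    # direct, empty follow-up of c and can be received over, while t2 (and anything
    # after it) would block an incremental zfs recv.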

    def get_allowed_properties(self, filter_properties, set_properties):
        """only returns lists of allowed properties for this dataset type

        Args:
            :type filter_properties: list of str
            :type set_properties: list of str
        """

        allowed_filter_properties = []
        allowed_set_properties = []
        illegal_properties = self.ILLEGAL_PROPERTIES[self.properties['type']]
        for set_property in set_properties:
            (property_, value) = set_property.split("=")
            if property_ not in illegal_properties:
                allowed_set_properties.append(set_property)

        for filter_property in filter_properties:
            if filter_property not in illegal_properties:
                allowed_filter_properties.append(filter_property)

        return allowed_filter_properties, allowed_set_properties
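
    # Illustrative sketch (not part of the original code): for a volume, "canmount"
    # is in ILLEGAL_PROPERTIES, so it is dropped from both lists:
    #   vol.get_allowed_properties(["canmount", "refreservation"], ["canmount=off", "compression=lz4"])
    #   -> (["refreservation"], ["compression=lz4"])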

    def _add_virtual_snapshots(self, source_dataset, source_start_snapshot, also_other_snapshots):
        """add snapshots from source to our snapshot list. (just the in memory
        list, no disk operations)

        Args:
            :type source_dataset: ZfsDataset
            :type source_start_snapshot: ZfsDataset
            :type also_other_snapshots: bool
        """

        self.debug("Creating virtual target snapshots")
        snapshot = source_start_snapshot
        while snapshot:
            # create virtual target snapshot
            # NOTE: with force_exists we're telling the dataset it doesn't exist yet. (i.e. it's virtual)
            virtual_snapshot = self.zfs_node.get_dataset(self.filesystem_name + "@" + snapshot.snapshot_name, force_exists=False)
            self.snapshots.append(virtual_snapshot)
            snapshot = source_dataset.find_next_snapshot(snapshot, also_other_snapshots)

    def _pre_clean(self, common_snapshot, target_dataset, source_obsoletes, target_obsoletes, target_keeps):
        """cleanup old stuff before starting snapshot syncing

        Args:
            :type common_snapshot: ZfsDataset
            :type target_dataset: ZfsDataset
            :type source_obsoletes: list of ZfsDataset
            :type target_obsoletes: list of ZfsDataset
            :type target_keeps: list of ZfsDataset
        """

        # on source: destroy all obsoletes before common. (since we can't send them anyway)
        # But after common, only delete snapshots that target also doesn't want
        if common_snapshot:
            before_common = True
        else:
            before_common = False

        for source_snapshot in self.snapshots:
            if common_snapshot and source_snapshot.snapshot_name == common_snapshot.snapshot_name:
                before_common = False
                # never destroy common snapshot
            else:
                target_snapshot = target_dataset.find_snapshot(source_snapshot)
                if (source_snapshot in source_obsoletes) and (before_common or (target_snapshot not in target_keeps)):
                    source_snapshot.destroy()

        # on target: destroy everything that's obsolete, except common_snapshot
        for target_snapshot in target_dataset.snapshots:
            if (target_snapshot in target_obsoletes) \
                    and (not common_snapshot or (target_snapshot.snapshot_name != common_snapshot.snapshot_name)):
                if target_snapshot.exists:
                    target_snapshot.destroy()

    def _validate_resume_token(self, target_dataset, start_snapshot):
        """validate and get (or destroy) resume token

        Args:
            :type target_dataset: ZfsDataset
            :type start_snapshot: ZfsDataset
        """

        if 'receive_resume_token' in target_dataset.properties:
            if start_snapshot is None:
                target_dataset.verbose("Aborting resume, its obsolete.")
                target_dataset.abort_resume()
            else:
                resume_token = target_dataset.properties['receive_resume_token']
                # not valid anymore
                resume_snapshot = self.get_resume_snapshot(resume_token)
                if not resume_snapshot or start_snapshot.snapshot_name != resume_snapshot.snapshot_name:
                    target_dataset.verbose("Aborting resume, its no longer valid.")
                    target_dataset.abort_resume()
                else:
                    return resume_token

    def _plan_sync(self, target_dataset, also_other_snapshots):
        """plan where to start syncing and what to sync and what to keep

        Args:
            :rtype: ( ZfsDataset, ZfsDataset, list of ZfsDataset, list of ZfsDataset, list of ZfsDataset, list of ZfsDataset )
            :type target_dataset: ZfsDataset
            :type also_other_snapshots: bool
        """

        # determine common and start snapshot
        target_dataset.debug("Determining start snapshot")
        common_snapshot = self.find_common_snapshot(target_dataset)
        start_snapshot = self.find_start_snapshot(common_snapshot, also_other_snapshots)
        incompatible_target_snapshots = target_dataset.find_incompatible_snapshots(common_snapshot)

        # let thinner decide what's obsolete on source
        source_obsoletes = []
        if self.our_snapshots:
            source_obsoletes = self.thin_list(keeps=[self.our_snapshots[-1]])[1]

        # let thinner decide keeps/obsoletes on target, AFTER the transfer would be done (by using virtual snapshots)
        target_dataset._add_virtual_snapshots(self, start_snapshot, also_other_snapshots)
        target_keeps = []
        target_obsoletes = []
        if target_dataset.our_snapshots:
            (target_keeps, target_obsoletes) = target_dataset.thin_list(keeps=[target_dataset.our_snapshots[-1]],
                                                                        ignores=incompatible_target_snapshots)

        return common_snapshot, start_snapshot, source_obsoletes, target_obsoletes, target_keeps, incompatible_target_snapshots

    def handle_incompatible_snapshots(self, incompatible_target_snapshots, destroy_incompatible):
        """destroy incompatible snapshots on target before sync, or inform user
        what to do

        Args:
            :type incompatible_target_snapshots: list of ZfsDataset
            :type destroy_incompatible: bool
        """

        if incompatible_target_snapshots:
            if not destroy_incompatible:
                for snapshot in incompatible_target_snapshots:
                    snapshot.error("Incompatible snapshot")
                raise (Exception("Please destroy incompatible snapshots or use --destroy-incompatible."))
            else:
                for snapshot in incompatible_target_snapshots:
                    snapshot.verbose("Incompatible snapshot")
                    snapshot.destroy()
                    self.snapshots.remove(snapshot)

    def sync_snapshots(self, target_dataset, features, show_progress, filter_properties, set_properties,
                       ignore_recv_exit_code, holds, rollback, decrypt, encrypt, also_other_snapshots,
                       no_send, destroy_incompatible, send_pipes, recv_pipes, zfs_compressed, force):
        """sync this dataset's snapshots to target_dataset, while also thinning
        out old snapshots along the way.

        Args:
            :type send_pipes: list of str
            :type recv_pipes: list of str
            :type target_dataset: ZfsDataset
            :type features: list of str
            :type show_progress: bool
            :type filter_properties: list of str
            :type set_properties: list of str
            :type ignore_recv_exit_code: bool
            :type holds: bool
            :type rollback: bool
            :type decrypt: bool
            :type also_other_snapshots: bool
            :type no_send: bool
            :type destroy_incompatible: bool
        """

        self.verbose("sending to {}".format(target_dataset))

        (common_snapshot, start_snapshot, source_obsoletes, target_obsoletes, target_keeps,
         incompatible_target_snapshots) = \
            self._plan_sync(target_dataset=target_dataset, also_other_snapshots=also_other_snapshots)

        # NOTE: we do this because we don't want filesystems to fill up when backups keep failing.
        # Also useful with no_send to still clean up stuff.
        self._pre_clean(
            common_snapshot=common_snapshot, target_dataset=target_dataset,
            target_keeps=target_keeps, target_obsoletes=target_obsoletes, source_obsoletes=source_obsoletes)

        # handle incompatible stuff on target
        target_dataset.handle_incompatible_snapshots(incompatible_target_snapshots, destroy_incompatible)

        # now actually transfer the snapshots, if we want to
        if no_send:
            return

        # check if we can resume
        resume_token = self._validate_resume_token(target_dataset, start_snapshot)

        # rollback target to latest?
        if rollback:
            target_dataset.rollback()

        # defaults for these settings if there is no encryption stuff going on:
        send_properties = True
        raw = False
        write_embedded = True

        (active_filter_properties, active_set_properties) = self.get_allowed_properties(filter_properties, set_properties)

        # source dataset encrypted?
        if self.properties.get('encryption', 'off') != 'off':
            # user wants to send it over decrypted?
            if decrypt:
                # when decrypting, zfs can't send properties
                send_properties = False
            else:
                # keep data encrypted by sending it raw (including properties)
                raw = True

        # encrypt at target?
        if encrypt and not raw:
            # filter out encryption properties to let encryption on the target take place
            active_filter_properties.extend(["keylocation", "pbkdf2iters", "keyformat", "encryption"])
            write_embedded = False

        # now actually transfer the snapshots
        prev_source_snapshot = common_snapshot
        source_snapshot = start_snapshot
        while source_snapshot:
            target_snapshot = target_dataset.find_snapshot(source_snapshot)  # still virtual

            # does target actually want it?
            if target_snapshot not in target_obsoletes:

                source_snapshot.transfer_snapshot(target_snapshot, features=features,
                                                  prev_snapshot=prev_source_snapshot, show_progress=show_progress,
                                                  filter_properties=active_filter_properties,
                                                  set_properties=active_set_properties,
                                                  ignore_recv_exit_code=ignore_recv_exit_code,
                                                  resume_token=resume_token, write_embedded=write_embedded, raw=raw,
                                                  send_properties=send_properties, send_pipes=send_pipes,
                                                  recv_pipes=recv_pipes, zfs_compressed=zfs_compressed, force=force)

                resume_token = None

                # hold the new common snapshots and release the previous ones
                if holds:
                    target_snapshot.hold()
                    source_snapshot.hold()

                if prev_source_snapshot:
                    if holds:
                        prev_source_snapshot.release()
                        target_dataset.find_snapshot(prev_source_snapshot).release()

                    # we may now destroy the previous source snapshot if it's obsolete
                    if prev_source_snapshot in source_obsoletes:
                        prev_source_snapshot.destroy()

                    # destroy the previous target snapshot if obsolete (usually this is only the common_snapshot,
                    # the rest was already destroyed or will not be sent)
                    prev_target_snapshot = target_dataset.find_snapshot(prev_source_snapshot)
                    if prev_target_snapshot in target_obsoletes:
                        prev_target_snapshot.destroy()

                prev_source_snapshot = source_snapshot
            else:
                source_snapshot.debug("skipped (target doesn't need it)")
                # was it actually a resume?
                if resume_token:
                    target_dataset.verbose("Aborting resume, we dont want that snapshot anymore.")
                    target_dataset.abort_resume()
                    resume_token = None

            source_snapshot = self.find_next_snapshot(source_snapshot, also_other_snapshots)

    def mount(self, mount_point):

        self.debug("Mounting")

        cmd = [
            "mount", "-tzfs", self.name, mount_point
        ]

        self.zfs_node.run(cmd=cmd, valid_exitcodes=[0])

    def unmount(self):

        self.debug("Unmounting")

        cmd = [
            "umount", self.name
        ]

        self.zfs_node.run(cmd=cmd, valid_exitcodes=[0])

    def clone(self, name):
        """clones this snapshot and returns ZfsDataset of the clone"""

        self.debug("Cloning to {}".format(name))

        cmd = [
            "zfs", "clone", self.name, name
        ]

        self.zfs_node.run(cmd=cmd, valid_exitcodes=[0])

        return self.zfs_node.get_dataset(name, force_exists=True)

    def set(self, prop, value):
        """set a zfs property"""

        self.debug("Setting {}={}".format(prop, value))

        cmd = [
            "zfs", "set", "{}={}".format(prop, value), self.name
        ]

        self.zfs_node.run(cmd=cmd, valid_exitcodes=[0])

        self.invalidate()

    def inherit(self, prop):
        """inherit zfs property"""

        self.debug("Inheriting property {}".format(prop))

        cmd = [
            "zfs", "inherit", prop, self.name
        ]

        self.zfs_node.run(cmd=cmd, valid_exitcodes=[0])

        self.invalidate()