#!/usr/bin/env python
# -*- coding: utf8 -*-
# (c)edwin@datux.nl - Released under GPL
#
# Greetings from eth0 2019 :)

from __future__ import print_function
import os
import sys
import re
import traceback
import subprocess
import pprint
import time
import argparse
from pprint import pprint as p
import select

use_color=False
if sys.stdout.isatty():
    try:
        import colorama
        use_color=True
    except ImportError:
        pass

VERSION="3.0-rc9"
HEADER="zfs-autobackup v{} - Copyright 2020 E.H.Eefting (edwin@datux.nl)\n".format(VERSION)


class Log:
    def __init__(self, show_debug=False, show_verbose=False):
        self.last_log=""
        self.show_debug=show_debug
        self.show_verbose=show_verbose

    def error(self, txt):
        if use_color:
            print(colorama.Fore.RED+colorama.Style.BRIGHT+ "! "+txt+colorama.Style.RESET_ALL, file=sys.stderr)
        else:
            print("! "+txt, file=sys.stderr)

    def verbose(self, txt):
        if self.show_verbose:
            if use_color:
                print(colorama.Style.NORMAL+ " "+txt+colorama.Style.RESET_ALL)
            else:
                print(" "+txt)

    def debug(self, txt):
        if self.show_debug:
            if use_color:
                print(colorama.Fore.GREEN+ "# "+txt+colorama.Style.RESET_ALL)
            else:
                print("# "+txt)


class ThinnerRule:
    """a thinning schedule rule for Thinner"""

    TIME_NAMES={
        'y'   : 3600 * 24 * 365.25,
        'm'   : 3600 * 24 * 30,
        'w'   : 3600 * 24 * 7,
        'd'   : 3600 * 24,
        'h'   : 3600,
        'min' : 60,
        's'   : 1,
    }

    TIME_DESC={
        'y'   : 'year',
        'm'   : 'month',
        'w'   : 'week',
        'd'   : 'day',
        'h'   : 'hour',
        'min' : 'minute',
        's'   : 'second',
    }

    def parse_rule(self, rule_str):
        """parse scheduling string
        examples:
            daily snapshot, remove after a week:     1d1w
            weekly snapshot, remove after a month:   1w1m
            monthly snapshot, remove after 6 months: 1m6m
            yearly snapshot, remove after 2 years:   1y2y
            keep all snapshots, remove after a day:  1s1d
            keep nothing:                            1s1s
        """

        rule_str=rule_str.lower()
        matches=re.findall("([0-9]*)([a-z]*)([0-9]*)([a-z]*)", rule_str)[0]

        period_amount=int(matches[0])
        period_unit=matches[1]
        ttl_amount=int(matches[2])
        ttl_unit=matches[3]

        if not period_unit in self.TIME_NAMES:
            raise(Exception("Invalid period string in schedule: '{}'".format(rule_str)))

        if not ttl_unit in self.TIME_NAMES:
            raise(Exception("Invalid ttl string in schedule: '{}'".format(rule_str)))

        self.period=period_amount * self.TIME_NAMES[period_unit]
        self.ttl=ttl_amount * self.TIME_NAMES[ttl_unit]

        if self.period>self.ttl:
            raise(Exception("Period can't be longer than ttl in schedule: '{}'".format(rule_str)))

        self.rule_str=rule_str

        self.human_str="Keep every {} {}{}, delete after {} {}{}.".format(
            period_amount, self.TIME_DESC[period_unit], period_amount!=1 and "s" or "",
            ttl_amount, self.TIME_DESC[ttl_unit], ttl_amount!=1 and "s" or "")

    def __str__(self):
        """get schedule as a schedule string"""
        return(self.rule_str)

    def __init__(self, rule_str):
        self.parse_rule(rule_str)
        pass


class Thinner:
    """progressive thinner (universal, used for cleaning up snapshots)"""

    def __init__(self, schedule_str=""):
        """schedule_str: comma separated list of ThinnerRules. A plain number specifies
        how many snapshots to always keep.
""" self.rules=[] self.always_keep=0 if schedule_str=="": return rule_strs=schedule_str.split(",") for rule_str in rule_strs: if rule_str.isdigit(): self.always_keep=int(rule_str) if self.always_keep<0: raise(Exception("Number of snapshots to keep cant be negative: {}".format(self.keep_source))) else: self.rules.append(ThinnerRule(rule_str)) def human_rules(self): """get list of human readable rules""" ret=[] if self.always_keep: ret.append("Keep the last {} snapshot{}.".format(self.always_keep, self.always_keep!=1 and "s" or "")) for rule in self.rules: ret.append(rule.human_str) return(ret) def thin(self,objects, keep_objects=[], now=None): """thin list of objects with current schedule rules. objects: list of objects to thin. every object should have timestamp attribute. keep_objects: objects to always keep (these should also be in normal objects list, so we can use them to perhaps delete other obsolete objects) return( keeps, removes ) """ #always keep a number of the last objets? if self.always_keep: #all of them if len(objects)<=self.always_keep: return ( (objects, []) ) #determine which ones always_keep_objects=objects[-self.always_keep:] else: always_keep_objects=[] #determine time blocks time_blocks={} for rule in self.rules: time_blocks[rule.period]={} if not now: now=int(time.time()) keeps=[] removes=[] #traverse objects for object in objects: #important they are ints! timestamp=int(object.timestamp) age=int(now)-timestamp # store in the correct time blocks, per period-size, if not too old yet # e.g.: look if there is ANY timeblock that wants to keep this object keep=False for rule in self.rules: if age<=rule.ttl: block_nr=int(timestamp/rule.period) if not block_nr in time_blocks[rule.period]: time_blocks[rule.period][block_nr]=True keep=True #keep it according to schedule, or keep it because it is in the keep_objects list if keep or object in keep_objects or object in always_keep_objects: keeps.append(object) else: removes.append(object) return( (keeps, removes) ) # ######### Thinner testing code # now=int(time.time()) # # t=Thinner("1d1w,1w1m,1m6m,1y2y", always_keep=1) # # import random # # class Thing: # def __init__(self, timestamp): # self.timestamp=timestamp # # def __str__(self): # age=now-self.timestamp # struct=time.localtime(self.timestamp) # return("{} ({} days old)".format(time.strftime("%Y-%m-%d %H:%M:%S",struct),int(age/(3600*24)))) # # def test(): # global now # things=[] # # while True: # print("#################### {}".format(time.strftime("%Y-%m-%d %H:%M:%S",time.localtime(now)))) # # (keeps, removes)=t.run(things, now) # # print ("### KEEP ") # for thing in keeps: # print(thing) # # print ("### REMOVE ") # for thing in removes: # print(thing) # # things=keeps # # #increase random amount of time and maybe add a thing # now=now+random.randint(0,160000) # if random.random()>=0: # things.append(Thing(now)) # # sys.stdin.readline() # # test() class cached_property(object): """ A property that is only computed once per instance and then replaces itself with an ordinary attribute. Deleting the attribute resets the property. 
        Source: https://github.com/bottlepy/bottle/commit/fa7733e075da0d790d809aa3d2f53071897e6f76
        """

    def __init__(self, func):
        self.__doc__ = getattr(func, '__doc__')
        self.func = func

    def __get__(self, obj, cls):
        if obj is None:
            return self

        propname=self.func.__name__

        if not hasattr(obj, '_cached_properties'):
            obj._cached_properties={}

        if not propname in obj._cached_properties:
            obj._cached_properties[propname]=self.func(obj)
            # value = obj.__dict__[propname] = self.func(obj)

        return obj._cached_properties[propname]


class ExecuteNode:
    """an endpoint to execute local or remote commands via ssh"""

    def __init__(self, ssh_config=None, ssh_to=None, readonly=False, debug_output=False):
        """ssh_config: custom ssh config
        ssh_to: server you want to ssh to. None means local
        readonly: only execute commands that don't make any changes (useful for test-runs)
        debug_output: show output and exit codes of commands in debugging output.
        """

        self.ssh_config=ssh_config
        self.ssh_to=ssh_to
        self.readonly=readonly
        self.debug_output=debug_output

    def __repr__(self):
        if self.ssh_to==None:
            return("(local)")
        else:
            return(self.ssh_to)

    def _parse_stdout(self, line):
        """parse stdout. can be overridden in subclass"""
        if self.debug_output:
            self.debug("STDOUT > "+line.rstrip())

    def _parse_stderr(self, line, hide_errors):
        """parse stderr. can be overridden in subclass"""
        if hide_errors:
            self.debug("STDERR > "+line.rstrip())
        else:
            self.error("STDERR > "+line.rstrip())

    def _parse_stderr_pipe(self, line, hide_errors):
        """parse stderr from pipe input process. can be overridden in subclass"""
        if hide_errors:
            self.debug("STDERR|> "+line.rstrip())
        else:
            self.error("STDERR|> "+line.rstrip())

    def run(self, cmd, input=None, tab_split=False, valid_exitcodes=[ 0 ], readonly=False, hide_errors=False, pipe=False, return_stderr=False):
        """run a command on the node

        readonly: make this True if the command doesn't make any changes and is safe to execute in testmode
        pipe: Instead of executing, return a pipe-handle to be used as input to another run() command. (just like a | in linux)
        input: Can be None, a string or a pipe-handle you got from another run()
        return_stderr: return both stdout and stderr as a tuple
        """

        encoded_cmd=[]

        #use ssh?
        if self.ssh_to != None:
            encoded_cmd.append("ssh".encode('utf-8'))

            if self.ssh_config != None:
                encoded_cmd.extend(["-F".encode('utf-8'), self.ssh_config.encode('utf-8')])

            encoded_cmd.append(self.ssh_to.encode('utf-8'))

            #make sure the command gets all the data in utf8 format:
            #(this is necessary if LC_ALL=en_US.utf8 is not set in the environment)
            for arg in cmd:
                #add single quotes for remote commands to support spaces and other weird stuff (remote commands are executed in a shell)
                encoded_cmd.append(("'"+arg+"'").encode('utf-8'))
        else:
            for arg in cmd:
                encoded_cmd.append(arg.encode('utf-8'))

        #debug and test stuff
        debug_txt=""
        for c in encoded_cmd:
            debug_txt=debug_txt+" "+c.decode()

        if pipe:
            debug_txt=debug_txt+" |"

        if self.readonly and not readonly:
            self.debug("SKIP > "+ debug_txt)
        else:
            if pipe:
                self.debug("PIPE > "+ debug_txt)
            else:
                self.debug("RUN > "+ debug_txt)

        #determine stdin
        if input==None:
            stdin=None
        elif isinstance(input, str) or type(input).__name__=='unicode':
            self.debug("INPUT > \n"+input.rstrip())
            stdin=subprocess.PIPE
        elif isinstance(input, subprocess.Popen):
            self.debug("Piping input")
            stdin=input.stdout
        else:
            raise(Exception("Program error: Incompatible input"))

        if self.readonly and not readonly:
            #todo: what happens if input is piped?
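            # Note: in readonly/test mode the command is never started; run() simply
            # returns None here, so callers can't rely on output from skipped commands.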
            return

        #execute and parse/return results
        p=subprocess.Popen(encoded_cmd, env=os.environ, stdout=subprocess.PIPE, stdin=stdin, stderr=subprocess.PIPE)

        #Note: make streaming?
        if isinstance(input, str) or type(input).__name__=='unicode':
            p.stdin.write(input)

        if pipe:
            return(p)

        #handle all outputs
        if isinstance(input, subprocess.Popen):
            selectors=[p.stdout, p.stderr, input.stderr ]
            input.stdout.close() #otherwise inputprocess won't exit when ours does
        else:
            selectors=[p.stdout, p.stderr ]

        output_lines=[]
        error_lines=[]
        while True:
            (read_ready, write_ready, ex_ready)=select.select(selectors, [], [])
            eof_count=0

            if p.stdout in read_ready:
                line=p.stdout.readline().decode('utf-8')
                if line!="":
                    if tab_split:
                        output_lines.append(line.rstrip().split('\t'))
                    else:
                        output_lines.append(line.rstrip())
                    self._parse_stdout(line)
                else:
                    eof_count=eof_count+1

            if p.stderr in read_ready:
                line=p.stderr.readline().decode('utf-8')
                if line!="":
                    if tab_split:
                        error_lines.append(line.rstrip().split('\t'))
                    else:
                        error_lines.append(line.rstrip())
                    self._parse_stderr(line, hide_errors)
                else:
                    eof_count=eof_count+1

            if isinstance(input, subprocess.Popen) and (input.stderr in read_ready):
                line=input.stderr.readline().decode('utf-8')
                if line!="":
                    self._parse_stderr_pipe(line, hide_errors)
                else:
                    eof_count=eof_count+1

            #stop if both processes are done and all filehandles are EOF:
            if p.poll()!=None and ((not isinstance(input, subprocess.Popen)) or input.poll()!=None) and eof_count==len(selectors):
                break

        if self.debug_output:
            self.debug("EXIT > {}".format(p.returncode))

        #handle piped process error output and exit codes
        if isinstance(input, subprocess.Popen):
            if self.debug_output:
                self.debug("EXIT |> {}".format(input.returncode))
            if valid_exitcodes and input.returncode not in valid_exitcodes:
                raise(subprocess.CalledProcessError(input.returncode, "(pipe)"))

        if valid_exitcodes and p.returncode not in valid_exitcodes:
            raise(subprocess.CalledProcessError(p.returncode, encoded_cmd))

        if return_stderr:
            return((output_lines, error_lines))
        else:
            return(output_lines)


class ZfsDataset():
    """a zfs dataset (filesystem/volume/snapshot/clone)

    Note that a dataset doesn't have to actually exist (yet/anymore).
    Also most properties are cached for performance-reasons, but also to allow
    --test to function correctly.
    """

    # illegal properties per dataset type. these will be removed from --set-properties and --filter-properties
    ILLEGAL_PROPERTIES={
        'filesystem': [ ],
        'volume': [ "canmount" ],
    }

    def __init__(self, zfs_node, name, force_exists=None):
        """name: full path of the zfs dataset
        force_exists: specify if you already know whether the dataset exists or not, for
        performance reasons. (otherwise it will have to check with zfs list when needed)
        """

        self.zfs_node=zfs_node
        self.name=name #full name
        self.force_exists=force_exists

    def __repr__(self):
        return("{}: {}".format(self.zfs_node, self.name))

    def __str__(self):
        return(self.name)

    def __eq__(self, obj):
        if not isinstance(obj, ZfsDataset):
            return(False)

        return(self.name == obj.name)

    def verbose(self, txt):
        self.zfs_node.verbose("{}: {}".format(self.name, txt))

    def error(self, txt):
        self.zfs_node.error("{}: {}".format(self.name, txt))

    def debug(self, txt):
        self.zfs_node.debug("{}: {}".format(self.name, txt))

    def invalidate(self):
        """clear cache"""
        #TODO: nicer?
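        # cached_property stores its values in self._cached_properties, so resetting
        # that dict (and force_exists) makes every cached attribute recompute on next access.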
        self._cached_properties={}
        self.force_exists=None

    def split_path(self):
        """return the path elements as an array"""
        return(self.name.split("/"))

    def lstrip_path(self, count):
        """return name with first count components stripped"""
        return("/".join(self.split_path()[count:]))

    def rstrip_path(self, count):
        """return name with last count components stripped"""
        return("/".join(self.split_path()[:-count]))

    @property
    def filesystem_name(self):
        """filesystem part of the name (before the @)"""
        if self.is_snapshot:
            (filesystem, snapshot)=self.name.split("@")
            return(filesystem)
        else:
            return(self.name)

    @property
    def snapshot_name(self):
        """snapshot part of the name"""
        if not self.is_snapshot:
            raise(Exception("This is not a snapshot"))

        (filesystem, snapshot_name)=self.name.split("@")
        return(snapshot_name)

    @property
    def is_snapshot(self):
        """true if this dataset is a snapshot"""
        return(self.name.find("@")!=-1)

    @cached_property
    def parent(self):
        """get zfs-parent of this dataset. for snapshots this means it will get
        the filesystem/volume that it belongs to. otherwise it will return the
        parent according to path.

        we cache this so everything in the parent that is cached also stays.
        """
        if self.is_snapshot:
            return(ZfsDataset(self.zfs_node, self.filesystem_name))
        else:
            return(ZfsDataset(self.zfs_node, self.rstrip_path(1)))

    def find_prev_snapshot(self, snapshot, other_snapshots=False):
        """find previous snapshot in this dataset. None if it doesn't exist.

        other_snapshots: set to true to also return snapshots that were not created by us. (is_ours)
        """

        if self.is_snapshot:
            raise(Exception("Please call this on a dataset."))

        index=self.find_snapshot_index(snapshot)
        while index:
            index=index-1
            if other_snapshots or self.snapshots[index].is_ours():
                return(self.snapshots[index])

        return(None)

    def find_next_snapshot(self, snapshot, other_snapshots=False):
        """find next snapshot in this dataset.
        None if it doesn't exist"""

        if self.is_snapshot:
            raise(Exception("Please call this on a dataset."))

        index=self.find_snapshot_index(snapshot)
        while index!=None and index<len(self.snapshots)-1:
            index=index+1
            if other_snapshots or self.snapshots[index].is_ours():
                return(self.snapshots[index])

        return(None)

            if len(progress_fields)>=3:
                if progress_fields[0]=='full' or progress_fields[0]=='size':
                    self._progress_total_bytes=int(progress_fields[2])
                elif progress_fields[0]=='incremental':
                    self._progress_total_bytes=int(progress_fields[3])
                else:
                    bytes=int(progress_fields[1])
                    percentage=0
                    if self._progress_total_bytes:
                        percentage=min(100,int(bytes*100/self._progress_total_bytes))
                        speed=int(bytes/(time.time()-self._progress_start_time)/(1024*1024))
                        bytes_left=self._progress_total_bytes-bytes
                        minutes_left=int((bytes_left/(bytes/(time.time()-self._progress_start_time)))/60)

                        print(">>> {}% {}MB/s (total {}MB, {} minutes left) \r".format(percentage, speed, int(self._progress_total_bytes/(1024*1024)), minutes_left), end='')
                        sys.stdout.flush()

            return

        #still do the normal stderr output handling
        if hide_errors:
            self.debug(prefix+line.rstrip())
        else:
            self.error(prefix+line.rstrip())

    def _parse_stderr_pipe(self, line, hide_errors):
        self.parse_zfs_progress(line, hide_errors, "STDERR|> ")

    def _parse_stderr(self, line, hide_errors):
        self.parse_zfs_progress(line, hide_errors, "STDERR > ")

    def verbose(self, txt):
        self.zfs_autobackup.verbose("{} {}".format(self.description, txt))

    def error(self, txt, titles=[]):
        self.zfs_autobackup.error("{} {}".format(self.description, txt))

    def debug(self, txt, titles=[]):
        self.zfs_autobackup.debug("{} {}".format(self.description, txt))

    def new_snapshotname(self):
        """determine unique new snapshotname"""
        return(self.backup_name+"-"+time.strftime("%Y%m%d%H%M%S"))

    def consistent_snapshot(self, datasets, snapshot_name, min_changed_bytes):
        """create a consistent (atomic) snapshot of the specified datasets, per pool.
""" pools={} #collect snapshots that we want to make, per pool for dataset in datasets: if not dataset.is_changed_ours(min_changed_bytes): dataset.verbose("No changes since {}".format(dataset.our_snapshots[-1].snapshot_name)) continue snapshot=ZfsDataset(dataset.zfs_node, dataset.name+"@"+snapshot_name) pool=dataset.split_path()[0] if not pool in pools: pools[pool]=[] pools[pool].append(snapshot) #add snapshot to cache (also usefull in testmode) dataset.snapshots.append(snapshot) #NOTE: this will trigger zfs list if not pools: self.verbose("No changes anywhere: not creating snapshots.") return #create consistent snapshot per pool for (pool_name, snapshots) in pools.items(): cmd=[ "zfs", "snapshot" ] cmd.extend(map(lambda snapshot: str(snapshot), snapshots)) self.verbose("Creating snapshots {} in pool {}".format(snapshot_name, pool_name)) self.run(cmd, readonly=False) @cached_property def selected_datasets(self): """determine filesystems that should be backupped by looking at the special autobackup-property, systemwide returns: list of ZfsDataset """ #get all source filesystems that have the backup property lines=self.run(tab_split=True, readonly=True, cmd=[ "zfs", "get", "-t", "volume,filesystem", "-o", "name,value,source", "-s", "local,inherited", "-H", "autobackup:"+self.backup_name ]) #determine filesystems that should be actually backupped selected_filesystems=[] direct_filesystems=[] for line in lines: (name,value,source)=line dataset=ZfsDataset(self, name) if value=="false": dataset.verbose("Ignored (disabled)") else: if source=="local" and ( value=="true" or value=="child"): direct_filesystems.append(name) if source=="local" and value=="true": dataset.verbose("Selected (direct selection)") selected_filesystems.append(dataset) elif source.find("inherited from ")==0 and (value=="true" or value=="child"): inherited_from=re.sub("^inherited from ", "", source) if inherited_from in direct_filesystems: selected_filesystems.append(dataset) dataset.verbose("Selected (inherited selection)") else: dataset.verbose("Ignored (already a backup)") else: dataset.verbose("Ignored (only childs)") return(selected_filesystems) class ZfsAutobackup: """main class""" def __init__(self): parser = argparse.ArgumentParser( description=HEADER, epilog='When a filesystem fails, zfs_backup will continue and report the number of failures at that end. Also the exit code will indicate the number of failures.') parser.add_argument('--ssh-config', default=None, help='Custom ssh client config') parser.add_argument('--ssh-source', default=None, help='Source host to get backup from. (user@hostname) Default %(default)s.') parser.add_argument('--ssh-target', default=None, help='Target host to push backup to. (user@hostname) Default %(default)s.') parser.add_argument('--keep-source', type=str, default="10,1d1w,1w1m,1m1y", help='Thinning schedule for old source snapshots. Default: %(default)s') parser.add_argument('--keep-target', type=str, default="10,1d1w,1w1m,1m1y", help='Thinning schedule for old target snapshots. 
        parser.add_argument('backup_name', help='Name of the backup (you should set the zfs property "autobackup:backup-name" to true on filesystems you want to backup)')
        parser.add_argument('target_path', help='Target ZFS filesystem')

        parser.add_argument('--other-snapshots', action='store_true', help='Send over other snapshots as well, not just the ones created by this tool.')
        parser.add_argument('--no-snapshot', action='store_true', help='Don\'t create new snapshots (useful for finishing uncompleted backups, or cleanups)')
        parser.add_argument('--no-send', action='store_true', help='Don\'t send snapshots (useful for cleanups, or if you want a separate send-cronjob)')
        parser.add_argument('--min-change', type=int, default=1, help='Number of bytes written after which we consider a dataset changed (default %(default)s)')
        parser.add_argument('--allow-empty', action='store_true', help='If nothing has changed, still create empty snapshots. (same as --min-change=0)')
        parser.add_argument('--ignore-replicated', action='store_true', help='Ignore datasets that seem to be replicated some other way. (No changes since latest snapshot. Useful for proxmox HA replication)')
        parser.add_argument('--no-holds', action='store_true', help='Don\'t lock snapshots on the source. (Useful to allow proxmox HA replication to switch nodes)')
        #not sure if this ever was useful:
        # parser.add_argument('--ignore-new', action='store_true', help='Ignore filesystem if there are already newer snapshots for it on the target (use with caution)')

        parser.add_argument('--resume', action='store_true', help='Support resuming of interrupted transfers by using the zfs extensible_dataset feature (both zpools should have it enabled) Disadvantage is that you need to use zfs recv -A if another snapshot is created on the target during a receive. Otherwise it will keep failing.')
        parser.add_argument('--strip-path', default=0, type=int, help='Number of directories to strip from the path (use 1 when cloning zones between 2 SmartOS machines)')
        # parser.add_argument('--buffer', default="", help='Use mbuffer with specified size to speedup zfs transfer. (e.g. --buffer 1G) Will also show nice progress output.')
        # parser.add_argument('--destroy-stale', action='store_true', help='Destroy stale backups that have no more snapshots. Be sure to verify the output before using this! ')

        parser.add_argument('--clear-refreservation', action='store_true', help='Filter "refreservation" property. (recommended, saves space. same as --filter-properties refreservation)')
        parser.add_argument('--clear-mountpoint', action='store_true', help='Set property canmount=noauto for new datasets. (recommended, prevents mount conflicts. same as --set-properties canmount=noauto)')
        parser.add_argument('--filter-properties', type=str, help='List of properties to "filter" when receiving filesystems. (you can still restore them with zfs inherit -S)')
        parser.add_argument('--set-properties', type=str, help='List of properties to override when receiving filesystems. (you can still restore them with zfs inherit -S)')
        parser.add_argument('--rollback', action='store_true', help='Rollback changes to the latest target snapshot before starting. (normally you can prevent changes by setting the readonly property on the target_path to on)')
        parser.add_argument('--destroy-incompatible', action='store_true', help='Destroy incompatible snapshots on target. Use with care! (implies --rollback)')
        parser.add_argument('--ignore-transfer-errors', action='store_true', help='Ignore transfer errors (still checks if received filesystem exists. useful for acltype errors)')
        parser.add_argument('--raw', action='store_true', help='For encrypted datasets, send data exactly as it exists on disk.')

        parser.add_argument('--test', action='store_true', help='Don\'t change anything, just show what would be done (still does all read-only operations)')
        parser.add_argument('--verbose', action='store_true', help='verbose output')
        parser.add_argument('--debug', action='store_true', help='Show zfs commands that are executed, stops after an exception.')
        parser.add_argument('--debug-output', action='store_true', help='Show zfs commands and their output/exit codes. (noisy)')
        parser.add_argument('--progress', action='store_true', help='show zfs progress output (to stderr)')

        #note: args is the only global variable we use, since it's a global readonly setting anyway
        args = parser.parse_args()

        self.args=args

        if args.debug_output:
            args.debug=True

        if self.args.test:
            self.args.verbose=True

        if args.allow_empty:
            args.min_change=0

        if args.destroy_incompatible:
            args.rollback=True

        self.log=Log(show_debug=self.args.debug, show_verbose=self.args.verbose)

    def verbose(self, txt, titles=[]):
        self.log.verbose(txt)

    def error(self, txt, titles=[]):
        self.log.error(txt)

    def debug(self, txt, titles=[]):
        self.log.debug(txt)

    def set_title(self, title):
        self.log.verbose("")
        self.log.verbose("#### "+title)

    def run(self):
        self.verbose(HEADER)

        if self.args.test:
            self.verbose("TEST MODE - SIMULATING WITHOUT MAKING ANY CHANGES")

        self.set_title("Settings summary")

        description="[Source]"
        source_thinner=Thinner(self.args.keep_source)
        source_node=ZfsNode(self.args.backup_name, self, ssh_config=self.args.ssh_config, ssh_to=self.args.ssh_source, readonly=self.args.test, debug_output=self.args.debug_output, description=description, thinner=source_thinner)
        source_node.verbose("Send all datasets that have 'autobackup:{}=true' or 'autobackup:{}=child'".format(self.args.backup_name, self.args.backup_name))

        self.verbose("")

        description="[Target]"
        target_thinner=Thinner(self.args.keep_target)
        target_node=ZfsNode(self.args.backup_name, self, ssh_config=self.args.ssh_config, ssh_to=self.args.ssh_target, readonly=self.args.test, debug_output=self.args.debug_output, description=description, thinner=target_thinner)
        target_node.verbose("Receive datasets under: {}".format(self.args.target_path))

        self.set_title("Selecting")
        selected_source_datasets=source_node.selected_datasets
        if not selected_source_datasets:
            self.error("No source filesystems selected, please do a 'zfs set autobackup:{0}=true' on the source datasets you want to backup.".format(self.args.backup_name))
            return(255)

        source_datasets=[]

        #filter out already replicated stuff?
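        # --ignore-replicated: datasets with no changes since their latest snapshot are
        # assumed to be replicated by some other mechanism (e.g. proxmox HA) and skipped.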
        if not self.args.ignore_replicated:
            source_datasets=selected_source_datasets
        else:
            self.set_title("Filtering already replicated filesystems")
            for selected_source_dataset in selected_source_datasets:
                if selected_source_dataset.is_changed(self.args.min_change):
                    source_datasets.append(selected_source_dataset)
                else:
                    selected_source_dataset.verbose("Ignoring, already replicated")

        if not self.args.no_snapshot:
            self.set_title("Snapshotting")
            source_node.consistent_snapshot(source_datasets, source_node.new_snapshotname(), min_changed_bytes=self.args.min_change)

        if self.args.no_send:
            self.set_title("Thinning")
        else:
            self.set_title("Sending and thinning")

        if self.args.filter_properties:
            filter_properties=self.args.filter_properties.split(",")
        else:
            filter_properties=[]

        if self.args.set_properties:
            set_properties=self.args.set_properties.split(",")
        else:
            set_properties=[]

        if self.args.clear_refreservation:
            filter_properties.append("refreservation")

        if self.args.clear_mountpoint:
            set_properties.append("canmount=noauto")

        fail_count=0
        for source_dataset in source_datasets:
            try:
                #determine corresponding target_dataset
                target_name=self.args.target_path + "/" + source_dataset.lstrip_path(self.args.strip_path)
                target_dataset=ZfsDataset(target_node, target_name)

                #ensure parents exist
                if not self.args.no_send and not target_dataset.parent.exists:
                    target_dataset.parent.create_filesystem(parents=True)

                source_dataset.sync_snapshots(target_dataset,
                    show_progress=self.args.progress,
                    resume=self.args.resume,
                    filter_properties=filter_properties,
                    set_properties=set_properties,
                    ignore_recv_exit_code=self.args.ignore_transfer_errors,
                    source_holds=not self.args.no_holds,
                    rollback=self.args.rollback,
                    raw=self.args.raw,
                    other_snapshots=self.args.other_snapshots,
                    no_send=self.args.no_send,
                    destroy_incompatible=self.args.destroy_incompatible)
            except Exception as e:
                fail_count=fail_count+1
                self.error("DATASET FAILED: "+str(e))
                if self.args.debug:
                    raise

        if not fail_count:
            if self.args.test:
                self.set_title("All tests successful.")
            else:
                self.set_title("All backups completed successfully")
        else:
            self.error("{} datasets failed!".format(fail_count))

        if self.args.test:
            self.verbose("TEST MODE - DID NOT MAKE ANY BACKUPS!")

        return(fail_count)


if __name__ == "__main__":
    zfs_autobackup=ZfsAutobackup()
    sys.exit(zfs_autobackup.run())
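
# Example usage (illustrative sketch only; the pool, host and backup names below are
# hypothetical, and the command name assumes this script is installed as "zfs-autobackup"):
#
#   # mark datasets on the source machine for the backup named "offsite1":
#   zfs set autobackup:offsite1=true rpool
#
#   # pull a backup from a remote source into the local filesystem backup/server1:
#   zfs-autobackup --ssh-source root@server1 offsite1 backup/server1 --verbose
#
#   # dry run: show what would happen without changing anything:
#   zfs-autobackup --ssh-source root@server1 offsite1 backup/server1 --verbose --test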