wip (will usse zfs-check to do actual hashing)
This commit is contained in:
		| @ -16,10 +16,12 @@ from basetest import * | |||||||
| # - test all directions (local, remote/local, local/remote, remote/remote) | # - test all directions (local, remote/local, local/remote, remote/remote) | ||||||
| # | # | ||||||
|  |  | ||||||
| class TestZfsEncryption(unittest2.TestCase): | class TestZfsVerify(unittest2.TestCase): | ||||||
|  |  | ||||||
|  |  | ||||||
|     def setUp(self): |     def setUp(self): | ||||||
|  |         self.skipTest("WIP") | ||||||
|  |  | ||||||
|         prepare_zpools() |         prepare_zpools() | ||||||
|  |  | ||||||
|         #create actual test files and data |         #create actual test files and data | ||||||
|  | |||||||
| @ -1,80 +1,67 @@ | |||||||
| import os | # from util import activate_volume_snapshot, create_mountpoints, cleanup_mountpoint | ||||||
| import time |  | ||||||
|  |  | ||||||
| from .ExecuteNode import ExecuteNode |  | ||||||
| from .ZfsAuto import ZfsAuto | from .ZfsAuto import ZfsAuto | ||||||
| from .ZfsDataset import ZfsDataset |  | ||||||
| from .ZfsNode import ZfsNode | from .ZfsNode import ZfsNode | ||||||
| import sys | import sys | ||||||
| import platform |  | ||||||
|  |  | ||||||
| def tmp_name(suffix=""): |  | ||||||
|     """create temporary name unique to this process and node""" |  | ||||||
|  |  | ||||||
|     #we could use uuids but those are ugly and confusing |  | ||||||
|     name="zfstmp_{}_{}".format(platform.node(), os.getpid()) |  | ||||||
|     name=name+suffix |  | ||||||
|     return name |  | ||||||
|  |  | ||||||
|  |  | ||||||
| # try to be as unix compatible as possible, while still having decent performance | # # try to be as unix compatible as possible, while still having decent performance | ||||||
| def compare_trees_find(source_node, source_path, target_node, target_path): | # def compare_trees_find(source_node, source_path, target_node, target_path): | ||||||
|     # find /tmp/zfstmp_pve1_1993135target/ -xdev -type f -print0 | xargs -0 md5sum | md5sum -c | #     # find /tmp/zfstmp_pve1_1993135target/ -xdev -type f -print0 | xargs -0 md5sum | md5sum -c | ||||||
|  | # | ||||||
|     #verify tree has atleast one file | #     #verify tree has atleast one file | ||||||
|  | # | ||||||
|     stdout=source_node.run(["find", ".", "-type", "f", | #     stdout=source_node.run(["find", ".", "-type", "f", | ||||||
|                           ExecuteNode.PIPE, "head", "-n1", | #                           ExecuteNode.PIPE, "head", "-n1", | ||||||
|                           ], cwd=source_path) | #                           ], cwd=source_path) | ||||||
|  | # | ||||||
|     if not stdout: | #     if not stdout: | ||||||
|         source_node.debug("No files, skipping check") | #         source_node.debug("No files, skipping check") | ||||||
|     else: | #     else: | ||||||
|         pipe=source_node.run(["find", ".", "-type", "f", "-print0", | #         pipe=source_node.run(["find", ".", "-type", "f", "-print0", | ||||||
|                               ExecuteNode.PIPE, "xargs", "-0", "md5sum" | #                               ExecuteNode.PIPE, "xargs", "-0", "md5sum" | ||||||
|                               ], pipe=True, cwd=source_path) | #                               ], pipe=True, cwd=source_path) | ||||||
|         stdout=target_node.run([ "md5sum", "-c", "--quiet"], inp=pipe, cwd=target_path, valid_exitcodes=[0,1]) | #         stdout=target_node.run([ "md5sum", "-c", "--quiet"], inp=pipe, cwd=target_path, valid_exitcodes=[0,1]) | ||||||
|  | # | ||||||
|         if len(stdout): | #         if len(stdout): | ||||||
|             for line in stdout: | #             for line in stdout: | ||||||
|                 target_node.error("md5sum: "+line) | #                 target_node.error("md5sum: "+line) | ||||||
|  | # | ||||||
|             raise(Exception("Some files have checksum errors")) | #             raise(Exception("Some files have checksum errors")) | ||||||
|  | # | ||||||
|  | # | ||||||
| def compare_trees_rsync(source_node, source_path, target_node, target_path): | # def compare_trees_rsync(source_node, source_path, target_node, target_path): | ||||||
|     """use rsync to compare two trees. | #     """use rsync to compare two trees. | ||||||
|      Advantage is that we can see which individual files differ. | #      Advantage is that we can see which individual files differ. | ||||||
|      But requires rsync and cant do remote to remote.""" | #      But requires rsync and cant do remote to remote.""" | ||||||
|  | # | ||||||
|     cmd = ["rsync", "-rcnq", "--info=COPY,DEL,MISC,NAME,SYMSAFE", "--msgs2stderr", "--delete" ] | #     cmd = ["rsync", "-rcnq", "--info=COPY,DEL,MISC,NAME,SYMSAFE", "--msgs2stderr", "--delete" ] | ||||||
|  | # | ||||||
|     #local | #     #local | ||||||
|     if source_node.ssh_to is None and target_node.ssh_to is None: | #     if source_node.ssh_to is None and target_node.ssh_to is None: | ||||||
|         cmd.append("{}/".format(source_path)) | #         cmd.append("{}/".format(source_path)) | ||||||
|         cmd.append("{}/".format(target_path)) | #         cmd.append("{}/".format(target_path)) | ||||||
|         source_node.debug("Running rsync locally, on source.") | #         source_node.debug("Running rsync locally, on source.") | ||||||
|         stdout, stderr = source_node.run(cmd, return_stderr=True) | #         stdout, stderr = source_node.run(cmd, return_stderr=True) | ||||||
|  | # | ||||||
|     #source is local | #     #source is local | ||||||
|     elif source_node.ssh_to is None and target_node.ssh_to is not None: | #     elif source_node.ssh_to is None and target_node.ssh_to is not None: | ||||||
|         cmd.append("{}/".format(source_path)) | #         cmd.append("{}/".format(source_path)) | ||||||
|         cmd.append("{}:{}/".format(target_node.ssh_to, target_path)) | #         cmd.append("{}:{}/".format(target_node.ssh_to, target_path)) | ||||||
|         source_node.debug("Running rsync locally, on source.") | #         source_node.debug("Running rsync locally, on source.") | ||||||
|         stdout, stderr = source_node.run(cmd, return_stderr=True) | #         stdout, stderr = source_node.run(cmd, return_stderr=True) | ||||||
|  | # | ||||||
|     #target is local | #     #target is local | ||||||
|     elif source_node.ssh_to is not None and target_node.ssh_to is None: | #     elif source_node.ssh_to is not None and target_node.ssh_to is None: | ||||||
|         cmd.append("{}:{}/".format(source_node.ssh_to, source_path)) | #         cmd.append("{}:{}/".format(source_node.ssh_to, source_path)) | ||||||
|         cmd.append("{}/".format(target_path)) | #         cmd.append("{}/".format(target_path)) | ||||||
|         source_node.debug("Running rsync locally, on target.") | #         source_node.debug("Running rsync locally, on target.") | ||||||
|         stdout, stderr=target_node.run(cmd, return_stderr=True) | #         stdout, stderr=target_node.run(cmd, return_stderr=True) | ||||||
|  | # | ||||||
|     else: | #     else: | ||||||
|         raise Exception("Source and target cant both be remote when verifying. (rsync limitation)") | #         raise Exception("Source and target cant both be remote when verifying. (rsync limitation)") | ||||||
|  | # | ||||||
|     if stderr: | #     if stderr: | ||||||
|         raise Exception("Dataset verify failed, see above list for differences") | #         raise Exception("Dataset verify failed, see above list for differences") | ||||||
|  |  | ||||||
|  |  | ||||||
| def verify_filesystem(source_snapshot, source_mnt, target_snapshot, target_mnt, method): | def verify_filesystem(source_snapshot, source_mnt, target_snapshot, target_mnt, method): | ||||||
| @ -88,8 +75,8 @@ def verify_filesystem(source_snapshot, source_mnt, target_snapshot, target_mnt, | |||||||
|  |  | ||||||
|         if method=='rsync': |         if method=='rsync': | ||||||
|             compare_trees_rsync(source_snapshot.zfs_node, source_mnt, target_snapshot.zfs_node, target_mnt) |             compare_trees_rsync(source_snapshot.zfs_node, source_mnt, target_snapshot.zfs_node, target_mnt) | ||||||
|         elif method == 'tar': |         # elif method == 'tar': | ||||||
|             compare_trees_tar(source_snapshot.zfs_node, source_mnt, target_snapshot.zfs_node, target_mnt) |         #     compare_trees_tar(source_snapshot.zfs_node, source_mnt, target_snapshot.zfs_node, target_mnt) | ||||||
|         elif method == 'find': |         elif method == 'find': | ||||||
|             compare_trees_find(source_snapshot.zfs_node, source_mnt, target_snapshot.zfs_node, target_mnt) |             compare_trees_find(source_snapshot.zfs_node, source_mnt, target_snapshot.zfs_node, target_mnt) | ||||||
|         else: |         else: | ||||||
| @ -100,102 +87,54 @@ def verify_filesystem(source_snapshot, source_mnt, target_snapshot, target_mnt, | |||||||
|         target_snapshot.unmount() |         target_snapshot.unmount() | ||||||
|  |  | ||||||
|  |  | ||||||
| def hash_dev(node, dev): | # def hash_dev(node, dev): | ||||||
|     """calculate md5sum of a device on a node""" | #     """calculate md5sum of a device on a node""" | ||||||
|  | # | ||||||
|     node.debug("Hashing volume {} ".format(dev)) | #     node.debug("Hashing volume {} ".format(dev)) | ||||||
|  | # | ||||||
|     cmd = [ "md5sum", dev ] | #     cmd = [ "md5sum", dev ] | ||||||
|  | # | ||||||
|     stdout = node.run(cmd) | #     stdout = node.run(cmd) | ||||||
|  | # | ||||||
|     if node.readonly: | #     if node.readonly: | ||||||
|         hashed=None | #         hashed=None | ||||||
|     else: | #     else: | ||||||
|         hashed = stdout[0].split(" ")[0] | #         hashed = stdout[0].split(" ")[0] | ||||||
|  | # | ||||||
|     node.debug("Hash of volume {} is {}".format(dev, hashed)) | #     node.debug("Hash of volume {} is {}".format(dev, hashed)) | ||||||
|  | # | ||||||
|     return hashed | #     return hashed | ||||||
|  |  | ||||||
|  |  | ||||||
| #NOTE: https://www.google.com/search?q=Mount+Path+Limit+freebsd |  | ||||||
| #Freebsd has limitations regarding path length, so we cant use the above method. |  | ||||||
| #Instead we create a temporary clone |  | ||||||
|  |  | ||||||
| def get_tmp_clone_name(snapshot): | # def deacitvate_volume_snapshot(snapshot): | ||||||
|     pool=snapshot.zfs_node.get_pool(snapshot) | #     clone_name=get_tmp_clone_name(snapshot) | ||||||
|     return pool.name+"/"+tmp_name() | #     clone=snapshot.zfs_node.get_dataset(clone_name) | ||||||
|  | #     clone.destroy(deferred=True, verbose=False) | ||||||
| def activate_volume_snapshot(snapshot): |  | ||||||
|     """clone volume, waits and tries to findout /dev path to the volume, in a compatible way. (linux/freebsd/smartos)""" |  | ||||||
|  |  | ||||||
|     clone_name=get_tmp_clone_name(snapshot) |  | ||||||
|     clone=snapshot.clone(clone_name) |  | ||||||
|  |  | ||||||
|     #NOTE: add smartos location to this list as well |  | ||||||
|     locations=[ |  | ||||||
|         "/dev/zvol/" + clone_name |  | ||||||
|     ] |  | ||||||
|  |  | ||||||
|     clone.debug("Waiting for /dev entry to appear...") |  | ||||||
|     time.sleep(0.1) |  | ||||||
|  |  | ||||||
|     start_time=time.time() |  | ||||||
|     while time.time()-start_time<10: |  | ||||||
|         for location in locations: |  | ||||||
|             stdout, stderr, exit_code=clone.zfs_node.run(["test", "-e", location], return_all=True, valid_exitcodes=[0,1]) |  | ||||||
|  |  | ||||||
|             #fake it in testmode |  | ||||||
|             if clone.zfs_node.readonly: |  | ||||||
|                 return location |  | ||||||
|  |  | ||||||
|             if exit_code==0: |  | ||||||
|                 return location |  | ||||||
|         time.sleep(1) |  | ||||||
|  |  | ||||||
|     raise(Exception("Timeout while waiting for {} entry to appear.".format(locations))) |  | ||||||
|  |  | ||||||
| def deacitvate_volume_snapshot(snapshot): |  | ||||||
|     clone_name=get_tmp_clone_name(snapshot) |  | ||||||
|     clone=snapshot.zfs_node.get_dataset(clone_name) |  | ||||||
|     clone.destroy(deferred=True, verbose=False) |  | ||||||
|  |  | ||||||
| def verify_volume(source_dataset, source_snapshot, target_dataset, target_snapshot): | def verify_volume(source_dataset, source_snapshot, target_dataset, target_snapshot): | ||||||
|     """compare the contents of two zfs volume snapshots""" |     """compare the contents of two zfs volume snapshots""" | ||||||
|  |  | ||||||
|     try: |     # try: | ||||||
|         source_dev= activate_volume_snapshot(source_snapshot) |     source_dev= activate_volume_snapshot(source_snapshot) | ||||||
|         target_dev= activate_volume_snapshot(target_snapshot) |     target_dev= activate_volume_snapshot(target_snapshot) | ||||||
|  |  | ||||||
|         source_hash= hash_dev(source_snapshot.zfs_node, source_dev) |     source_hash= hash_dev(source_snapshot.zfs_node, source_dev) | ||||||
|         target_hash= hash_dev(target_snapshot.zfs_node, target_dev) |     target_hash= hash_dev(target_snapshot.zfs_node, target_dev) | ||||||
|  |  | ||||||
|         if source_hash!=target_hash: |     if source_hash!=target_hash: | ||||||
|             raise Exception("md5hash difference: {} != {}".format(source_hash, target_hash)) |         raise Exception("md5hash difference: {} != {}".format(source_hash, target_hash)) | ||||||
|  |  | ||||||
|     finally: |     # finally: | ||||||
|         deacitvate_volume_snapshot(source_snapshot) |     #     deacitvate_volume_snapshot(source_snapshot) | ||||||
|         deacitvate_volume_snapshot(target_snapshot) |     #     deacitvate_volume_snapshot(target_snapshot) | ||||||
|  |  | ||||||
| def create_mountpoints(source_node, target_node): |  | ||||||
|  |  | ||||||
|     # prepare mount points |  | ||||||
|     source_node.debug("Create temporary mount point") |  | ||||||
|     source_mnt = "/tmp/"+tmp_name("source") |  | ||||||
|     source_node.run(["mkdir", source_mnt]) |  | ||||||
|  |  | ||||||
|     target_node.debug("Create temporary mount point") |  | ||||||
|     target_mnt = "/tmp/"+tmp_name("target") |  | ||||||
|     target_node.run(["mkdir", target_mnt]) |  | ||||||
|  |  | ||||||
|     return source_mnt, target_mnt |  | ||||||
|  |  | ||||||
|  |  | ||||||
| def cleanup_mountpoint(node, mnt): | # class ZfsAutoChecksumVolume(ZfsAuto): | ||||||
|     node.debug("Cleaning up temporary mount point") | #     def __init__(self, argv, print_arguments=True): | ||||||
|     node.run([ "rmdir", mnt ], hide_errors=True, valid_exitcodes=[] ) | # | ||||||
|  | #         # NOTE: common options and parameters are in ZfsAuto | ||||||
|  | #         super(ZfsAutoverify, self).__init__(argv, print_arguments) | ||||||
|  |  | ||||||
| class ZfsAutoverify(ZfsAuto): | class ZfsAutoverify(ZfsAuto): | ||||||
|     """The zfs-autoverify class, default agruments and stuff come from ZfsAuto""" |     """The zfs-autoverify class, default agruments and stuff come from ZfsAuto""" | ||||||
|  | |||||||
		Reference in New Issue
	
	Block a user