Diffstat (limited to 'tests/functional/afr')
-rw-r--r--    tests/functional/afr/test_afr_cli_gfid_splitbrain.py    191
1 file changed, 191 insertions, 0 deletions
diff --git a/tests/functional/afr/test_afr_cli_gfid_splitbrain.py b/tests/functional/afr/test_afr_cli_gfid_splitbrain.py
new file mode 100644
index 000000000..a886209f5
--- /dev/null
+++ b/tests/functional/afr/test_afr_cli_gfid_splitbrain.py
@@ -0,0 +1,191 @@
+# Copyright (C) 2017-2018 Red Hat, Inc. <http://www.redhat.com>
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License along
+# with this program; if not, write to the Free Software Foundation, Inc.,
+# 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
+
+# pylint: disable=too-many-statements, too-many-locals
+
+from glusto.core import Glusto as g
+from glustolibs.gluster.exceptions import ExecutionError
+from glustolibs.gluster.gluster_base_class import GlusterBaseClass, runs_on
+from glustolibs.gluster.brick_libs import (get_all_bricks,
+ bring_bricks_offline,
+ bring_bricks_online)
+from glustolibs.misc.misc_libs import upload_scripts
+from glustolibs.io.utils import validate_io_procs
+from glustolibs.gluster.heal_ops import (disable_self_heal_daemon,
+ enable_self_heal_daemon,
+ trigger_heal)
+from glustolibs.gluster.heal_libs import (is_volume_in_split_brain,
+ monitor_heal_completion)
+
+
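+# The runs_on decorator below runs this test class against a replicated
+# volume, mounted over both the glusterfs and cifs protocols.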
+@runs_on([['replicated'], ['glusterfs', 'cifs']])
+class TestSelfHeal(GlusterBaseClass):
+
+ @classmethod
+ def setUpClass(cls):
+
+ # Calling GlusterBaseClass setUpClass
+ GlusterBaseClass.setUpClass.im_func(cls)
+
+ # Upload io scripts for running IO on mounts
+ g.log.info("Upload io scripts to clients %s for running IO on "
+ "mounts", cls.clients)
+ script_local_path = ("/usr/share/glustolibs/io/scripts/"
+ "file_dir_ops.py")
+ cls.script_upload_path = ("/usr/share/glustolibs/io/scripts/"
+ "file_dir_ops.py")
+ ret = upload_scripts(cls.clients, script_local_path)
+ if not ret:
+ raise ExecutionError("Failed to upload IO scripts "
+ "to clients %s" % cls.clients)
+ g.log.info("Successfully uploaded IO scripts to clients %s",
+ cls.clients)
+
+ # Override Volumes
+ if cls.volume_type == "replicated":
+ # Define x2 replicated volume
+ cls.volume['voltype'] = {
+ 'type': 'replicated',
+ 'replica_count': 2,
+ 'transport': 'tcp'}
+
+ # Setup Volume and Mount Volume
+ g.log.info("Starting to Setup Volume and Mount Volume")
+ ret = cls.setup_volume_and_mount_volume(cls.mounts, True)
+ if not ret:
+ raise ExecutionError("Failed to Setup_Volume and Mount_Volume")
+ g.log.info("Successful in Setup Volume and Mount Volume")
+
+ @classmethod
+ def tearDownClass(cls):
+
+ # Cleanup Volume
+ g.log.info("Starting to clean up Volume %s", cls.volname)
+ ret = cls.unmount_volume_and_cleanup_volume(cls.mounts)
+ if not ret:
+            raise ExecutionError("Failed to unmount and cleanup volume")
+ g.log.info("Successful in cleaning up Volume %s", cls.volname)
+
+ GlusterBaseClass.tearDownClass.im_func(cls)
+
+ def test_afr_gfid_heal(self):
+
+        """
+        Description: This test case runs the split-brain resolution CLI
+                     on a file in gfid split-brain on a 1x2 volume.
+        1. Kill one brick
+        2. Create a file from the mount point
+        3. Bring the killed brick back online
+        4. Kill the other brick
+        5. Create a file of the same name from the mount point
+        6. Bring the killed brick back online
+        7. Resolve the gfid split-brain from the CLI using the
+           source-brick policy, trigger heal and verify it completes
+        """
+
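+        # The self-heal daemon is disabled first so that the file created
+        # while one brick is down is not healed automatically; creating a
+        # file of the same name while the other brick is down then leaves
+        # the two bricks with different gfids for it (gfid split-brain).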
+ g.log.info("disabling the self heal daemon")
+ ret = disable_self_heal_daemon(self.mnode, self.volname)
+ self.assertTrue(ret, "unable to disable self heal daemon")
+ g.log.info("Successfully disabled the self heal daemon")
+
+ # getting list of all bricks
+ all_bricks = get_all_bricks(self.mnode, self.volname)
+ self.assertIsNotNone(all_bricks, "unable to get list of bricks")
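+        # Each entry in all_bricks is of the form "<host>:<brick-path>"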
+ g.log.info("bringing down brick1")
+ ret = bring_bricks_offline(self.volname, all_bricks[0])
+ self.assertTrue(ret, "unable to bring brick1 offline")
+ g.log.info("Successfully brought the following brick offline "
+ ": %s", str(all_bricks[0]))
+
+ g.log.info("creating a file from mount point")
+ all_mounts_procs = []
+ for mount_obj in self.mounts:
+ cmd = ("python %s create_files "
+ "-f 1 --base-file-name test_file --fixed-file-size 1k %s"
+ % (self.script_upload_path, mount_obj.mountpoint))
+ proc = g.run_async(mount_obj.client_system, cmd,
+ user=mount_obj.user)
+ all_mounts_procs.append(proc)
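+        # create_files with -f 1 and --base-file-name test_file produces a
+        # single file named test_file0.txt under the mount point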
+ # Validate I/O
+ g.log.info("Wait for IO to complete and validate IO.....")
+ ret = validate_io_procs(all_mounts_procs, self.mounts)
+ self.assertTrue(ret, "IO failed on some of the clients")
+ g.log.info("IO is successful on all mounts")
+ g.log.info("Successfully created a file from mount point")
+
+ g.log.info("bringing brick 1 back online")
+ ret = bring_bricks_online(self.mnode, self.volname, all_bricks[0])
+        self.assertTrue(ret, "unable to bring brick 1 online")
+ g.log.info("Successfully brought the following brick online "
+ ": %s", str(all_bricks[0]))
+
+ g.log.info("bringing down brick2")
+ ret = bring_bricks_offline(self.volname, all_bricks[1])
+ self.assertTrue(ret, "unable to bring brick2 offline")
+ g.log.info("Successfully brought the following brick offline "
+ ": %s", str(all_bricks[1]))
+
+ g.log.info("creating a new file of same name from mount point")
+ all_mounts_procs = []
+ for mount_obj in self.mounts:
+ cmd = ("python %s create_files "
+ "-f 1 --base-file-name test_file --fixed-file-size 1k %s"
+ % (self.script_upload_path, mount_obj.mountpoint))
+ proc = g.run_async(mount_obj.client_system, cmd,
+ user=mount_obj.user)
+ all_mounts_procs.append(proc)
+ # Validate I/O
+ g.log.info("Wait for IO to complete and validate IO.....")
+ ret = validate_io_procs(all_mounts_procs, self.mounts)
+ self.assertTrue(ret, "IO failed on some of the clients")
+ g.log.info("IO is successful on all mounts")
+ g.log.info("Successfully created a new file of same name "
+ "from mount point")
+
+ g.log.info("bringing brick2 back online")
+ ret = bring_bricks_online(self.mnode, self.volname, all_bricks[1])
+        self.assertTrue(ret, "unable to bring brick2 online")
+ g.log.info("Successfully brought the following brick online "
+ ": %s", str(all_bricks[1]))
+
+ g.log.info("enabling the self heal daemon")
+ ret = enable_self_heal_daemon(self.mnode, self.volname)
+ self.assertTrue(ret, "failed to enable self heal daemon")
+ g.log.info("Successfully enabled the self heal daemon")
+
+ g.log.info("checking if file is in split-brain")
+ ret = is_volume_in_split_brain(self.mnode, self.volname)
+ self.assertTrue(ret, "unable to create split-brain scenario")
+ g.log.info("Successfully created split brain scenario")
+
+ g.log.info("resolving split-brain by choosing second brick as "
+ "the source brick")
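+        # Run "gluster v heal <vol> split-brain source-brick <brick> <file>"
+        # from one of the servers; the copy of the file on all_bricks[1] is
+        # taken as the good copy and overwrites the copy on the other brick.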
+ node, _ = all_bricks[0].split(':')
+        command = ("gluster v heal %s split-brain source-brick %s "
+                   "/test_file0.txt" % (self.volname, all_bricks[1]))
+ ret, _, _ = g.run(node, command)
+ self.assertEqual(ret, 0, "command execution not successful")
+ # triggering heal
+ ret = trigger_heal(self.mnode, self.volname)
+ self.assertTrue(ret, "heal not triggered")
+ # waiting for heal to complete
+ ret = monitor_heal_completion(self.mnode, self.volname,
+ timeout_period=120)
+ self.assertTrue(ret, "heal not completed")
+ # checking if file is in split-brain
+ ret = is_volume_in_split_brain(self.mnode, self.volname)
+ self.assertFalse(ret, "file still in split-brain")
+ g.log.info("Successfully resolved split brain situation using "
+ "CLI based resolution")