summaryrefslogtreecommitdiffstats
path: root/tests/functional/glusterd/test_self_heal_quota_daemon_after_reboot.py
blob: f1a523ce64b6dbac65d7d2dc10cf92abec651130 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
#  Copyright (C) 2017-2020  Red Hat, Inc. <http://www.redhat.com>
#
#  This program is free software; you can redistribute it and/or modify
#  it under the terms of the GNU General Public License as published by
#  the Free Software Foundation; either version 2 of the License, or
#  any later version.
#
#  This program is distributed in the hope that it will be useful,
#  but WITHOUT ANY WARRANTY; without even the implied warranty of
#  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
#  GNU General Public License for more details.
#
#  You should have received a copy of the GNU General Public License along
#  with this program; if not, write to the Free Software Foundation, Inc.,
#  51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.

"""
        Description:
        Test Cases in this module related to test self heal
        deamon and quota daemon status after reboot.
"""
from glusto.core import Glusto as g
from glustolibs.gluster.exceptions import ExecutionError
from glustolibs.gluster.gluster_base_class import GlusterBaseClass, runs_on
from glustolibs.gluster.quota_ops import quota_enable, quota_limit_usage
from glustolibs.gluster.volume_ops import get_volume_status
from glustolibs.misc.misc_libs import reboot_nodes_and_wait_to_come_online
from glustolibs.gluster.gluster_init import (is_glusterd_running,
                                             start_glusterd,
                                             wait_for_glusterd_to_start)
from glustolibs.gluster.peer_ops import wait_for_peers_to_connect


@runs_on([['replicated', 'distributed-replicated'], ['glusterfs']])
class TestSelfHealDeamonQuotaDeamonAfterReboot(GlusterBaseClass):
    def setUp(self):
        self.get_super_method(self, 'setUp')()

        # checking for peer status from every node
        ret = self.validate_peers_are_connected()
        if not ret:
            raise ExecutionError("Servers are not in peer probed state")

        # Creating Volume
        g.log.info("Started creating volume")
        ret = self.setup_volume_and_mount_volume(self.mounts)
        if not ret:
            raise ExecutionError("Volume creation failed: %s" % self.volname)
        g.log.info("Volume created successfully : %s", self.volname)

    def tearDown(self):
        ret = is_glusterd_running(self.servers)
        if ret:
            ret = start_glusterd(self.servers)
            if not ret:
                raise ExecutionError("Failed to start glusterd on %s"
                                     % self.servers)
        g.log.info("Glusterd started successfully on %s", self.servers)

        # checking for peer status from every node
        ret = wait_for_peers_to_connect(self.mnode, self.servers)
        if not ret:
            raise ExecutionError("Peers are not in connected state")

        # stopping the volume and Cleaning up the volume
        ret = self.unmount_volume_and_cleanup_volume(self.mounts)
        if not ret:
            raise ExecutionError("Failed to Cleanup the Volume %s"
                                 % self.volname)
        g.log.info("Volume deleted successfully %s", self.volname)

    def is_daemon_process_running(self):
        """
            function for checking daemon process.
        """
        vol_status_shd_pid_list = []
        vol_status_quotad_pid_list = []
        g.log.info("Total self-heal and quota daemon process should be %d for "
                   "%d nodes", len(self.servers) * 2, len(self.servers))

        # Getting vol status in dictonary format
        vol_status = get_volume_status(self.mnode, self.volname)

        # Getting self-heal daemon and quota daemon pids of every host from
        # gluster volume status
        for server in self.servers:
            vol_status_quotad_pid_list.append(
                vol_status[self.volname][server]['Quota Daemon']['pid'])
            vol_status_shd_pid_list.append(
                vol_status[self.volname][server]['Self-heal Daemon']['pid'])

        g.log.info("shd list from get volume status: %s",
                   vol_status_shd_pid_list)
        g.log.info("quotad list from get volume status: %s",
                   vol_status_quotad_pid_list)

        sh_daemon_list = []
        quotad_list = []

        # Finding and Storing all hosts self heal daemon
        # in to sh_daemon_list, all
        # host quota daemon into quotad_list list using ps command
        for daemon_name, daemon_list in (('glustershd', sh_daemon_list),
                                         ('quotad', quotad_list)):
            for host in self.servers:
                cmd = "ps -eaf |grep %s |grep -v grep | awk '{ print $2 }'" % (
                    daemon_name)
                ret, out, err = g.run(host, cmd)
                err_msg = (
                    "Failed to find '%s' daemon on the '%s' host using "
                    "'ps -eaf' command.\nret: %s\nout: %s\nerr: %s" % (
                        daemon_name, host, ret, out, err)
                )
                self.assertEqual(ret, 0, err_msg)
                daemon_list.append(out.strip())

        g.log.info("shd list :%s", sh_daemon_list)
        g.log.info("quotad list :%s", quotad_list)

        # Checking in all hosts quota daemon and self heal daemon is
        # running or not
        # Here comparing the list of daemons got from ps command and
        # list of daemons got from vol status command,
        # all daemons should match from both the list
        if sorted(sh_daemon_list + quotad_list) == sorted(
                vol_status_shd_pid_list + vol_status_quotad_pid_list):
            return len(sh_daemon_list + quotad_list) == len(self.servers) * 2

        return False

    def test_daemons_after_reboot(self):
        '''
        Creating volume then performing FUSE mount
        then enable quota to that volume, then set quota
        limit to that volume then perform a reboot and check
        the selfheal daemon and quota daemon running or not
        after reboot
        '''

        # Enabling quota to volume
        ret, _, _ = quota_enable(self.mnode, self.volname)
        self.assertEqual(ret, 0, "Failed to enable quota on volume : "
                                 "%s" % self.volname)
        g.log.info("quota enabled successfully on volume: %s", self.volname)

        # Setting quota limit to volume
        ret, _, _ = quota_limit_usage(
            self.mnode,
            self.volname,
            path='/',
            limit='1GB',
            soft_limit='')
        self.assertEqual(ret, 0, "Quota limit set failed "
                                 "on volume : %s" % self.volname)

        ret, _ = reboot_nodes_and_wait_to_come_online(self.servers[1])
        self.assertTrue(ret, "Failed to reboot the node %s"
                        % self.servers[1])
        g.log.info("Node %s rebooted successfully", self.servers[1])

        # Checking glusterd status and peer status afte reboot of server
        self.assertTrue(
            wait_for_glusterd_to_start(self.servers[1]),
            "Failed to start glusterd on %s" % self.servers[1])
        self.assertTrue(
            wait_for_peers_to_connect(self.mnode, self.servers),
            "some peers are not in connected state")
        g.log.info("glusterd is running and all peers are in "
                   "connected state")

        # Checks self heal daemon and quota daemon process running or not
        ret = self.is_daemon_process_running()
        self.assertTrue(ret, "failed to run self-heal and quota daemon "
                             "processs on all hosts")
        g.log.info("self-heal and quota daemons are running on all "
                   "hosts successfully")