summaryrefslogtreecommitdiffstats
path: root/cns-libs/cnslibs/common/dynamic_provisioning.py
blob: 70dffa4f5467d0baf705c8e68eb2dfd2ad1c7ec3 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
from collections import OrderedDict
import json
import os
import tempfile

from glusto.core import Glusto as g
from glustolibs.misc.misc_libs import upload_scripts
import rtyaml

from cnslibs.common import exceptions
from cnslibs.common.waiter import Waiter


# Absolute path of the directory containing this module; the sample
# template files read by the functions in this module are looked up here.
TEMPLATE_DIR = os.path.abspath(os.path.dirname(__file__))


def create_pvc_file(hostname, claim_name, storage_class, size):
    '''
     Render the sample glusterfs PVC template and write it to
     "/<claim_name>.json" on the given host over an rpyc connection.
     Args:
         hostname (str): host on which the pvc file is created
         claim_name (str): name of the claim, also used as the
                           file name, ex: storage-claim1
         storage_class (str): name of the storage class to put into
                              the storage-class annotation
         size (int): size of the claim in GB
                     ex: 10 (for 10GB claim)
     Returns:
         bool: True if the file was written,
               False if the connection or the write failed
    '''
    template_path = os.path.join(
        TEMPLATE_DIR, "sample-glusterfs-pvc-claim.json")
    with open(template_path) as template_file:
        # OrderedDict keeps the key order of the template in the output
        claim = json.load(template_file, object_pairs_hook=OrderedDict)

    annotation_key = 'volume.beta.kubernetes.io/storage-class'
    claim['metadata']['annotations'][annotation_key] = storage_class
    claim['metadata']['name'] = claim_name
    claim['spec']['resources']['requests']['storage'] = "%dGi" % size

    try:
        remote = g.rpyc_get_connection(hostname, user="root")
        if remote is None:
            g.log.error("Failed to get rpyc connection of node %s"
                        % hostname)
            return False

        remote_path = '/%s.json' % claim_name
        with remote.builtin.open(remote_path, 'w') as remote_file:
            json.dump(claim, remote_file, sort_keys=False,
                      indent=4, ensure_ascii=False)
    except Exception as exc:
        g.log.error("failed to create pvc file %s" % exc)
        return False
    finally:
        # runs on every exit path, including the early "return False"
        g.rpyc_close_connection(hostname, user="root")

    g.log.info("creation of pvc file %s successful" % claim_name)
    return True


def create_app_pod_file(hostname, claim_name, app_name, sample_app_name):
    '''
     This function creates the app pod yaml file "/<app_name>.yaml"
     on the given host from the local template
     "sample-<sample_app_name>-pod.yaml".
     Args:
         hostname (str): hostname on which we need to
                         create app pod file
         claim_name (str): name of the claim
                           ex: storage-claim1
         app_name (str): name of the app-pod to create
                         ex: nginx1
         sample_app_name (str): sample-app-pod-name
                                ex: nginx
     Returns:
         bool: True if successful,
               otherwise False
    '''
    template_path = os.path.join(
        TEMPLATE_DIR, "sample-%s-pod.yaml" % sample_app_name)
    # Context manager so the local template handle is always closed.
    with open(template_path) as template_file:
        data = rtyaml.load(template_file)

    data['spec']['volumes'][0]['persistentVolumeClaim'][
        'claimName'] = claim_name
    data['metadata']['name'] = app_name
    data['spec']['containers'][0]['name'] = app_name
    try:
        conn = g.rpyc_get_connection(hostname, user="root")
        if conn is None:
            g.log.error("Failed to get rpyc connection of node %s"
                        % hostname)
            return False
        # Close the remote file explicitly before the rpyc connection is
        # closed in "finally", so the written data is not left in an
        # unclosed handle.
        with conn.builtin.open('/%s.yaml' % app_name, "w") as data_file:
            rtyaml.dump(data, data_file)
    except Exception as err:
        g.log.error("failed to create app file %s" % err)
        return False
    finally:
        g.rpyc_close_connection(hostname, user="root")
    g.log.info("creation of %s app file successful" % app_name)
    return True


def create_secret_file(hostname, secret_name, namespace,
                       data_key, secret_type):
    '''
     This function creates the secret yaml file "/<secret_name>.yaml"
     on the given host from the local template
     "sample-glusterfs-secret.yaml".
     Args:
         hostname (str): hostname on which we need to create
                         secret yaml file
         secret_name (str): secret name ex: heketi-secret
         namespace (str): namespace ex: storage-project
         data_key (str): data-key ex: cGFzc3dvcmQ=
         secret_type (str): type ex: kubernetes.io/glusterfs
                                 or gluster.org/glusterblock
     Returns:
         bool: True if successful,
               otherwise False
    '''
    template_path = os.path.join(TEMPLATE_DIR, "sample-glusterfs-secret.yaml")
    # Context manager so the local template handle is always closed.
    with open(template_path) as template_file:
        data = rtyaml.load(template_file)

    data['metadata']['name'] = secret_name
    data['data']['key'] = data_key
    data['metadata']['namespace'] = namespace
    data['type'] = secret_type
    try:
        conn = g.rpyc_get_connection(hostname, user="root")
        if conn is None:
            g.log.error("Failed to get rpyc connection of node %s"
                        % hostname)
            return False
        # Close the remote file explicitly before the rpyc connection is
        # closed in "finally", so the written data is not left in an
        # unclosed handle.
        with conn.builtin.open('/%s.yaml' % secret_name, "w") as data_file:
            rtyaml.dump(data, data_file)
    except Exception as err:
        g.log.error("failed to create %s.yaml file %s" % (secret_name, err))
        return False
    finally:
        g.rpyc_close_connection(hostname, user="root")
    g.log.info("creation of %s.yaml file successful" % secret_name)
    return True


def create_storage_class_file(hostname, sc_name, resturl,
                              provisioner, **kwargs):
    '''
     This function creates the storageclass yaml file
     "/<sc_name>-<provisioner suffix>-storage-class.yaml" on the given
     host from the local template "sample-glusterfs-storageclass.yaml".
     Args:
         hostname (str): hostname on which we need to create
                         storageclass yaml file
         sc_name (str): storageclass name ex: fast
         resturl (str): resturl
          ex: http://heketi-storage-project.cloudapps.mystorage.com
         provisioner (str): provisioner in "<prefix>/<suffix>" form
                            ex:  kubernetes.io/glusterfs
                                or gluster.org/glusterblock
     Kwargs:
         **kwargs
            The keys, values in kwargs are:
               restuser:str   ex: username: test-admin
               hacount:int ex: hacount:3
               clusterids:str
                ex: clusterids: "630372ccdc720a92c681fb928f27b53f"
               chapauthenabled:bool ex: chapauthenabled:True/False
               restauthenabled:bool ex: restauthenabled:True/False
               secretnamespace:str ex: secretnamespace:"storage-project"
               secretname:str ex: secretname:"heketi-secret"
               restsecretnamespace:str
                ex: restsecretnamespace:"storage-project"
               restsecretname:str ex: restsecretname:"heketi-secret"
               volumenameprefix:str ex: "dept_qe"
            Only keys with a truthy value are written to the
            storageclass parameters; other keys are ignored.
     Returns:
         bool: True if successful,
               otherwise False (this includes a provisioner
               that does not contain "/")
    '''
    template_path = os.path.join(
        TEMPLATE_DIR, "sample-glusterfs-storageclass.yaml")
    # Context manager so the local template handle is always closed.
    with open(template_path) as template_file:
        data = rtyaml.load(template_file)

    data['metadata']['name'] = sc_name
    data['parameters']['resturl'] = resturl
    data['provisioner'] = provisioner

    for key in ('secretnamespace', 'restuser', 'secretname',
                'restauthenabled', 'restsecretnamespace',
                'restsecretname', 'hacount', 'clusterids',
                'chapauthenabled', 'volumenameprefix'):
        value = kwargs.get(key)
        # Falsy values (None, False, 0, "") are skipped, so whatever the
        # template holds for that parameter is left untouched.
        if value:
            data['parameters'][key] = value

    try:
        conn = g.rpyc_get_connection(hostname, user="root")
        if conn is None:
            g.log.error("Failed to get rpyc connection of node %s"
                        % hostname)
            return False
        # Kept inside the "try": a provisioner without "/" raises
        # IndexError here and is reported as a failure below.
        provisioner_name = provisioner.split("/")
        file_path = "/%s-%s-storage-class.yaml" % (
            sc_name, provisioner_name[1])
        # Close the remote file explicitly before the rpyc connection is
        # closed in "finally", so the written data is not left in an
        # unclosed handle.
        with conn.builtin.open(file_path, "w") as data_file:
            rtyaml.dump(data, data_file)
    except Exception as err:
        g.log.error("failed to create storage-class file %s" % err)
        return False
    finally:
        g.rpyc_close_connection(hostname, user="root")
    g.log.info("creation of %s-storage-class file successful" % sc_name)
    return True


def wait_for_pod_be_ready(hostname, pod_name,
                          timeout=1200, wait_step=60):
    '''
     Poll "oc get pods" until the pod reports ready and Running.
     Args:
         hostname (str): host on which the oc command is executed
         pod_name (str): name of the pod to watch
         timeout (int): overall time budget passed to Waiter,
                        default value is 1200 sec
         wait_step (int): step passed to Waiter,
                          default value is 60 sec
     Returns:
         bool: True once the first container is ready and the
               pod phase is Running
     Raises:
         exceptions.ExecutionError: if the oc command fails, the pod
             phase is "Error", or the waiter expires
    '''
    for w in Waiter(timeout, wait_step):
        # headerless columns: readiness of first container, pod phase
        columns = ":.status.containerStatuses[0].ready,:.status.phase"
        cmd = "oc get pods %s -o=custom-columns=%s" % (pod_name, columns)
        ret, out, err = g.run(hostname, cmd, "root")
        if ret != 0:
            failure = "failed to execute cmd %s" % cmd
            g.log.error(failure)
            raise exceptions.ExecutionError(failure)

        fields = out.strip().split()
        ready_state = fields[0]
        phase = fields[1]

        if ready_state == "true" and phase == "Running":
            g.log.info(
                "pod %s is in ready state and is Running" % pod_name)
            return True

        if phase == "Error":
            failure = "pod %s status error" % pod_name
            g.log.error(failure)
            raise exceptions.ExecutionError(failure)

        # neither ready nor failed yet: let the waiter take the next step
        g.log.info(
            "pod %s ready state is %s, phase is %s, sleeping for %s sec"
            % (pod_name, ready_state, phase, wait_step))

    if w.expired:
        failure = (
            "exceeded timeout %s for waiting for pod %s to be in ready state"
            % (timeout, pod_name))
        g.log.error(failure)
        raise exceptions.ExecutionError(failure)


def get_pod_name_from_dc(hostname, dc_name,
                         timeout=1200, wait_step=60):
    '''
     This function returns the pod name for a deployment config name,
     polling until "oc get pods" lists something for it.
     Args:
         hostname (str): hostname on which we can execute oc
                         commands
         dc_name (str): deployment config name, used as the value of
                        the "deploymentconfig" selector
         timeout (int): timeout value,
                        default value is 1200 sec
         wait_step (int): wait step,
                          default value is 60 sec
     Returns:
         str: stripped output of the oc command (pod name) if
              successful, otherwise raises an exception
     Raises:
         exceptions.ExecutionError: if the oc command fails or no pod
             name is found before the waiter expires
    '''
    cmd = ("oc get pods --all-namespaces -o=custom-columns="
           ":.metadata.name "
           "--no-headers=true "
           "--selector deploymentconfig=%s" % dc_name)
    for w in Waiter(timeout, wait_step):
        ret, out, err = g.run(hostname, cmd, "root")
        if ret != 0:
            msg = ("failed to execute cmd %s" % cmd)
            g.log.error(msg)
            raise exceptions.ExecutionError(msg)
        output = out.strip()
        if output:
            g.log.info("podname is %s for dc %s" % (output, dc_name))
            return output
        # empty output means no pod matched the selector yet
        g.log.info("podname for dc %s not found sleeping for "
                   "%s sec" % (dc_name, wait_step))
    if w.expired:
        # The two literals used to be joined without a space, which
        # produced "pod_namefor dc" in the message.
        err_msg = ("exceeded timeout %s for waiting for pod_name "
                   "for dc %s" % (timeout, dc_name))
        g.log.error(err_msg)
        raise exceptions.ExecutionError(err_msg)


def create_mongodb_pod(hostname, pvc_name, pvc_size, sc_name):
    '''
     Upload a rendered copy of "mongodb-template.json" to /tmp on the
     host and run "oc new-app" against it.
     Args:
         hostname (str): host on which the mongodb pod is created
         pvc_name (str): name of the pvc, passed as
                         DATABASE_SERVICE_NAME
                         ex: pvc-claim1
         pvc_size: value for VOLUME_CAPACITY; "Gi" is appended to it
         sc_name (str): name of the storage class
                        ex: fast
     Returns:
         bool: True if the "oc new-app" command succeeded,
               False otherwise
    '''
    with open(os.path.join(TEMPLATE_DIR, "mongodb-template.json"),
              'r') as template_file:
        # OrderedDict keeps the key order of the template in the output
        template = json.load(template_file, object_pairs_hook=OrderedDict)
    annotations = template['objects'][1]['metadata']['annotations']
    annotations['volume.beta.kubernetes.io/storage-class'] = sc_name

    local_fd, local_path = tempfile.mkstemp(
        prefix='cns-automation-mongodb-pvcname-%s-' % pvc_name,
        suffix='.json')
    remote_dir = '/tmp'
    # the uploaded copy keeps the temp file's base name
    remote_path = os.path.join(remote_dir, os.path.basename(local_path))
    try:
        with os.fdopen(local_fd, 'w') as local_file:
            json.dump(template, local_file,
                      sort_keys=False, indent=4, ensure_ascii=False)
        uploaded = upload_scripts(hostname, local_path, remote_dir, "root")
        if not uploaded:
            g.log.error("Failed to upload mongodp template to %s" % hostname)
            return False
    finally:
        # the local temp file is removed whether or not the upload worked
        os.remove(local_path)

    try:
        remote = g.rpyc_get_connection(hostname, user="root")
        if remote is None:
            g.log.error("Failed to get rpyc connection of node %s"
                        % hostname)
            return False
        cmd = (
            "oc new-app %s --param=DATABASE_SERVICE_NAME=%s "
            "--param=VOLUME_CAPACITY=%sGi" % (
                remote_path, pvc_name, pvc_size))
        ret, out, err = g.run(hostname, cmd, "root")
        if ret != 0:
            g.log.error("failed to execute cmd %s on %s" % (cmd, hostname))
            return False
    except Exception as exc:
        g.log.error("failed to create mongodb pod %s" % exc)
        return False
    finally:
        g.rpyc_close_connection(hostname, user="root")

    g.log.info("creation of mongodb pod successfull")
    return True


def get_pvc_status(hostname, pvc_name):
    '''
     Fetch the status column of a PVC from "oc get pvc" output.
     Args:
         hostname (str): host on which the oc command is executed
         pvc_name (str): pattern given to grep to pick the PVC line(s)
     Returns:
         tuple: (True, status) where status is the second column of
                the first matching line (empty string if the command
                printed nothing), or (False, stderr) if the command
                returned a non-zero exit code.
    '''
    cmd = "oc get pvc | grep %s | awk '{print $2}'" % pvc_name
    ret, out, err = g.run(hostname, cmd, "root")
    if ret == 0:
        # only the first line of the output is considered
        first_line = out.strip().split("\n")[0]
        return True, first_line.strip()
    g.log.error("failed to execute cmd %s" % cmd)
    return False, err


def verify_pvc_status_is_bound(hostname, pvc_name, timeout=120, wait_step=3):
    """Wait until a PVC reports the 'Bound' status.

    Args:
        hostname (str): host on which the oc commands are executed
        pvc_name (str): name of the PVC whose status is polled
        timeout (int): overall time budget in seconds passed to Waiter
        wait_step (int): step in seconds passed to Waiter
    Returns:
        str: the given pvc_name once its status is 'Bound'.
    Raises:
        exceptions.ExecutionError: if the status query itself fails.
        AssertionError: if the PVC is not found on two polls, is in
            'Error' or any other unexpected status, or the waiter
            expires before 'Bound' is seen.
    """
    missed_once = False
    for w in Waiter(timeout, wait_step):
        ret, status = get_pvc_status(hostname, pvc_name)
        if ret is not True:
            failure = (
                "Failed to execute 'get' command for '%s' PVC. "
                "Got following responce: %s" % (pvc_name, status))
            g.log.error(failure)
            raise exceptions.ExecutionError(failure)

        if status == "Bound":
            g.log.info("PVC '%s' is in Bound state." % pvc_name)
            return pvc_name

        if status == "Pending":
            g.log.info(
                "PVC '%s' is in Pending state, sleeping for %s sec"
                % (pvc_name, wait_step))
            continue

        if status == "":
            g.log.info(
                "PVC '%s' not found, sleeping for %s sec."
                % (pvc_name, wait_step))
            if not missed_once:
                # a single miss is tolerated; the second one is fatal
                missed_once = True
                continue
            failure = (
                "PVC '%s' has not been found 2 times already. "
                "Make sure you provided correct PVC name." % pvc_name)
        elif status == "Error":
            failure = "PVC '%s' is in 'Error' state." % pvc_name
            g.log.error(failure)
        else:
            failure = "PVC %s has different status - %s" % (pvc_name, status)
            g.log.error(failure)

        # every path reaching this point carries a failure message
        raise AssertionError(failure)

    if w.expired:
        # for debug purpose to see why provisioning failed
        cmd = "oc describe pvc %s | grep ProvisioningFailed" % pvc_name
        ret, out, err = g.run(hostname, cmd, "root")
        g.log.info("cmd %s - out- %s err- %s" % (cmd, out, err))
        failure = (
            "Exceeded timeout of '%s' seconds for verifying PVC '%s' "
            "to reach the 'Bound' status." % (timeout, pvc_name))
        g.log.error(failure)
        raise AssertionError(failure)