2020-03-09 10:11:07 +01:00
|
|
|
#!/usr/bin/python
|
|
|
|
# -*- coding: utf-8 -*-
|
|
|
|
|
|
|
|
# Copyright: (c) 2016, Mathieu Bultel <mbultel@redhat.com>
|
|
|
|
# GNU General Public License v3.0+ (see COPYING or https://www.gnu.org/licenses/gpl-3.0.txt)
|
|
|
|
|
|
|
|
from __future__ import absolute_import, division, print_function
|
|
|
|
__metaclass__ = type
|
|
|
|
|
|
|
|
# Module documentation in YAML form; nesting restored so that each option's
# attributes sit under the option they describe.
DOCUMENTATION = '''
---
module: pacemaker_cluster
short_description: Manage pacemaker clusters
author:
  - Mathieu Bultel (@matbu)
description:
  - This module can manage a pacemaker cluster and nodes from Ansible using
    the pacemaker cli.
options:
  state:
    description:
      - Indicate desired state of the cluster
    choices: [ cleanup, offline, online, restart ]
    type: str
  node:
    description:
      - Specify which node of the cluster you want to manage. None == the
        cluster status itself, 'all' == check the status of all nodes.
    type: str
  timeout:
    description:
      - Timeout, in seconds, after which the module considers that the action has failed
    default: 300
    type: int
  force:
    description:
      - Force the change of the cluster state
    type: bool
    default: 'yes'
'''
|
|
|
|
# Usage example in YAML form; nesting restored so the task belongs to the
# play's task list and `state` is an argument of the module call.
EXAMPLES = '''
---
- name: Set cluster Online
  hosts: localhost
  gather_facts: no
  tasks:
    - name: Get cluster state
      community.general.pacemaker_cluster:
        state: online
'''
|
|
|
|
|
|
|
|
# Return-value documentation in YAML form; nesting restored so each key's
# attributes sit under that key.
RETURN = '''
changed:
    description: True if the cluster state has changed
    type: bool
    returned: always
out:
    description: The output of the current state of the cluster. It returns a
                 list of the node states.
    type: str
    sample: 'out: [[" overcloud-controller-0", " Online"]]}'
    returned: always
rc:
    description: exit code of the module
    type: int
    returned: always
'''
|
|
|
|
|
|
|
|
import time
|
|
|
|
|
|
|
|
from ansible.module_utils.basic import AnsibleModule
|
|
|
|
|
|
|
|
|
|
|
|
# Message looked for in the output of `pcs cluster status` to decide that the
# cluster is not running on this node.
_PCS_CLUSTER_DOWN = "Error: cluster is not currently running on this node"


def get_cluster_status(module):
    """Return 'offline' or 'online' for the cluster as seen from this node.

    Runs `pcs cluster status` through ``module.run_command`` and inspects the
    captured output; the exit status is not consulted.

    :param module: object providing ``run_command(cmd) -> (rc, out, err)``.
    :returns: the string ``'offline'`` when the "not running" message is
        found (or stdout is empty), otherwise ``'online'``.
    """
    cmd = "pcs cluster status"
    rc, out, err = module.run_command(cmd)
    out = out or ''
    err = err or ''

    # The message may be surrounded by other text (e.g. a trailing newline)
    # and may arrive on either stream, so look for it inside the output
    # rather than the other way round.
    message_found = _PCS_CLUSTER_DOWN in out or _PCS_CLUSTER_DOWN in err

    # Backward compatibility: the previous test (`out in _PCS_CLUSTER_DOWN`)
    # also reported 'offline' for an empty stdout or a fragment of the
    # message. Presumably pcs prints the error on stderr and leaves stdout
    # empty -- TODO confirm; the behaviour is kept either way.
    legacy_match = out.strip() in _PCS_CLUSTER_DOWN

    if message_found or legacy_match:
        return 'offline'
    return 'online'
|
|
|
|
|
|
|
|
|
|
|
|
def get_node_status(module, node='all'):
    """Return the per-node status reported by `pcs cluster pcsd-status`.

    :param module: object providing ``run_command`` and ``fail_json``.
    :param node: name of the node to query. ``'all'`` (the default) or
        ``None`` queries without a node argument.
    :returns: a list with one entry per output line, each entry being the
        line split on ``':'`` (whitespace is preserved, so callers strip it).
    """
    # Built as an argument list so a node name is always passed to pcs as a
    # single argument.
    cmd = ["pcs", "cluster", "pcsd-status"]
    # 'all' is this module's own keyword, not a node name: only a specific
    # node is appended to the command. (The previous code had the two
    # branches swapped.)
    if node is not None and node != 'all':
        cmd.append(node)

    rc, out, err = module.run_command(cmd)
    # NOTE(review): only exit status 1 is treated as a failure, as before;
    # other non-zero statuses fall through to parsing -- confirm intended.
    if rc == 1:
        module.fail_json(msg="Command execution failed.\nCommand: `%s`\nError: %s" % (' '.join(cmd), err))

    return [line.split(':') for line in out.splitlines()]
|
|
|
|
|
|
|
|
|
|
|
|
def clean_cluster(module, timeout):
    """Run `pcs resource cleanup` and report a failure through the module.

    :param module: object providing ``run_command`` and ``fail_json``.
    :param timeout: accepted for signature parity with the other helpers;
        it is not used here.
    """
    cleanup_cmd = "pcs resource cleanup"
    status, _stdout, stderr = module.run_command(cleanup_cmd)

    # Anything other than exit status 1 is considered fine.
    if status != 1:
        return

    failure = "Command execution failed.\nCommand: `%s`\nError: %s" % (cleanup_cmd, stderr)
    module.fail_json(msg=failure)
|
|
|
|
|
|
|
|
|
|
|
|
def set_cluster(module, state, timeout, force):
    """Start or stop the cluster, then wait until it reports that state.

    :param module: object providing ``run_command`` and ``fail_json``.
    :param state: ``'online'`` (runs `pcs cluster start`) or ``'offline'``
        (runs `pcs cluster stop`).
    :param timeout: maximum number of seconds to wait for the cluster to
        report the requested state.
    :param force: when true, ``--force`` is appended to the pcs command.

    Failures (unsupported state, command exit status 1, timeout) are
    reported through ``module.fail_json``.
    """
    if state == 'online':
        cmd = "pcs cluster start"
    elif state == 'offline':
        cmd = "pcs cluster stop"
    else:
        # Previously this fell through and crashed on an unbound `cmd`.
        module.fail_json(msg="Unsupported cluster state `%s`" % state)
        return
    if force:
        cmd = "%s --force" % cmd

    rc, out, err = module.run_command(cmd)
    if rc == 1:
        module.fail_json(msg="Command execution failed.\nCommand: `%s`\nError: %s" % (cmd, err))

    # Poll the cluster status until it matches or the deadline passes. The
    # status is checked at least once, and the loop sleeps between checks
    # instead of spawning pcs back to back.
    poll_interval = 1
    deadline = time.time() + timeout
    while True:
        if get_cluster_status(module) == state:
            return
        remaining = deadline - time.time()
        if remaining <= 0:
            break
        time.sleep(min(poll_interval, remaining))

    module.fail_json(msg="Failed to set the state `%s` on the cluster\n" % (state))
|
|
|
|
|
|
|
|
|
|
|
|
def set_node(module, state, timeout, force, node='all'):
    """Start or stop cluster nodes, then wait until they report that state.

    The nodes are taken from ``get_node_status(module, node)``; a pcs command
    is run for every listed node whose status differs from ``state``.

    :param module: object providing ``run_command`` and ``fail_json``.
    :param state: ``'online'`` (runs `pcs cluster start`) or ``'offline'``
        (runs `pcs cluster stop`).
    :param timeout: maximum number of seconds to wait for the nodes acted
        upon to report the requested state.
    :param force: when true, ``--force`` is appended to the pcs command.
    :param node: forwarded to ``get_node_status`` to select the nodes.

    Failures (unsupported state, command exit status 1, timeout) are
    reported through ``module.fail_json``.
    """
    # map states
    if state == 'online':
        base_cmd = "pcs cluster start"
    elif state == 'offline':
        base_cmd = "pcs cluster stop"
    else:
        module.fail_json(msg="Unsupported node state `%s`" % state)
        return
    if force:
        base_cmd = "%s --force" % base_cmd

    # Run the command once per node that is not yet in the requested state.
    # Each command is built from `base_cmd`, so node names from earlier
    # iterations are not carried over into later commands.
    pending = []
    for entry in get_node_status(module, node):
        if len(entry) < 2:
            # Line without a "name: status" shape; nothing to act on.
            continue
        name = entry[0].strip()
        if entry[1].strip().lower() == state:
            continue
        cmd = "%s %s" % (base_cmd, name)
        rc, out, err = module.run_command(cmd)
        if rc == 1:
            module.fail_json(msg="Command execution failed.\nCommand: `%s`\nError: %s" % (cmd, err))
        pending.append(name)

    # Wait until every node we acted on reports the requested state. The
    # same query as above is used, so the same node names are expected back.
    poll_interval = 1
    deadline = time.time() + timeout
    while pending:
        reported = {}
        for entry in get_node_status(module, node):
            if len(entry) >= 2:
                reported[entry[0].strip()] = entry[1].strip().lower()
        pending = [name for name in pending if reported.get(name) != state]
        if not pending:
            break
        remaining = deadline - time.time()
        if remaining <= 0:
            module.fail_json(msg="Failed to set the state `%s` on the cluster\n" % (state))
            return
        time.sleep(min(poll_interval, remaining))
|
|
|
|
|
|
|
|
|
|
|
|
def main():
    """Module entry point: parse the parameters and apply the requested state.

    * ``online`` / ``offline`` without ``node``: compare the cluster status
      with the requested state and start/stop the cluster when they differ.
    * ``online`` / ``offline`` with ``node``: compare the first status entry
      returned by ``get_node_status`` with the requested state and start/stop
      the cluster when they differ.
    * ``restart``: stop the cluster, then start it again.
    * ``cleanup``: run the resource cleanup.

    In check mode no pcs command that changes the cluster is run; the module
    only reports whether a change would be made. Every path ends in
    ``exit_json`` or ``fail_json``.
    """
    argument_spec = dict(
        state=dict(type='str', choices=['online', 'offline', 'restart', 'cleanup']),
        node=dict(type='str'),
        timeout=dict(type='int', default=300),
        force=dict(type='bool', default=True),
    )

    module = AnsibleModule(
        argument_spec,
        supports_check_mode=True,
    )
    state = module.params['state']
    node = module.params['node']
    force = module.params['force']
    timeout = module.params['timeout']

    if state in ('online', 'offline'):
        if node is None:
            # Get cluster status
            cluster_state = get_cluster_status(module)
            if cluster_state == state:
                module.exit_json(changed=False, out=cluster_state)
            elif module.check_mode:
                # A change would be made; report it without touching the cluster.
                module.exit_json(changed=True, out=cluster_state)
            else:
                set_cluster(module, state, timeout, force)
                cluster_state = get_cluster_status(module)
                if cluster_state == state:
                    module.exit_json(changed=True, out=cluster_state)
                else:
                    module.fail_json(msg="Fail to bring the cluster %s" % state)
        else:
            node_states = get_node_status(module, node)
            if not node_states:
                # Previously the module ended here without returning anything.
                module.fail_json(msg="No status was reported for node `%s`" % node)
            else:
                # Only the first reported entry decides, as before. An entry
                # without a status field is treated as "not in the requested
                # state" instead of raising IndexError.
                first = node_states[0]
                current = first[1].strip().lower() if len(first) > 1 else None
                if current == state:
                    module.exit_json(changed=False, out=node_states)
                elif module.check_mode:
                    module.exit_json(changed=True, out=node_states)
                else:
                    # Set cluster status if needed
                    set_cluster(module, state, timeout, force)
                    node_states = get_node_status(module, node)
                    module.exit_json(changed=True, out=node_states)

    elif state == 'restart':
        if module.check_mode:
            # A restart always counts as a change.
            module.exit_json(changed=True, out=get_cluster_status(module))
        else:
            set_cluster(module, 'offline', timeout, force)
            cluster_state = get_cluster_status(module)
            if cluster_state == 'offline':
                set_cluster(module, 'online', timeout, force)
                cluster_state = get_cluster_status(module)
                if cluster_state == 'online':
                    module.exit_json(changed=True, out=cluster_state)
                else:
                    module.fail_json(msg="Failed during the restart of the cluster, the cluster can't be started")
            else:
                module.fail_json(msg="Failed during the restart of the cluster, the cluster can't be stopped")

    elif state == 'cleanup':
        if not module.check_mode:
            clean_cluster(module, timeout)
        cluster_state = get_cluster_status(module)
        module.exit_json(changed=True,
                         out=cluster_state)

    else:
        # `state` is optional in the argument spec; without it there is
        # nothing to do, so say so instead of ending without a result.
        module.fail_json(msg="Parameter `state` is required: one of online, offline, restart, cleanup")


if __name__ == '__main__':
    main()
|