fuel-plugin-lma-collector/deployment_scripts/puppet/modules/lma_collector/files/collectd/rabbitmq_info.py

# Name: rabbitmq-collectd-plugin - rabbitmq_info.py
# Author: https://github.com/phrawzty/rabbitmq-collectd-plugin/commits/master
# Description: This plugin uses Collectd's Python plugin to obtain RabbitMQ
#              metrics.
#
# Copyright 2012 Daniel Maher
# Copyright 2015 Mirantis, Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import collectd
import re

import base


NAME = 'rabbitmq_info'
# Override in config by specifying 'RmqcBin'.
RABBITMQCTL_BIN = '/usr/sbin/rabbitmqctl'
# Override in config by specifying 'PmapBin'
PMAP_BIN = '/usr/bin/pmap'
# Override in config by specifying 'Vhost'.
VHOST = "/"

# Used to find disk nodes and running nodes.
CLUSTER_STATUS = re.compile('.*disc,\[([^\]]+)\].*running_nodes,\[([^\]]+)\]',
                            re.S)


class RabbitMqPlugin(base.Base):

    # we need to substract the length of the longest prefix (eg '.consumers')
    MAX_QUEUE_IDENTIFIER_LENGTH = base.Base.MAX_IDENTIFIER_LENGTH - 10

    def __init__(self, *args, **kwargs):
        super(RabbitMqPlugin, self).__init__(*args, **kwargs)
        self.plugin = NAME
        self.rabbitmqctl_bin = RABBITMQCTL_BIN
        self.pidfile = None
        self.pmap_bin = PMAP_BIN
        self.vhost = VHOST
        self.re_queues = []
        self.queues = []

    def _matching_queue(self, name):
        for r in self.re_queues:
            if r.match(name):
                return True

        for q in self.queues:
            if q == name:
                return True

        return False

    def config_callback(self, conf):
        super(RabbitMqPlugin, self).config_callback(conf)

        for node in conf.children:
            if node.key == 'RmqcBin':
                self.rabbitmqctl_bin = node.values[0]
            elif node.key == 'PmapBin':
                self.pmap_bin = node.values[0]
            elif node.key == 'PidFile':
                self.pidfile = node.values[0]
            elif node.key == 'Vhost':
                self.vhost = node.values[0]
            elif node.key == 'Queue':
                for val in node.values:
                    if val.startswith('/') and val.endswith('/') and \
                            len(val) > 2:
                        regex = val[1:len(val) - 1]
                        try:
                            self.re_queues.append(re.compile(regex))
                        except Exception as e:
                            self.logger.error(
                                'Cannot compile regex {}: {}'.format(regex, e))
                            raise e
                    elif len(val) > 0:
                        self.queues.append(val)

            else:
                self.logger.warning('Unknown config key: %s' % node.key)

    def itermetrics(self):
        stats = {}
        stats['messages'] = 0
        stats['memory'] = 0
        stats['consumers'] = 0
        stats['queues'] = 0
        stats['unmirrored_queues'] = 0
        stats['pmap_mapped'] = 0
        stats['pmap_used'] = 0
        stats['pmap_shared'] = 0

        out, err = self.execute([self.rabbitmqctl_bin, '-q', 'status'],
                                shell=False)
        if not out:
            self.logger.error('%s: Failed to get the status' %
                              self.rabbitmqctl_bin)
            return

        for v in ('vm_memory_limit', 'disk_free_limit', 'disk_free'):
            try:
                stats[v] = int(re.findall('{%s,([0-9]+)}' % v, out)[0])
            except:
                self.logger.error('%s: Failed to get %s' %
                                  (self.rabbitmqctl_bin, v))

        mem_str = re.findall('{memory,\s+\[([^\]]+)\]\}', out)
        # We are only interested by the total of memory used
        # TODO(all): Get all informations about memory usage from mem_str
        try:
            stats['used_memory'] = int(re.findall('total,([0-9]+)',
                                                  mem_str[0])[0])
        except:
            self.logger.error('%s: Failed to get the memory used by rabbitmq' %
                              self.rabbitmqctl_bin)

        if 'vm_memory_limit' in stats and 'used_memory' in stats:
            stats['remaining_memory'] = \
                stats['vm_memory_limit'] - stats['used_memory']
        if 'disk_free' in stats and 'disk_free_limit' in stats:
            stats['remaining_disk'] = \
                stats['disk_free'] - stats['disk_free_limit']

        out, err = self.execute([self.rabbitmqctl_bin, '-q', 'cluster_status'],
                                shell=False)
        if not out:
            self.logger.error('%s: Failed to get the cluster status' %
                              self.rabbitmqctl_bin)
            return

        # TODO(all): Need to be modified in case we are using RAM nodes.
        status = CLUSTER_STATUS.findall(out)
        if len(status) == 0:
            self.logger.error('%s: Failed to parse (%s)' %
                              (self.rabbitmqctl_bin, out))
        else:
            stats['total_nodes'] = len(status[0][0].split(","))
            stats['running_nodes'] = len(status[0][1].split(","))

        out, err = self.execute([self.rabbitmqctl_bin, '-q',
                                 'list_connections'], shell=False)
        if not out:
            self.logger.error('%s: Failed to get the number of connections' %
                              self.rabbitmqctl_bin)
            return
        stats['connections'] = len(out.split('\n'))

        out, err = self.execute([self.rabbitmqctl_bin, '-q', 'list_exchanges'],
                                shell=False)
        if not out:
            self.logger.error('%s: Failed to get the number of exchanges' %
                              self.rabbitmqctl_bin)
            return
        stats['exchanges'] = len(out.split('\n'))

        out, err = self.execute([self.rabbitmqctl_bin, '-q', '-p', self.vhost,
                                 'list_queues', 'name', 'messages', 'memory',
                                 'consumers', 'slave_pids',
                                 'synchronised_slave_pids'], shell=False)
        if not out:
            self.logger.error('%s: Failed to get the list of queues' %
                              self.rabbitmqctl_bin)
            return

        for line in out.split('\n'):
            ctl_stats = line.split('\t')
            try:
                ctl_stats[1] = int(ctl_stats[1])
                ctl_stats[2] = int(ctl_stats[2])
                ctl_stats[3] = int(ctl_stats[3])
            except:
                continue

            stats['queues'] += 1
            stats['messages'] += ctl_stats[1]
            stats['memory'] += ctl_stats[2]
            stats['consumers'] += ctl_stats[3]

            queue_name = ctl_stats[0]
            if self._matching_queue(queue_name):
                meta = {
                    'queue': ctl_stats[0][:self.MAX_QUEUE_IDENTIFIER_LENGTH]
                }
                yield {
                    'type_instance': 'queue_messages',
                    'values': ctl_stats[1],
                    'meta': meta
                }
                yield {
                    'type_instance': 'queue_memory',
                    'values': ctl_stats[2],
                    'meta': meta
                }
                yield {
                    'type_instance': 'queue_consumers',
                    'values': ctl_stats[3],
                    'meta': meta
                }

            # we need to check if the list of synchronised slaves is
            # equal to the list of slaves.
            try:
                slaves = re.findall('<([a-zA-Z@\-.0-9]+)>', ctl_stats[4])
                for s in slaves:
                    if s not in ctl_stats[5]:
                        stats['unmirrored_queues'] += 1
                        break
            except IndexError:
                pass

        if not stats['memory'] > 0:
            self.logger.warning(
                '%s reports 0 memory usage. This is probably incorrect.' %
                self.rabbitmqctl_bin)

        # pmap metrics are only collected if the location of the pid file is
        # explicitly configured
        if self.pidfile:
            try:
                with open(self.pidfile, 'r') as f:
                    pid = f.read().strip()
            except:
                self.logger.error('Unable to read %s' % self.pidfile)
                return

            # use pmap to get proper memory stats
            out, err = self.execute([self.pmap_bin, '-d', pid], shell=False)
            if not out:
                self.logger.error('Failed to run %s' % self.pmap_bin)
                return

            out = out.split('\n')[-1]
            if re.match('mapped', out):
                m = re.match(r"\D+(\d+)\D+(\d+)\D+(\d+)", out)
                stats['pmap_mapped'] = int(m.group(1))
                stats['pmap_used'] = int(m.group(2))
                stats['pmap_shared'] = int(m.group(3))
            else:
                self.logger.warning('%s returned something strange.' %
                                    self.pmap_bin)

        for k, v in stats.iteritems():
            yield {'type_instance': k, 'values': v}


plugin = RabbitMqPlugin(collectd)


def init_callback():
    plugin.restore_sigchld()


def config_callback(conf):
    plugin.config_callback(conf)


def read_callback():
    plugin.read_callback()

collectd.register_init(init_callback)
collectd.register_config(config_callback)
collectd.register_read(read_callback)