collector: Support for collectd as one of the collectors.

The changes include: 1. Configuration in 05_collector.conf. User can specify the metrics that are of their interest and also fine tune the same. 2. collectd_bucky.py: This is derived from python_bucky library. Formal approval for reuse is obtained. 3. collectd.py: This is the main file that receives the samples, stores the required ones, plots the values and saves the values in a data-file in results folder. 4. Fixed some pylint errors 5. Added required libraries to requirements.txt. hashlib is supported by default. However, matplotlib and numpy required 6. added __init__.py to overcome import errors. 7. Crypto needs pycrypto module 8. Builtin filter function usage return bad-builtin pylint warning. Rewrite to remove filter function. 9. Added support for reporting the ovs processes statistics. 10. Import order corrected according to pylint 11. Fixed copyright issues, removed python-3 checking, enhance to include VPP and qemu processes. 12. Removed pylint disables. 13. Added documentaion to describe sample information 14. Added @staticmethod to remove disable-no-self-use. 15. Fixed year in Copyright. 16. Updated print_results function to print the process values. 17. Removed example values form INTELRDT_XKEYS in conf file 18. Removed use of len(SEQUENCE) in loop and renamed data to pdata to avoid name clashes 19. Fixed issue with requirements.txt Note: A separate documentation covering all external tools will be provided. JIRA: VSPERF-505 Change-Id: Ieedcbe7b92e8933263d34df12b1e24be8447b524 Signed-off-by: Sridhar K. N. Rao <sridhar.rao@spirent.com>
author: Sridhar K. N. Rao <sridhar.rao@spirent.com> 2017-11-28 16:13:50 +0530
committer: Martin Klozik <martinx.klozik@intel.com> 2018-01-31 08:31:01 +0000
commit: 23eff36d6a4b9e42ce06152e2b75e50fb7aaa5c5 (patch)
tree: 45373add2d85256b9ca529f7921cc7aa754991a9 /tools/collectors/collectd
parent: a897b7bdc10e20db989d10ff7cdf8a14b5a5d517 (diff)
3 files changed, 1051 insertions, 0 deletions
diff --git a/tools/collectors/collectd/__init__.py b/tools/collectors/collectd/__init__.py
new file mode 100755
index 00000000..25e2c3c2
--- /dev/null
+++ b/tools/collectors/collectd/__init__.py
@@ -0,0 +1,17 @@
+# Copyright 2017 Spirent Communications.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""
+Wrapper for Collectd as a collector
+"""
diff --git a/tools/collectors/collectd/collectd.py b/tools/collectors/collectd/collectd.py
new file mode 100644
index 00000000..90df6b04
--- /dev/null
+++ b/tools/collectors/collectd/collectd.py
@@ -0,0 +1,265 @@
+# Copyright 2017-2018 Spirent Communications.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""
+Collects samples from collectd through collectd_bucky.
+Depending on the policy - decides to keep the sample or discard.
+Plot the values of the stored samples once the test is completed
+"""
+
+import copy
+import csv
+import logging
+import multiprocessing
+import os
+from collections import OrderedDict
+import queue
+
+import matplotlib.pyplot as plt
+import numpy as np
+import tools.collectors.collectd.collectd_bucky as cb
+from tools.collectors.collector import collector
+from conf import settings
+
+# The y-lables. Keys in this dictionary are used as y-labels.
+YLABELS = {'No/Of Packets': ['dropped', 'packets', 'if_octets', 'errors',
+                             'if_rx_octets', 'if_tx_octets'],
+           'Jiffies': ['cputime'],
+           'Bandwidth b/s': ['memory_bandwidth'],
+           'Bytes': ['bytes.llc']}
+
+
+def get_label(sample):
+    """
+    Returns the y-label for the plot.
+    """
+    for label in YLABELS:
+        if any(r in sample for r in YLABELS[label]):
+            return label
+
+
+def plot_graphs(dict_of_arrays):
+    """
+    Plot the values
+    Store the data used for plotting.
+    """
+    i = 1
+    results_dir = settings.getValue('RESULTS_PATH')
+    for key in dict_of_arrays:
+        tup_list = dict_of_arrays[key]
+        two_lists = list(map(list, zip(*tup_list)))
+        y_axis_list = two_lists[0]
+        x_axis_list = two_lists[1]
+        if np.count_nonzero(y_axis_list) > 0:
+            with open(os.path.join(results_dir,
+                                   str(key) + '.data'), "w") as pfile:
+                writer = csv.writer(pfile, delimiter='\t')
+                writer.writerows(zip(x_axis_list, y_axis_list))
+            plt.figure(i)
+            plt.plot(x_axis_list, y_axis_list)
+            plt.xlabel("Time (Ticks)")
+            plt.ylabel(get_label(key))
+            plt.savefig(os.path.join(results_dir, str(key) + '.png'))
+            plt.cla()
+            plt.clf()
+            plt.close()
+            i = i + 1
+
+
+def get_results_to_print(dict_of_arrays):
+    """
+    Return a results dictionary for report tool to
+    print the process-statistics.
+    """
+    presults = OrderedDict()
+    results = OrderedDict()
+    for key in dict_of_arrays:
+        if ('processes' in key and
+                any(proc in key for proc in ['ovs', 'vpp', 'qemu'])):
+            reskey = '.'.join(key.split('.')[2:])
+            preskey = key.split('.')[1] + '_collectd'
+            tup_list = dict_of_arrays[key]
+            two_lists = list(map(list, zip(*tup_list)))
+            y_axis_list = two_lists[0]
+            mean = 0.0
+            if np.count_nonzero(y_axis_list) > 0:
+                mean = np.mean(y_axis_list)
+            results[reskey] = mean
+            presults[preskey] = results
+    return presults
+
+
+class Receiver(multiprocessing.Process):
+    """
+    Wrapper Receiver (of samples) class
+    """
+    def __init__(self, pd_dict, control):
+        """
+        Initialize.
+        A queue will be shared with collectd_bucky
+        """
+        super(Receiver, self).__init__()
+        self.daemon = False
+        self.q_of_samples = multiprocessing.Queue()
+        self.server = cb.get_collectd_server(self.q_of_samples)
+        self.control = control
+        self.pd_dict = pd_dict
+        self.collectd_cpu_keys = settings.getValue('COLLECTD_CPU_KEYS')
+        self.collectd_processes_keys = settings.getValue(
+            'COLLECTD_PROCESSES_KEYS')
+        self.collectd_iface_keys = settings.getValue(
+            'COLLECTD_INTERFACE_KEYS')
+        self.collectd_iface_xkeys = settings.getValue(
+            'COLLECTD_INTERFACE_XKEYS')
+        self.collectd_intelrdt_keys = settings.getValue(
+            'COLLECTD_INTELRDT_KEYS')
+        self.collectd_ovsstats_keys = settings.getValue(
+            'COLLECTD_OVSSTAT_KEYS')
+        self.collectd_dpdkstats_keys = settings.getValue(
+            'COLLECTD_DPDKSTAT_KEYS')
+        self.collectd_intelrdt_xkeys = settings.getValue(
+            'COLLECTD_INTELRDT_XKEYS')
+        self.exclude_coreids = []
+        # Expand the ranges in the intelrdt-xkeys
+        for xkey in self.collectd_intelrdt_xkeys:
+            if '-' not in xkey:
+                self.exclude_coreids.append(int(xkey))
+            else:
+                left, right = map(int, xkey.split('-'))
+                self.exclude_coreids += range(left, right + 1)
+
+    def run(self):
+        """
+        Start receiving the samples.
+        """
+        while not self.control.value:
+            try:
+                sample = self.q_of_samples.get(True, 1)
+                if not sample:
+                    break
+                self.handle(sample)
+            except queue.Empty:
+                pass
+            except IOError:
+                continue
+            except (ValueError, IndexError, KeyError, MemoryError):
+                self.stop()
+                break
+
+    # pylint: disable=too-many-boolean-expressions
+    def handle(self, sample):
+        ''' Store values and names if names matches following:
+            1. cpu + keys
+            2. processes + keys
+            3. interface + keys +  !xkeys
+            4. ovs_stats + keys
+            5. dpdkstat + keys
+            6. intel_rdt + keys + !xkeys
+            sample[1] is the name of the sample, which is . separated strings.
+            The first field in sample[1] is the type - cpu, proceesses, etc.
+            For intel_rdt, the second field contains the core-id, which is
+            used to make the decision on 'exclusions'
+            sample[0]: Contains the host information - which is not considered.
+            sample[2]: Contains the Value.
+            sample[3]: Contains the Time (in ticks)
+            '''
+        if (('cpu' in sample[1] and
+             any(c in sample[1] for c in self.collectd_cpu_keys)) or
+                ('processes' in sample[1] and
+                 any(p in sample[1] for p in self.collectd_processes_keys)) or
+                ('interface' in sample[1] and
+                 (any(i in sample[1] for i in self.collectd_iface_keys) and
+                  any(x not in sample[1]
+                      for x in self.collectd_iface_xkeys))) or
+                ('ovs_stats' in sample[1] and
+                 any(o in sample[1] for o in self.collectd_ovsstats_keys)) or
+                ('dpdkstat' in sample[1] and
+                 any(d in sample[1] for d in self.collectd_dpdkstats_keys)) or
+                ('intel_rdt' in sample[1] and
+                 any(r in sample[1] for r in self.collectd_intelrdt_keys) and
+                 (int(sample[1].split('.')[1]) not in self.exclude_coreids))):
+            if sample[1] not in self.pd_dict:
+                self.pd_dict[sample[1]] = list()
+            val = self.pd_dict[sample[1]]
+            val.append((sample[2], sample[3]))
+            self.pd_dict[sample[1]] = val
+
+    def stop(self):
+        """
+        Stop receiving the samples.
+        """
+        self.server.close()
+        self.q_of_samples.put(None)
+        self.control.value = True
+
+
+# inherit from collector.Icollector.
+class Collectd(collector.ICollector):
+    """A collector of system statistics based on collectd
+
+    It starts a UDP server, receives metrics from collectd
+    and plot the results.
+    """
+
+    def __init__(self, results_dir, test_name):
+        """
+        Initialize collection of statistics
+        """
+        self._log = os.path.join(results_dir,
+                                 settings.getValue('LOG_FILE_COLLECTD') +
+                                 '_' + test_name + '.log')
+        self.results = {}
+        self.sample_dict = multiprocessing.Manager().dict()
+        self.control = multiprocessing.Value('b', False)
+        self.receiver = Receiver(self.sample_dict, self.control)
+
+    def start(self):
+        """
+        Start receiving samples
+        """
+        self.receiver.server.start()
+        self.receiver.start()
+
+    def stop(self):
+        """
+        Stop receiving samples
+        """
+        self.control.value = True
+        self.receiver.stop()
+        self.receiver.server.join(5)
+        self.receiver.join(5)
+        if self.receiver.server.is_alive():
+            self.receiver.server.terminate()
+        if self.receiver.is_alive():
+            self.receiver.terminate()
+        self.results = copy.deepcopy(self.sample_dict)
+
+    def get_results(self):
+        """
+        Return the results.
+        """
+        return get_results_to_print(self.results)
+
+    def print_results(self):
+        """
+        Print - Plot and save raw-data.
+        log the collected statistics
+        """
+        plot_graphs(self.results)
+        proc_stats = get_results_to_print(self.results)
+        for process in proc_stats:
+            logging.info("Process: " + '_'.join(process.split('_')[:-1]))
+            for(key, value) in proc_stats[process].items():
+                logging.info("         Statistic: " + str(key) +
+                             ", Value: " + str(value))
diff --git a/tools/collectors/collectd/collectd_bucky.py b/tools/collectors/collectd/collectd_bucky.py
new file mode 100644
index 00000000..bac24ed7
--- /dev/null
+++ b/tools/collectors/collectd/collectd_bucky.py
@@ -0,0 +1,769 @@
+# Copyright 2014-2018 TRBS, Spirent Communications
+#
+# Licensed under the Apache License, Version 2.0 (the "License"); you may not
+# use this file except in compliance with the License. You may obtain a copy of
+# the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
+# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
+# License for the specific language governing permissions and limitations under
+# the License.
+
+# This file is a modified version of scripts present in bucky software
+# details of bucky can be found at https://github.com/trbs/bucky
+
+"""
+This module receives the samples from collectd, processes it and
+enqueues it in a format suitable for easy processing.
+It also handles secure communication with collectd.
+"""
+import copy
+import hmac
+import logging
+import multiprocessing
+import os
+import socket
+import struct
+import sys
+from hashlib import sha1, sha256
+
+from Crypto.Cipher import AES
+from conf import settings
+
+logging.basicConfig()
+LOG = logging.getLogger(__name__)
+
+
+class CollectdError(Exception):
+    """
+    Custom error class.
+    """
+    def __init__(self, mesg):
+        super(CollectdError, self).__init__(mesg)
+        self.mesg = mesg
+
+    def __str__(self):
+        return self.mesg
+
+
+class ConnectError(CollectdError):
+    """
+    Custom connect error
+    """
+    pass
+
+
+class ConfigError(CollectdError):
+    """
+    Custom config error
+    """
+    pass
+
+
+class ProtocolError(CollectdError):
+    """
+    Custom protocol error
+    """
+    pass
+
+
+class UDPServer(multiprocessing.Process):
+    """
+    Actual UDP server receiving collectd samples over network
+    """
+    def __init__(self, ip, port):
+        super(UDPServer, self).__init__()
+        self.daemon = True
+        addrinfo = socket.getaddrinfo(ip, port,
+                                      socket.AF_UNSPEC, socket.SOCK_DGRAM)
+        afamily, _, _, _, addr = addrinfo[0]
+        ip, port = addr[:2]
+        self.ip_addr = ip
+        self.port = port
+        self.sock = socket.socket(afamily, socket.SOCK_DGRAM)
+        self.sock.setsockopt(socket.SOL_SOCKET, socket.SO_REUSEADDR, 1)
+        try:
+            self.sock.bind((ip, port))
+            LOG.info("Bound socket socket %s:%s", ip, port)
+        except socket.error:
+            LOG.exception("Error binding socket %s:%s.", ip, port)
+            sys.exit(1)
+
+        self.sock_recvfrom = self.sock.recvfrom
+
+    def run(self):
+        """
+        Start receiving messages
+        """
+        recvfrom = self.sock_recvfrom
+        while True:
+            try:
+                data, addr = recvfrom(65535)
+            except (IOError, KeyboardInterrupt):
+                continue
+            addr = addr[:2]  # for compatibility with longer ipv6 tuples
+            if data == b'EXIT':
+                break
+            if not self.handle(data, addr):
+                break
+        try:
+            self.pre_shutdown()
+        except SystemExit:
+            LOG.exception("Failed pre_shutdown method for %s",
+                          self.__class__.__name__)
+
+    def handle(self, data, addr):
+        """
+        Handle the message.
+        """
+        raise NotImplementedError()
+
+    def pre_shutdown(self):
+        """ Pre shutdown hook """
+        pass
+
+    def close(self):
+        """
+        Close the communication
+        """
+        self.send('EXIT')
+
+    def send(self, data):
+        """
+        Send over the network
+        """
+        sock = socket.socket(socket.AF_INET, socket.SOCK_DGRAM)
+        if not isinstance(data, bytes):
+            data = data.encode()
+        sock.sendto(data, 0, (self.ip_addr, self.port))
+
+
+class CPUConverter(object):
+    """
+    Converter for CPU samples fom collectd.
+    """
+    PRIORITY = -1
+
+    def __call__(self, sample):
+        return ["cpu", sample["plugin_instance"], sample["type_instance"]]
+
+
+class InterfaceConverter(object):
+    """
+    Converter for Interface samples from collectd
+    """
+    PRIORITY = -1
+
+    def __call__(self, sample):
+        parts = []
+        parts.append("interface")
+        if sample.get("plugin_instance", ""):
+            parts.append(sample["plugin_instance"].strip())
+        stypei = sample.get("type_instance", "").strip()
+        if stypei:
+            parts.append(stypei)
+        stype = sample.get("type").strip()
+        if stype:
+            parts.append(stype)
+        vname = sample.get("value_name").strip()
+        if vname:
+            parts.append(vname)
+        return parts
+
+
+class MemoryConverter(object):
+    """
+    Converter for Memory samples from collectd
+    """
+    PRIORITY = -1
+
+    def __call__(self, sample):
+        return ["memory", sample["type_instance"]]
+
+
+class DefaultConverter(object):
+    """
+    Default converter for samples from collectd
+    """
+    PRIORITY = -1
+
+    def __call__(self, sample):
+        parts = []
+        parts.append(sample["plugin"].strip())
+        if sample.get("plugin_instance"):
+            parts.append(sample["plugin_instance"].strip())
+        stype = sample.get("type", "").strip()
+        if stype and stype != "value":
+            parts.append(stype)
+        stypei = sample.get("type_instance", "").strip()
+        if stypei:
+            parts.append(stypei)
+        vname = sample.get("value_name").strip()
+        if vname and vname != "value":
+            parts.append(vname)
+        return parts
+
+
+DEFAULT_CONVERTERS = {
+    "cpu": CPUConverter(),
+    "interface": InterfaceConverter(),
+    "memory": MemoryConverter(),
+    "_default": DefaultConverter(),
+}
+
+
+class CollectDTypes(object):
+    """
+    Class to handle the sample types. The types.db that comes
+    with collectd, usually, defines the various types.
+    """
+    def __init__(self, types_dbs=None):
+        if types_dbs is None:
+            types_dbs = []
+        dirs = ["/opt/collectd/share/collectd/types.db",
+                "/usr/local/share/collectd/types.db"]
+        self.types = {}
+        self.type_ranges = {}
+        if not types_dbs:
+            types_dbs = [tdb for tdb in dirs if os.path.exists(tdb)]
+            if not types_dbs:
+                raise ConfigError("Unable to locate types.db")
+        self.types_dbs = types_dbs
+        self._load_types()
+
+    def get(self, name):
+        """
+        Get the name of the type
+        """
+        t_name = self.types.get(name)
+        if t_name is None:
+            raise ProtocolError("Invalid type name: %s" % name)
+        return t_name
+
+    def _load_types(self):
+        """
+        Load all the types from types_db
+        """
+        for types_db in self.types_dbs:
+            with open(types_db) as handle:
+                for line in handle:
+                    if line.lstrip()[:1] == "#":
+                        continue
+                    if not line.strip():
+                        continue
+                    self._add_type_line(line)
+            LOG.info("Loaded collectd types from %s", types_db)
+
+    def _add_type_line(self, line):
+        """
+        Add types information
+        """
+        types = {
+            "COUNTER": 0,
+            "GAUGE": 1,
+            "DERIVE": 2,
+            "ABSOLUTE": 3
+        }
+        name, spec = line.split(None, 1)
+        self.types[name] = []
+        self.type_ranges[name] = {}
+        vals = spec.split(", ")
+        for val in vals:
+            vname, vtype, minv, maxv = val.strip().split(":")
+            vtype = types.get(vtype)
+            if vtype is None:
+                raise ValueError("Invalid value type: %s" % vtype)
+            minv = None if minv == "U" else float(minv)
+            maxv = None if maxv == "U" else float(maxv)
+            self.types[name].append((vname, vtype))
+            self.type_ranges[name][vname] = (minv, maxv)
+
+
+class CollectDParser(object):
+    """
+    Parser class: Implements the sample parsing operations.
+    The types definition defines the parsing process.
+    """
+    def __init__(self, types_dbs=None, counter_eq_derive=False):
+        if types_dbs is None:
+            types_dbs = []
+        self.types = CollectDTypes(types_dbs=types_dbs)
+        self.counter_eq_derive = counter_eq_derive
+
+    def parse(self, data):
+        """
+        Parse individual samples
+        """
+        for sample in self.parse_samples(data):
+            yield sample
+
+    def parse_samples(self, data):
+        """
+        Extract all the samples from the message.
+        """
+        types = {
+            0x0000: self._parse_string("host"),
+            0x0001: self._parse_time("time"),
+            0x0008: self._parse_time_hires("time"),
+            0x0002: self._parse_string("plugin"),
+            0x0003: self._parse_string("plugin_instance"),
+            0x0004: self._parse_string("type"),
+            0x0005: self._parse_string("type_instance"),
+            0x0006: None,  # handle specially
+            0x0007: self._parse_time("interval"),
+            0x0009: self._parse_time_hires("interval")
+        }
+        sample = {}
+        for (ptype, pdata) in self.parse_data(data):
+            if ptype not in types:
+                LOG.debug("Ignoring part type: 0x%02x", ptype)
+                continue
+            if ptype != 0x0006:
+                types[ptype](sample, pdata)
+                continue
+            for vname, vtype, val in self.parse_values(sample["type"], pdata):
+                sample["value_name"] = vname
+                sample["value_type"] = vtype
+                sample["value"] = val
+                yield copy.deepcopy(sample)
+
+    @staticmethod
+    def parse_data(data):
+        """
+        Parse the message
+        """
+        types = set([
+            0x0000, 0x0001, 0x0002, 0x0003, 0x0004,
+            0x0005, 0x0006, 0x0007, 0x0008, 0x0009,
+            0x0100, 0x0101, 0x0200, 0x0210
+        ])
+        while data:
+            if len(data) < 4:
+                raise ProtocolError("Truncated header.")
+            (part_type, part_len) = struct.unpack("!HH", data[:4])
+            data = data[4:]
+            if part_type not in types:
+                raise ProtocolError("Invalid part type: 0x%02x" % part_type)
+            part_len -= 4  # includes four header bytes we just parsed
+            if len(data) < part_len:
+                raise ProtocolError("Truncated value.")
+            part_data, data = data[:part_len], data[part_len:]
+            yield (part_type, part_data)
+
+    def parse_values(self, stype, data):
+        """
+        Parse the value of a particular type
+        """
+        types = {0: "!Q", 1: "<d", 2: "!q", 3: "!Q"}
+        (nvals,) = struct.unpack("!H", data[:2])
+        data = data[2:]
+        if len(data) != 9 * nvals:
+            raise ProtocolError("Invalid value structure length.")
+        vtypes = self.types.get(stype)
+        if nvals != len(vtypes):
+            raise ProtocolError("Values different than types.db info.")
+        for i in range(nvals):
+            vtype = data[i]
+            if vtype != vtypes[i][1]:
+                if self.counter_eq_derive and \
+                   (vtype, vtypes[i][1]) in ((0, 2), (2, 0)):
+                    # if counter vs derive don't break, assume server is right
+                    LOG.debug("Type mismatch (counter/derive) for %s/%s",
+                              stype, vtypes[i][0])
+                else:
+                    raise ProtocolError("Type mismatch with types.db")
+        data = data[nvals:]
+        for i in range(nvals):
+            vdata, data = data[:8], data[8:]
+            (val,) = struct.unpack(types[vtypes[i][1]], vdata)
+            yield vtypes[i][0], vtypes[i][1], val
+
+    @staticmethod
+    def _parse_string(name):
+        """
+        Parse string value
+        """
+        def _parser(sample, data):
+            """
+            Actual string parser
+            """
+            data = data.decode()
+            if data[-1] != '\0':
+                raise ProtocolError("Invalid string detected.")
+            sample[name] = data[:-1]
+        return _parser
+
+    @staticmethod
+    def _parse_time(name):
+        """
+        Parse time value
+        """
+        def _parser(sample, data):
+            """
+            Actual time parser
+            """
+            if len(data) != 8:
+                raise ProtocolError("Invalid time data length.")
+            (val,) = struct.unpack("!Q", data)
+            sample[name] = float(val)
+        return _parser
+
+    @staticmethod
+    def _parse_time_hires(name):
+        """
+        Parse time hires value
+        """
+        def _parser(sample, data):
+            """
+            Actual time hires parser
+            """
+            if len(data) != 8:
+                raise ProtocolError("Invalid hires time data length.")
+            (val,) = struct.unpack("!Q", data)
+            sample[name] = val * (2 ** -30)
+        return _parser
+
+
+class CollectDCrypto(object):
+    """
+    Handle the sercured communications with collectd daemon
+    """
+    def __init__(self):
+        sec_level = settings.getValue('COLLECTD_SECURITY_LEVEL')
+        if sec_level in ("sign", "SIGN", "Sign", 1):
+            self.sec_level = 1
+        elif sec_level in ("encrypt", "ENCRYPT", "Encrypt", 2):
+            self.sec_level = 2
+        else:
+            self.sec_level = 0
+        if self.sec_level:
+            self.auth_file = settings.getValue('COLLECTD_AUTH_FILE')
+            self.auth_db = {}
+            if self.auth_file:
+                self.load_auth_file()
+            if not self.auth_file:
+                raise ConfigError("Collectd security level configured but no "
+                                  "auth file specified in configuration")
+            if not self.auth_db:
+                LOG.warning("Collectd security level configured but no "
+                            "user/passwd entries loaded from auth file")
+
+    def load_auth_file(self):
+        """
+        Loading the authentication file.
+        """
+        try:
+            fil = open(self.auth_file)
+        except IOError as exc:
+            raise ConfigError("Unable to load collectd's auth file: %r" % exc)
+        self.auth_db.clear()
+        for line in fil:
+            line = line.strip()
+            if not line or line[0] == "#":
+                continue
+            user, passwd = line.split(":", 1)
+            user = user.strip()
+            passwd = passwd.strip()
+            if not user or not passwd:
+                LOG.warning("Found line with missing user or password")
+                continue
+            if user in self.auth_db:
+                LOG.warning("Found multiple entries for single user")
+            self.auth_db[user] = passwd
+        fil.close()
+        LOG.info("Loaded collectd's auth file from %s", self.auth_file)
+
+    def parse(self, data):
+        """
+        Parse the non-encrypted message
+        """
+        if len(data) < 4:
+            raise ProtocolError("Truncated header.")
+        part_type, part_len = struct.unpack("!HH", data[:4])
+        sec_level = {0x0200: 1, 0x0210: 2}.get(part_type, 0)
+        if sec_level < self.sec_level:
+            raise ProtocolError("Packet has lower security level than allowed")
+        if not sec_level:
+            return data
+        if sec_level == 1 and not self.sec_level:
+            return data[part_len:]
+        data = data[4:]
+        part_len -= 4
+        if len(data) < part_len:
+            raise ProtocolError("Truncated part payload.")
+        if sec_level == 1:
+            return self.parse_signed(part_len, data)
+        if sec_level == 2:
+            return self.parse_encrypted(part_len, data)
+
+    def parse_signed(self, part_len, data):
+        """
+        Parse the signed message
+        """
+
+        if part_len <= 32:
+            raise ProtocolError("Truncated signed part.")
+        sig, data = data[:32], data[32:]
+        uname_len = part_len - 32
+        uname = data[:uname_len].decode()
+        if uname not in self.auth_db:
+            raise ProtocolError("Signed packet, unknown user '%s'" % uname)
+        password = self.auth_db[uname].encode()
+        sig2 = hmac.new(password, msg=data, digestmod=sha256).digest()
+        if not self._hashes_match(sig, sig2):
+            raise ProtocolError("Bad signature from user '%s'" % uname)
+        data = data[uname_len:]
+        return data
+
+    def parse_encrypted(self, part_len, data):
+        """
+        Parse the encrypted message
+        """
+        if part_len != len(data):
+            raise ProtocolError("Enc pkt size disaggrees with header.")
+        if len(data) <= 38:
+            raise ProtocolError("Truncated encrypted part.")
+        uname_len, data = struct.unpack("!H", data[:2])[0], data[2:]
+        if len(data) <= uname_len + 36:
+            raise ProtocolError("Truncated encrypted part.")
+        uname, data = data[:uname_len].decode(), data[uname_len:]
+        if uname not in self.auth_db:
+            raise ProtocolError("Couldn't decrypt, unknown user '%s'" % uname)
+        ival, data = data[:16], data[16:]
+        password = self.auth_db[uname].encode()
+        key = sha256(password).digest()
+        pad_bytes = 16 - (len(data) % 16)
+        data += b'\0' * pad_bytes
+        data = AES.new(key, IV=ival, mode=AES.MODE_OFB).decrypt(data)
+        data = data[:-pad_bytes]
+        tag, data = data[:20], data[20:]
+        tag2 = sha1(data).digest()
+        if not self._hashes_match(tag, tag2):
+            raise ProtocolError("Bad checksum on enc pkt for '%s'" % uname)
+        return data
+
+    @staticmethod
+    def _hashes_match(val_a, val_b):
+        """Constant time comparison of bytes """
+        if len(val_a) != len(val_b):
+            return False
+        diff = 0
+        for val_x, val_y in zip(val_a, val_b):
+            diff |= val_x ^ val_y
+        return not diff
+
+
+class CollectDConverter(object):
+    """
+    Handle all conversions.
+    Coversion: Convert the sample received from collectd to an
+    appropriate format - for easy processing
+    """
+    def __init__(self):
+        self.converters = dict(DEFAULT_CONVERTERS)
+
+    def convert(self, sample):
+        """
+        Main conversion handling.
+        """
+        default = self.converters["_default"]
+        handler = self.converters.get(sample["plugin"], default)
+        try:
+            name_parts = handler(sample)
+            if name_parts is None:
+                return  # treat None as "ignore sample"
+            name = '.'.join(name_parts)
+        except (AttributeError, IndexError, MemoryError, RuntimeError):
+            LOG.exception("Exception in sample handler  %s (%s):",
+                          sample["plugin"], handler)
+            return
+        host = sample.get("host", "")
+        return (
+            host,
+            name,
+            sample["value_type"],
+            sample["value"],
+            int(sample["time"])
+        )
+
+    def _add_converter(self, name, inst, source="unknown"):
+        """
+        Add new converter types
+        """
+        if name not in self.converters:
+            LOG.info("Converter: %s from %s", name, source)
+            self.converters[name] = inst
+            return
+        kpriority = getattr(inst, "PRIORITY", 0)
+        ipriority = getattr(self.converters[name], "PRIORITY", 0)
+        if kpriority > ipriority:
+            LOG.info("Replacing: %s", name)
+            LOG.info("Converter: %s from %s", name, source)
+            self.converters[name] = inst
+            return
+        LOG.info("Ignoring: %s (%s) from %s (priority: %s vs %s)",
+                 name, inst, source, kpriority, ipriority)
+
+
+class CollectDHandler(object):
+    """Wraps all CollectD parsing functionality in a class"""
+
+    def __init__(self):
+        self.crypto = CollectDCrypto()
+        collectd_types = []
+        collectd_counter_eq_derive = False
+        self.parser = CollectDParser(collectd_types,
+                                     collectd_counter_eq_derive)
+        self.converter = CollectDConverter()
+        self.prev_samples = {}
+        self.last_sample = None
+
+    def parse(self, data):
+        """
+        Parse the samples from collectd
+        """
+        try:
+            data = self.crypto.parse(data)
+        except ProtocolError as error:
+            LOG.error("Protocol error in CollectDCrypto: %s", error)
+            return
+        try:
+            for sample in self.parser.parse(data):
+                self.last_sample = sample
+                stype = sample["type"]
+                vname = sample["value_name"]
+                sample = self.converter.convert(sample)
+                if sample is None:
+                    continue
+                host, name, vtype, val, time = sample
+                if not name.strip():
+                    continue
+                val = self.calculate(host, name, vtype, val, time)
+                val = self.check_range(stype, vname, val)
+                if val is not None:
+                    yield host, name, val, time
+        except ProtocolError as error:
+            LOG.error("Protocol error: %s", error)
+            if self.last_sample is not None:
+                LOG.info("Last sample: %s", self.last_sample)
+
+    def check_range(self, stype, vname, val):
+        """
+        Check the value range
+        """
+        if val is None:
+            return
+        try:
+            vmin, vmax = self.parser.types.type_ranges[stype][vname]
+        except KeyError:
+            LOG.error("Couldn't find vmin, vmax in CollectDTypes")
+            return val
+        if vmin is not None and val < vmin:
+            LOG.debug("Invalid value %s (<%s) for %s", val, vmin, vname)
+            LOG.debug("Last sample: %s", self.last_sample)
+            return
+        if vmax is not None and val > vmax:
+            LOG.debug("Invalid value %s (>%s) for %s", val, vmax, vname)
+            LOG.debug("Last sample: %s", self.last_sample)
+            return
+        return val
+
+    def calculate(self, host, name, vtype, val, time):
+        """
+        Perform calculations for handlers
+        """
+        handlers = {
+            0: self._calc_counter,  # counter
+            1: lambda _host, _name, v, _time: v,  # gauge
+            2: self._calc_derive,  # derive
+            3: self._calc_absolute  # absolute
+        }
+        if vtype not in handlers:
+            LOG.error("Invalid value type %s for %s", vtype, name)
+            LOG.info("Last sample: %s", self.last_sample)
+            return
+        return handlers[vtype](host, name, val, time)
+
+    def _calc_counter(self, host, name, val, time):
+        """
+        Calculating counter values
+        """
+        key = (host, name)
+        if key not in self.prev_samples:
+            self.prev_samples[key] = (val, time)
+            return
+        pval, ptime = self.prev_samples[key]
+        self.prev_samples[key] = (val, time)
+        if time <= ptime:
+            LOG.error("Invalid COUNTER update for: %s:%s", key[0], key[1])
+            LOG.info("Last sample: %s", self.last_sample)
+            return
+        if val < pval:
+            # this is supposed to handle counter wrap around
+            # see https://collectd.org/wiki/index.php/Data_source
+            LOG.debug("COUNTER wrap-around for: %s:%s (%s -> %s)",
+                      host, name, pval, val)
+            if pval < 0x100000000:
+                val += 0x100000000  # 2**32
+            else:
+                val += 0x10000000000000000  # 2**64
+        return float(val - pval) / (time - ptime)
+
+    def _calc_derive(self, host, name, val, time):
+        """
+        Calculating derived values
+        """
+        key = (host, name)
+        if key not in self.prev_samples:
+            self.prev_samples[key] = (val, time)
+            return
+        pval, ptime = self.prev_samples[key]
+        self.prev_samples[key] = (val, time)
+        if time <= ptime:
+            LOG.debug("Invalid DERIVE update for: %s:%s", key[0], key[1])
+            LOG.debug("Last sample: %s", self.last_sample)
+            return
+        return float(abs(val - pval)) / (time - ptime)
+
+    def _calc_absolute(self, host, name, val, time):
+        """
+        Calculating absolute values
+        """
+        key = (host, name)
+        if key not in self.prev_samples:
+            self.prev_samples[key] = (val, time)
+            return
+        _, ptime = self.prev_samples[key]
+        self.prev_samples[key] = (val, time)
+        if time <= ptime:
+            LOG.error("Invalid ABSOLUTE update for: %s:%s", key[0], key[1])
+            LOG.info("Last sample: %s", self.last_sample)
+            return
+        return float(val) / (time - ptime)
+
+
+class CollectDServer(UDPServer):
+    """Single processes CollectDServer"""
+
+    def __init__(self, queue):
+        super(CollectDServer, self).__init__(settings.getValue('COLLECTD_IP'),
+                                             settings.getValue('COLLECTD_PORT'))
+        self.handler = CollectDHandler()
+        self.queue = queue
+
+    def handle(self, data, addr):
+        for sample in self.handler.parse(data):
+            self.queue.put(sample)
+        return True
+
+    def pre_shutdown(self):
+        LOG.info("Sutting down CollectDServer")
+
+
+def get_collectd_server(queue):
+    """Get the collectd server """
+    server = CollectDServer
+    return server(queue)
author	Sridhar K. N. Rao <sridhar.rao@spirent.com>	2017-11-28 16:13:50 +0530
committer	Martin Klozik <martinx.klozik@intel.com>	2018-01-31 08:31:01 +0000
commit	23eff36d6a4b9e42ce06152e2b75e50fb7aaa5c5 (patch)
tree	45373add2d85256b9ca529f7921cc7aa754991a9 /tools/collectors/collectd
parent	a897b7bdc10e20db989d10ff7cdf8a14b5a5d517 (diff)