Source code for mentat.system

#!/usr/bin/env python3
# -*- coding: utf-8 -*-
#-------------------------------------------------------------------------------
# This file is part of Mentat system (https://mentat.cesnet.cz/).
#
# Copyright (C) since 2011 CESNET, z.s.p.o (http://www.ces.net/)
# Use of this source is governed by the MIT license, see LICENSE file.
#-------------------------------------------------------------------------------


"""
Mentat system management and inspection library.
"""


__author__ = "Jan Mach <jan.mach@cesnet.cz>"
__credits__ = "Pavel Kácha <pavel.kacha@cesnet.cz>, Andrea Kropáčová <andrea.kropacova@cesnet.cz>"


import os
import re
import datetime
import collections
import subprocess

import pyzenkit.jsonconf


#
# Real-time module status codes.
#
STATUS_RT_RUNNING_OK            = 0   # Module is running or service is OK
STATUS_RT_RUNNING_PF_MISSING    = 1   # Module is running, but pid file is missing
STATUS_RT_RUNNING_PID_MISSMATCH = 2   # Module is running, but pid file contains different PID
STATUS_RT_RUNNING_INCONSISTENT  = 10  # Module is running, but pid files are inconsistent
STATUS_RT_RUNNING_FEWER         = 11  # Module is running in fewer that required instances
STATUS_RT_RUNNING_MORE          = 12  # Module is running in more that required instances
STATUS_RT_DEAD_PF_EXISTS        = 3   # Module is dead and pid file exists
STATUS_RT_DEAD_LOCK_EXISTS      = 4   # Module is dead and lock file exists
STATUS_RT_NOT_RUNNING           = 5   # Module is not running
STATUS_RT_UNKNOWN               = 6   # Module or service status is unknown

# Overall module status messages
OVERALL_MODULE_STATUS_MESSAGES = {
    STATUS_RT_RUNNING_OK:            "All modules are running OK",
    STATUS_RT_RUNNING_PF_MISSING:    "All modules are running, but all pid files are missing",
    STATUS_RT_RUNNING_PID_MISSMATCH: "All modules are running, but all pid files contain different PID",
    STATUS_RT_RUNNING_INCONSISTENT:  "All modules are running, but all pid files are inconsistent",
    STATUS_RT_RUNNING_FEWER:         "All modules are running in fewer that required instances",
    STATUS_RT_RUNNING_MORE:          "All modules are running in more that required instances",
    STATUS_RT_DEAD_PF_EXISTS:        "All modules are dead and all pid files exist",
    STATUS_RT_DEAD_LOCK_EXISTS:      "All modules are dead and all lock files exist",
    STATUS_RT_NOT_RUNNING:           "All modules are not running",
    STATUS_RT_UNKNOWN:               "Some modules are in different state, overall system state is unknown",
}

#
# Cronjob module status codes.
#
STATUS_CJ_ENABLED  = 0   # Cronjob is enabled
STATUS_CJ_DISABLED = 5   # Cronjob is not running
STATUS_CJ_UNKNOWN  = 6   # Cronjob status is unknown

# Overall cronjob status messages
OVERALL_CRONJOB_STATUS_MESSAGES = {
    STATUS_CJ_ENABLED:  "All cronjobs are enabled",
    STATUS_CJ_DISABLED: "All cronjobs are disabled",
    STATUS_CJ_UNKNOWN:  "Some cronjobs are in different state, overall system state is unknown",
}

#
# Cronjob module status codes.
#
STATUS_ONLINE  = 0   # The whole system is online
STATUS_OFFLINE = 5   # The whole system is offline
STATUS_UNKNOWN = 6   # System overall status is unknown

# Overall cronjob status messages
OVERALL_STATUS_MESSAGES = {
    STATUS_ONLINE:  "All modules are running OK and all cronjobs are enabled",
    STATUS_OFFLINE: "All modules are NOT running and all cronjobs are disabled",
    STATUS_UNKNOWN: "Some modules and cronjobs are in different state, overall system state is unknown",
}


REGEXP_MENTAT_PS     = re.compile(r'\s*(\d+)\s+([^\s]+)\s+([^\s]*(?:python(?:\d+(?:\.\d+)?)?))\s+[^\s]+(mentat-[^\s]+)(?:\s+(.*))?')
"""Regular expression for selecting Mentat related processes."""
REGEXP_MENTAT_PIDF   = re.compile(r'(.+?)(?:\.([0-9a-fA-F]+))?\.pid$')
"""Regular expression for selecting Mentat related PID files."""
REGEXP_MENTAT_CRONF  = re.compile(r'(.+)\.cron$')
"""Regular expression for selecting Mentat related log files."""
REGEXP_MENTAT_LOGF   = re.compile(r'(.+)\.log$')
"""Regular expression for selecting Mentat related log files."""
REGEXP_MENTAT_RLOGF  = re.compile(r'(.+)(?:\.([0-9a-fA-F]+))?\.runlog$')
"""Regular expression for selecting Mentat related runlog files."""
REGEXP_MENTAT_CACHEF = re.compile(r'(.+)\.json$')
"""Regular expression for selecting Mentat related cache files."""


[docs]class MentatModule():
    """
    Class representing Mentat real-time module configuration for control utility.
    """
    def __init__(self, params):
        if 'exec' not in params:
            # raise pyzenkit.baseapp.ZenAppSetupException
            raise Exception("Module definition in configuration file is missing mandatory attribute 'exec'.")

        self.executable = params['exec']

        self.name    = params.get('name', self.executable)
        self.args    = params.get('args', [])
        self.paralel = params.get('paralel', False)
        self.count   = int(params.get('count', 0))

        if self.paralel and self.count <= 1:
            # raise pyzenkit.baseapp.ZenAppSetupException
            raise Exception("Module '{}' is configured to run in paralel and the 'count' attribute is missing or below '2'.".format(self.name))

    def __str__(self):
        return '{}'.format(self.name)

    def __repr__(self):
        return 'MentatModule(name={},executable={})'.format(self.name, self.executable)


[docs]class MentatCronjob():
    """
    Class representing Mentat cronjob module configuration for control utility.
    """
    def __init__(self, params):
        if 'name' not in params:
            # raise pyzenkit.baseapp.ZenAppSetupException
            raise Exception("Cronjob definition in configuration file is missing mandatory attribute 'name'.")

        self.name = params['name']

    def __str__(self):
        return '{}'.format(self.name)

    def __repr__(self):
        return 'MentatCronjob(name={})'.format(self.name)


[docs]def make_module_list(modules):
    """
    *Helper function*
    """
    result = collections.OrderedDict()
    for mod in modules:
        record = MentatModule(mod)
        result[record.name] = record
    return result

[docs]def make_cronjob_list(cronjobs):
    """
    *Helper function*
    """
    result = collections.OrderedDict()
    for mod in cronjobs:
        record = MentatCronjob(mod)
        result[record.name] = record
    return result

#-------------------------------------------------------------------------------


[docs]def analyze_process_ps(cmdline):
    """
    Analyze given process command line received from ``ps`` utility.

    Example of returned structure::

        {
            'args': None,
            'exec': 'mentat-storage.py',
            'name': 'mentat-storage.py',
            'paralel': False,
            'pid': 9349,
            'process': 'python3',
            'psline': '9349 python3 python3 /usr/local/bin/mentat-storage.py'
        }

    :param str cmdline: Command line as received from ``ps`` utility).
    :return: Structure containing parsed process information.
    :rtype: dict
    """
    match = REGEXP_MENTAT_PS.match(cmdline)
    if not match:
        return None
    if match.group(4) in ['mentat-controller.py']:
        return None

    record = {
        'process': match.group(2),
        'name':    match.group(4),
        'exec':    match.group(4),
        'args':    match.group(5),
        'pid':     int(match.group(1)),
        'psline':  cmdline,
        'paralel': False
    }

    # Attempt to parse command line arguments for selected data.
    if record['args']:
        # Attempt to parse custom name.
        match = re.search(r'--name(?: |=)([^\s]+)', record['args'])
        if match:
            record['name'] = match.group(1)

        # Attempt to detect paralel mode switch.
        match = re.search('--paralel', record['args'])
        if match:
            record['paralel'] = True

    return record

[docs]def analyze_process_list_ps():
    """
    Analyze all running processes using Linux`s ``ps`` utility.

    Processes are listed with following exact command::

        /bin/ps axo pid,comm,args | grep mentat | grep -v grep

    Only processes that match the internal regular expression are selected.

    Example of returned structure::

        {
            'mentat-enricher.py': {9356: {'args': None,
                                   'exec': 'mentat-enricher.py',
                                   'name': 'mentat-enricher.py',
                                   'paralel': False,
                                   'pid': 9356,
                                   'process': 'python3',
                                   'psline': '9356 python3 python3 /usr/local/bin/mentat-enricher.py'}},
            'mentat-inspector.py': {9362: {'args': None,
                                    'exec': 'mentat-inspector.py',
                                    'name': 'mentat-inspector.py',
                                    'paralel': False,
                                    'pid': 9362,
                                    'process': 'python3',
                                    'psline': '9362 python3 python3 /usr/local/bin/mentat-inspector.py'}},
            'mentat-storage.py': {9349: {'args': None,
                                  'exec': 'mentat-storage.py',
                                  'name': 'mentat-storage.py',
                                  'paralel': False,
                                  'pid': 9349,
                                  'process': 'python3',
                                  'psline': '9349 python3 python3 /usr/local/bin/mentat-storage.py'}}
        }

    :return: Structured dictionary containing information about selected processess.
    :rtype: dict
    """
    processes = collections.defaultdict(dict)
    with subprocess.Popen(['/bin/ps axo pid,comm,args | grep mentat | grep -v grep'], stdout = subprocess.PIPE, shell = True) as proc:
        for psline in proc.stdout:
            psline = psline.rstrip()
            psline = psline.decode('utf-8')

            record = analyze_process_ps(psline)
            if not record:
                continue

            processes[record['name']][record['pid']] = record
    return dict(processes)

[docs]def analyze_pid_file(pid_file, pid_file_path):
    """
    Analyze given PID file.

    Example of returned structure::

        {
            'atime': datetime.datetime(2018, 1, 23, 8, 25, 16, 439742),
            'file': 'mentat-storage.py.pid',
            'mtime': datetime.datetime(2018, 1, 23, 8, 25, 12, 943727),
            'name': 'mentat-storage.py',
            'paralel': False,
            'path': '/var/mentat/run/mentat-storage.py.pid',
            'pid': 9349,
            'size': 5
        }

    :param str pid_file: Basename of the PID file.
    :param str pid_file_path: Full path to the PID file.
    :return: Structure containing parsed PID file information.
    :rtype: dict
    """
    try:
        match = REGEXP_MENTAT_PIDF.match(pid_file)
        if not match:
            return None

        pid = None
        with open(pid_file_path, 'r', encoding="utf8") as pidf:
            pid = pidf.read()
        pid = int(pid)

        fsstat = os.stat(pid_file_path)
        return {
            'name':    match.group(1),
            'file':    pid_file,
            'path':    pid_file_path,
            'pid':     int(pid),
            'paralel': bool(match.group(2)),
            'size':    fsstat.st_size,
            'atime':   datetime.datetime.utcfromtimestamp(fsstat.st_atime),
            'mtime':   datetime.datetime.utcfromtimestamp(fsstat.st_mtime)
        }
    except Exception:
        return None

[docs]def analyze_pid_files(pid_dir_path):
    """
    Analyze all PID files in given run directory.

    Example of returned structure::

        {
            'mentat-enricher.py': {9356: {'atime': datetime.datetime(2018, 1, 23, 8, 25, 16, 439742),
                                          'file': 'mentat-enricher.py.pid',
                                          'mtime': datetime.datetime(2018, 1, 23, 8, 25, 14, 319733),
                                          'name': 'mentat-enricher.py',
                                          'paralel': False,
                                          'path': '/var/mentat/run/mentat-enricher.py.pid',
                                          'pid': 9356,
                                          'size': 5}},
            'mentat-inspector.py': {9362: {'atime': datetime.datetime(2018, 1, 23, 8, 25, 16, 439742),
                                           'file': 'mentat-inspector.py.pid',
                                           'mtime': datetime.datetime(2018, 1, 23, 8, 25, 14, 947736),
                                           'name': 'mentat-inspector.py',
                                           'paralel': False,
                                           'path': '/var/mentat/run/mentat-inspector.py.pid',
                                           'pid': 9362,
                                           'size': 5}},
            'mentat-storage.py': {9349: {'atime': datetime.datetime(2018, 1, 23, 8, 25, 16, 439742),
                                         'file': 'mentat-storage.py.pid',
                                         'mtime': datetime.datetime(2018, 1, 23, 8, 25, 12, 943727),
                                         'name': 'mentat-storage.py',
                                         'paralel': False,
                                         'path': '/var/mentat/run/mentat-storage.py.pid',
                                         'pid': 9349,
                                         'size': 5}}
        }

    :param str pid_dir_path: path to directory containing PID files.
    :return: Structure containing parsed information for all PID files.
    :rtype: dict
    """
    pid_files = collections.defaultdict(dict)

    all_files = os.listdir(pid_dir_path)
    for pid_file in all_files:
        pid_file_path = os.path.join(pid_dir_path, pid_file)
        if not os.path.isfile(pid_file_path):
            continue

        record = analyze_pid_file(pid_file, pid_file_path)
        if not record:
            continue

        pid_files[record['name']][record['pid']] = record
    return dict(pid_files)

[docs]def analyze_cron_file(cron_file, cron_file_path, cron_links):
    """
    Analyze given cron file.

    Example of returned structure::

        {
            'atime': datetime.datetime(2018, 1, 21, 9, 13, 48, 34648),
            'file': 'mentat-statistician-py.cron',
            'link': None,
            'mtime': datetime.datetime(2017, 7, 19, 10, 25, 30),
            'name': 'mentat-statistician-py',
            'path': '/etc/mentat/cron/mentat-statistician-py.cron',
            'size': 429
        }

    :param str cron_file: Basename of the cron file.
    :param str cron_file_path: Full path to the cron file.
    :param dict cron_links: Dictionary containing existing links in cron directory.
    :return: Structure containing parsed cron file information.
    :rtype: dict
    """
    try:
        match = REGEXP_MENTAT_CRONF.match(cron_file)
        if not match:
            return None

        fsstat = os.stat(cron_file_path)
        return {
            'name':  match.group(1),
            'file':  cron_file,
            'path':  cron_file_path,
            'size':  fsstat.st_size,
            'atime': datetime.datetime.utcfromtimestamp(fsstat.st_atime),
            'mtime': datetime.datetime.utcfromtimestamp(fsstat.st_mtime),
            'link':  cron_links.get(cron_file_path, None)
        }
    except Exception:
        return None

[docs]def analyze_cron_files(cfg_dir_path, cron_dir_path):
    """
    Analyze all cron files in config and cron directory.

    Example of returned structure::

        {
            'mentat-precache-py': {'atime': datetime.datetime(2018, 1, 21, 9, 13, 45),
                                   'file': 'mentat-precache-py.cron',
                                   'link': None,
                                   'mtime': datetime.datetime(2017, 9, 1, 11, 10, 17),
                                   'name': 'mentat-precache-py',
                                   'path': '/etc/mentat/cron/mentat-precache-py.cron',
                                   'size': 417},
            'mentat-statistician-py': {'atime': datetime.datetime(2018, 1, 21, 9, 13, 48, 34648),
                                       'file': 'mentat-statistician-py.cron',
                                       'link': None,
                                       'mtime': datetime.datetime(2017, 7, 19, 10, 25, 30),
                                       'name': 'mentat-statistician-py.cron',
                                       'path': '/etc/mentat/cron/mentat-statistician-py.cron',
                                       'size': 429}
        }

    :param str cfg_dir_path: Path to configuration directory containing cron scripts.
    :param str cron_dir_path: Path to system cron directory.
    :return: Structure containing parsed cron file information.
    :rtype: dict
    """
    cron_files = {}
    cron_links = {}

    crn_all_files = os.listdir(cron_dir_path)
    for cron_file in crn_all_files:
        cron_file_path = os.path.join(cron_dir_path, cron_file)
        if not os.path.islink(cron_file_path):
            continue
        cron_links[os.readlink(cron_file_path)] = cron_file_path

    cfg_all_files = os.listdir(cfg_dir_path)
    for cron_file in cfg_all_files:
        cron_file_path = os.path.join(cfg_dir_path, cron_file)
        if not os.path.isfile(cron_file_path):
            continue

        record = analyze_cron_file(cron_file, cron_file_path, cron_links)
        if not record:
            continue

        cron_files[record['name']] = record
    return cron_files

[docs]def analyze_log_file(log_file, log_file_path):
    """
    Analyze given log file.

    Example of returned structure::

        {
            'atime': datetime.datetime(2018, 1, 22, 15, 11, 15, 562358),
            'file': 'mentat-storage.py.log',
            'mtime': datetime.datetime(2018, 1, 23, 9, 8, 43, 403734),
            'name': 'mentat-storage.py',
            'path': '/var/mentat/log/mentat-storage.py.log',
            'size': 5831678
        }

    :param str log_file: Basename of the log file.
    :param str log_file_path: Full path to the log file.
    :return: Structure containing parsed log file information.
    :rtype: dict
    """
    try:
        match = REGEXP_MENTAT_LOGF.match(log_file)
        if not match:
            return None

        fsstat = os.stat(log_file_path)
        return {
            'name':  match.group(1),
            'file':  log_file,
            'path':  log_file_path,
            'size':  fsstat.st_size,
            'atime': datetime.datetime.utcfromtimestamp(fsstat.st_atime),
            'mtime': datetime.datetime.utcfromtimestamp(fsstat.st_mtime)
        }
    except Exception:
        return None

[docs]def analyze_log_files(log_dir_path):
    """
    Analyze all PID files in run directory.

    Example of returned structure::

        {
            'mentat-enricher.py': {'atime': datetime.datetime(2018, 1, 9, 12, 25, 26, 338720),
                                   'file': 'mentat-enricher.py.log',
                                   'mtime': datetime.datetime(2018, 1, 23, 9, 8, 38, 163710),
                                   'name': 'mentat-enricher.py',
                                   'path': '/var/mentat/log/mentat-enricher.py.log',
                                   'size': 6057586},
            'mentat-inspector.py': {'atime': datetime.datetime(2018, 1, 18, 17, 5, 22, 734164),
                                    'file': 'mentat-inspector.py.log',
                                    'mtime': datetime.datetime(2018, 1, 23, 9, 8, 35, 291697),
                                    'name': 'mentat-inspector.py',
                                    'path': '/var/mentat/log/mentat-inspector.py.log',
                                    'size': 8156449},
            'mentat-storage.py': {'atime': datetime.datetime(2018, 1, 22, 15, 11, 15, 562358),
                                  'file': 'mentat-storage.py.log',
                                  'mtime': datetime.datetime(2018, 1, 23, 9, 8, 43, 403734),
                                  'name': 'mentat-storage.py',
                                  'path': '/var/mentat/log/mentat-storage.py.log',
                                  'size': 5831678}
        }

    :param str log_dir_path: Path to directory containing log files.
    :return: Structure containing parsed log file information.
    :rtype: dict
    """
    log_files = {}

    all_files = os.listdir(log_dir_path)
    for log_file in all_files:
        log_file_path = os.path.join(log_dir_path, log_file)
        if not os.path.isfile(log_file_path):
            continue

        record = analyze_log_file(log_file, log_file_path)
        if not record:
            continue

        log_files[record['name']] = record
    return log_files

[docs]def analyze_runlog_file(runlog_file, runlog_file_path):
    """
    Analyze given runlog file.

    Example of returned structure::

        {
            'atime': datetime.datetime(2018, 1, 22, 16, 33, 56, 766819),
            'data': {...},
            'file': '201801221611.runlog',
            'mtime': datetime.datetime(2018, 1, 22, 15, 30, 0, 427902),
            'name': '201801221611',
            'path': '/var/mentat/run/mentat-storage.py/201801221611.runlog',
            'size': 1209
        }

    :param str runlog_file: Basename of the runlog file.
    :param str runlog_file_path: Full path to the runlog file.
    :return: Structure containing parsed runlog file information.
    :rtype: dict
    """
    try:
        match = REGEXP_MENTAT_RLOGF.match(runlog_file)
        if not match:
            return None

        fsstat = os.stat(runlog_file_path)
        return {
            'name':  match.group(1),
            'file':  runlog_file,
            'path':  runlog_file_path,
            'size':  fsstat.st_size,
            'atime': datetime.datetime.utcfromtimestamp(fsstat.st_atime),
            'mtime': datetime.datetime.utcfromtimestamp(fsstat.st_mtime),
            'data':  pyzenkit.jsonconf.json_load(runlog_file_path)
        }
    except Exception:
        return None

[docs]def analyze_runlog_files(run_dir_path, limit = None):
    """
    Analyze all runlog files in run directory.

    :param str run_dir_path: Path to directory containing run files.
    :return: Structure containing parsed runlog file information.
    :rtype: dict
    """
    runlog_files = collections.defaultdict(dict)

    all_files = os.listdir(run_dir_path)
    for runlog_dir in all_files:
        runlog_dir_path = os.path.join(run_dir_path, runlog_dir)
        if not os.path.isdir(runlog_dir_path):
            continue

        all_rl_files = sorted(os.listdir(runlog_dir_path), reverse = True)
        file_counter = 0
        for runlog_file in all_rl_files:
            runlog_file_path = os.path.join(runlog_dir_path, runlog_file)
            if not os.path.isfile(runlog_file_path):
                continue

            record = analyze_runlog_file(runlog_file, runlog_file_path)
            if not record:
                continue

            file_counter += 1
            if limit and file_counter > limit:
                break

            runlog_files[runlog_dir][record['name']] = record
    return dict(runlog_files)

[docs]def analyze_cache_file(cache_file, cache_file_path):
    """
    Analyze given cache file.

    Example of returned structure::

        {
            'atime': datetime.datetime(2018, 1, 22, 15, 11, 15, 562358),
            'file': 'itemset-stat-detectors.json',
            'mtime': datetime.datetime(2018, 1, 23, 9, 8, 43, 403734),
            'name': 'itemset-stat-detectors',
            'path': '/var/mentat/cache/itemset-stat-detectors.json',
            'size': 5831678
        }

    :param str cache_file: Basename of the cache file.
    :param str cache_file_path: Full path to the cache file.
    :return: Structure containing parsed cache file information.
    :rtype: dict
    """
    try:
        match = REGEXP_MENTAT_CACHEF.match(cache_file)
        if not match:
            return None

        fsstat = os.stat(cache_file_path)
        return {
            'name':  match.group(1),
            'file':  cache_file,
            'path':  cache_file_path,
            'size':  fsstat.st_size,
            'atime': datetime.datetime.utcfromtimestamp(fsstat.st_atime),
            'mtime': datetime.datetime.utcfromtimestamp(fsstat.st_mtime),
            'data':  pyzenkit.jsonconf.json_load(cache_file_path)
        }
    except Exception:
        return None

[docs]def analyze_cache_files(cache_dir_path):
    """
    Analyze all cache files in cache directory.

    Example of returned structure::

        {
            'itemset-stat-detectors': {'atime': datetime.datetime(2018, 1, 9, 12, 25, 26, 338720),
                                       'file': 'itemset-stat-detectors.json',
                                       'mtime': datetime.datetime(2018, 1, 23, 9, 8, 38, 163710),
                                       'name': 'mentat-enricher.py',
                                       'path': '/var/mentat/cache/itemset-stat-detectors.json',
                                       'size': 6057586,
                                       'data': {...}}
        }

    :param str cache_dir_path: Path to directory containing cache files.
    :return: Structure containing parsed cache file information.
    :rtype: dict
    """
    cache_files = {}

    all_files = os.listdir(cache_dir_path)
    for cache_file in all_files:
        cache_file_path = os.path.join(cache_dir_path, cache_file)
        if not os.path.isfile(cache_file_path):
            continue

        record = analyze_cache_file(cache_file, cache_file_path)
        if not record:
            continue

        cache_files[record['name']] = record
    return cache_files

#-------------------------------------------------------------------------------


[docs]def module_status(mod_data, pidf_data, proc_data, overall_status):
    """
    Analyze status of given module.
    """
    # Check the consistency of running processes and pid files.
    consistent = True
    if pidf_data:
        for pid in pidf_data.keys():
            if not proc_data or not pid in proc_data:
                overall_status['messages']['error'].append((
                    "Process '{}' is dead, but pid file '{}' exists".format(
                        pid,
                        pidf_data[pid]['path']
                    ),
                    'pidfile',
                    pidf_data[pid]['path']
                ))
                consistent = False
    if proc_data:
        for pid in proc_data.keys():
            if not pidf_data or not pid in pidf_data:
                overall_status['messages']['error'].append((
                    "Process '{}':'{}' is running, but  pid file is missing".format(
                        pid,
                        proc_data[pid]['name']
                    ),
                    'process',
                    pid
                ))
                consistent = False

    # PID file exists and process is running.
    if pidf_data and proc_data:

        # Check the number of running processes
        if mod_data.paralel:
            if mod_data.count > len(proc_data.keys()):
                return (
                    STATUS_RT_RUNNING_FEWER,
                    "There are fewer instances running than required ({}:{})".format(mod_data.count, len(proc_data.keys()))
                )
            if mod_data.count < len(proc_data.keys()):
                return (
                    STATUS_RT_RUNNING_MORE,
                    "There are more instances running than required ({}:{})".format(mod_data.count, len(proc_data.keys()))
                )

        # Process is running or service is OK
        if consistent:
            return (
                STATUS_RT_RUNNING_OK,
                "Process is running or service is OK ({})".format(len(proc_data.keys()))
            )
        return (
            STATUS_RT_RUNNING_INCONSISTENT,
            "Process is running in inconsistent state"
        )

    # PID file(s) exist(s) and any process is not running
    if pidf_data:
        if mod_data.paralel:
            return (
                STATUS_RT_DEAD_PF_EXISTS,
                "Processes are dead, but some pid files exist"
            )
        return (
            STATUS_RT_DEAD_PF_EXISTS,
            "Process is dead, but pid file exist"
        )

    # PID file(s) do(es) not exist, but some process is running
    if proc_data:
        if mod_data.paralel:
            return (
                STATUS_RT_RUNNING_PF_MISSING,
                "Processes are running, but pid files are missing"
            )
        return (
            STATUS_RT_RUNNING_PF_MISSING,
            "Process is running, but pid file is missing"
        )

    # Process is not running
    return (
        STATUS_RT_NOT_RUNNING,
        "Process is not running or service is stopped"
    )

    # TODO: Process is dead and /var/lock lock file exists
    #return STATUS_RT_DEAD_LOCK_EXISTS
    # TODO: Process or service status is unknown
    #return STATUS_RT_UNKNOWN

[docs]def cronjob_status(cronj_data, cronf_data, overall_status):
    """
    Analyze status of given cron module.
    """
    if cronf_data and cronf_data['link']:
        return (
            STATUS_CJ_ENABLED,
            "Cronjob is enabled"
        )
    return (
        STATUS_CJ_DISABLED,
        "Cronjob is disabled"
    )

[docs]def system_status(modules, cronjobs, cfg_dir_path, cron_dir_path, log_dir_path, run_dir_path):
    """
    Analyze status of all modules and cronjobs and detect additional problems.
    """
    status = {}
    status['dt']           = datetime.datetime.utcnow()
    status['modules']      = {}
    status['cronjobs']     = {}
    status['messages']     = {'info': [], 'notice': [], 'warning': [], 'error': []}
    status['processes']    = analyze_process_list_ps()
    status['pid_files']    = analyze_pid_files(run_dir_path)
    status['log_files']    = analyze_log_files(log_dir_path)
    status['runlog_files'] = analyze_runlog_files(run_dir_path, limit = 1)
    status['cron_files']   = analyze_cron_files(os.path.join(cfg_dir_path, 'cron'), cron_dir_path)
    status['resultm']      = None
    status['resultc']      = None
    status['result']       = None


    # A) Analyze status of configured modules.
    for mname, mdata in modules.items():
        status['modules'][mname] = module_status(
            mdata,
            status['pid_files'].get(mname, None),
            status['processes'].get(mname, None),
            status
        )

    # B) Analyze status of configured cronjob modules.
    for mname, mdata in cronjobs.items():
        status['cronjobs'][mname] = cronjob_status(
            mdata,
            status['cron_files'].get(mname, None),
            status
        )

    # -----

    _analyze_unconfigured_pid_files(status, modules)
    _analyze_unconfigured_modules(status, modules)
    _analyze_unconfigured_cronjobs(status, cronjobs)

    # -----

    # Determine overall status of real-time processing modules.
    for mname, mstatus in status['modules'].items():
        if not status['resultm']:
            status['resultm'] = (mstatus[0], OVERALL_MODULE_STATUS_MESSAGES[mstatus[0]])
        elif status['resultm'][0] != mstatus[0]:
            status['resultm'] = (STATUS_RT_UNKNOWN, OVERALL_MODULE_STATUS_MESSAGES[STATUS_RT_UNKNOWN])
    if not status['resultm']:
        status['resultm'] = (STATUS_RT_NOT_RUNNING, OVERALL_MODULE_STATUS_MESSAGES[STATUS_RT_NOT_RUNNING])

    # Determine overall status of cronjob modules.
    for mname, mstatus in status['cronjobs'].items():
        if not status['resultc']:
            status['resultc'] = (mstatus[0], OVERALL_CRONJOB_STATUS_MESSAGES[mstatus[0]])
        elif status['resultc'][0] != mstatus[0]:
            status['resultc'] = (STATUS_CJ_UNKNOWN, OVERALL_CRONJOB_STATUS_MESSAGES[STATUS_CJ_UNKNOWN])
    if not status['resultc']:
        status['resultc'] = (STATUS_CJ_DISABLED, OVERALL_CRONJOB_STATUS_MESSAGES[STATUS_CJ_DISABLED])

    # Determine overall status of the whole system.
    if status['resultm'][0] != status['resultc'][0]:
        status['result'] = (STATUS_UNKNOWN, OVERALL_STATUS_MESSAGES[STATUS_UNKNOWN])
    else:
        status['result'] = (status['resultm'][0], OVERALL_STATUS_MESSAGES[status['resultm'][0]])

    return status

[docs]def analyze_versions():
    """
    Analyze versions of various relevant dependencies (like PostgreSQL, ...).
    """
    result = {}

    out = subprocess.check_output(['psql','-V'])
    result['postgresql'] = out.decode('utf-8').strip()

    return result

#-------------------------------------------------------------------------------

def _analyze_unconfigured_pid_files(status, modules):
    """
    Analyze list of all PID files and find any that do not belong to known modules.
    """
    for mname in sorted(status['pid_files'].keys()):
        if mname in modules:
            continue
        for pid in sorted(status['pid_files'][mname].keys()):
            status['messages']['info'].append((
                "Unknown pid file '{}' for PID '{}'".format(
                    status['pid_files'][mname][pid]['path'],
                    pid
                ),
                'pidfile',
                status['pid_files'][mname][pid]['path']
            ))

def _analyze_unconfigured_modules(status, modules):
    """
    Analyze list of all processes files and find any that do not belong to known modules.
    """
    for mname in sorted(status['processes'].keys()):
        if mname in modules:
            continue
        for pid in sorted(status['processes'][mname].keys()):
            status['messages']['info'].append((
                "Unknown process '{}' with PID '{}'".format(
                    status['processes'][mname][pid]['exec'],
                    pid
                ),
                'pidfile',
                pid
            ))

def _analyze_unconfigured_cronjobs(status, cronjobs):
    """
    Analyze list of all cron files and find any that do not belong to known cronjob
    modules.
    """
    for mname in sorted(status['cron_files'].keys()):
        if mname in cronjobs:
            continue
        if status['cron_files'][mname]['link']:
            status['messages']['info'].append((
                "Unconfigured cron file '{}' for cron module '{}'".format(
                    status['cron_files'][mname]['link'],
                    status['cron_files'][mname]['path']
                ),
                'cronfile',
                status['cron_files'][mname]['path']
            ))