Source code for ionosphere.ionosphere

from __future__ import division
import logging
import os
from os import kill, getpid, listdir
from os.path import join, isfile
from sys import version_info
try:
    from Queue import Empty
except ImportError:
    from queue import Empty
from time import time, sleep
from threading import Thread
# @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
# Use Redis sets in place of Manager().list to reduce memory and number of
# processes
# from multiprocessing import Process, Manager
from multiprocessing import Process
import re
from shutil import rmtree
# import csv
from ast import literal_eval
from datetime import datetime

from redis import StrictRedis
import traceback
import mysql.connector
# from mysql.connector import errorcode

from sqlalchemy.sql import select

# @added 20180715 - Task #2446: Optimize Ionosphere
#                   Branch #2270: luminosity
from sqlalchemy.sql import desc

# @added 20161213 - Branch #1790: test_tsfresh
# To match the new order introduced via the test_tsfresh method
import numpy as np
# import pandas as pd

# @added 20170107 - Feature #1852: Ionosphere - features_profile matched graphite graphs
#                   Feature #1844: ionosphere_matched DB table
from tsfresh import __version__ as tsfresh_version

# @added 20170809 - Task #2132: Optimise Ionosphere DB usage
from pymemcache.client.base import Client as pymemcache_Client

# @added 20180617 - Feature #2404: Ionosphere - fluid approximation
import pandas as pd
from tsfresh.feature_extraction import (
    extract_features, ReasonableFeatureExtractionSettings)

import settings
from skyline_functions import (
    fail_check, mysql_select, write_data_to_file, send_graphite_metric,
    # @added 20170825 - Task #2132: Optimise Ionosphere DB usage
    # @modified 20190408 - Feature #2484: FULL_DURATION feature profiles
    # Moved to common_functions
    # get_memcache_metric_object)
    mkdir_p)

# @added 20161221 - calculate features for every anomaly, instead of making the
# user do it in the frontend or calling the webapp constantly in a cron like
# manner.  Decouple Ionosphere from the webapp.
from features_profile import calculate_features_profile

# @modified 20170107 - Feature #1844: ionosphere_matched DB table
# Added ionosphere_matched_meta
from database import (
    get_engine, ionosphere_table_meta,
    # @added 20170825 - Task #2132: Optimise Ionosphere DB usage
    # @modified 20190408 - Feature #2484: FULL_DURATION feature profiles
    # Moved to common_functions
    # metrics_table_meta,
    ionosphere_matched_table_meta)
from tsfresh_feature_names import TSFRESH_FEATURES

# @added 20170114 - Feature #1854: Ionosphere learn
# @modified 20170117 - Feature #1854: Ionosphere learn - generations
# Renamed the function from simple learn to the meme it has become
# from learn import learn
from learn import ionosphere_learn

# @added 20170306 - Feature #1960: ionosphere_layers
from layers import run_layer_algorithms

# @added 20190322 - Feature #2484: FULL_DURATION feature profiles
from common_functions import (
    get_metrics_db_object, get_calculated_features)
# @added 20190327 - Feature #2484
from echo import ionosphere_echo

skyline_app = 'ionosphere'
skyline_app_logger = '%sLog' % skyline_app
logger = logging.getLogger(skyline_app_logger)
skyline_app_logfile = '%s/%s.log' % (settings.LOG_PATH, skyline_app)
skyline_app_loglock = '%s.lock' % skyline_app_logfile
skyline_app_logwait = '%s.wait' % skyline_app_logfile

python_version = int(version_info[0])

this_host = str(os.uname()[1])

# Converting one settings variable into a local variable, just because it is a
# long string otherwise.
try:
    ENABLE_IONOSPHERE_DEBUG = settings.ENABLE_IONOSPHERE_DEBUG
except:
    logger.error('error :: cannot determine ENABLE_IONOSPHERE_DEBUG from settings')
    ENABLE_IONOSPHERE_DEBUG = False

try:
    SERVER_METRIC_PATH = '.%s' % settings.SERVER_METRICS_NAME
    if SERVER_METRIC_PATH == '.':
        SERVER_METRIC_PATH = ''
except:
    SERVER_METRIC_PATH = ''

# @added 20180819 - Task #2526: Hard code IONOSPHERE_PROCESSES to 1
# Number of processes to assign to Ionosphere, however Ionosphere should never
# need more than 1 and is effectively hard coded as such currently.  This
# variable is only declared for the purpose of maintaining a standard set up in
# each module and to possibly enable more than one processor on Ionosphere in
# the future, should there be a requirement for Ionosphere to analyse the
# metrics quicker.  Running Ionosphere with more than one process is untested
# and currently it is hard coded to be 1
# (https://github.com/earthgecko/skyline/issues/69)
try:
    IONOSPHERE_PROCESSES = settings.IONOSPHERE_PROCESSES
    if IONOSPHERE_PROCESSES != 1:
        IONOSPHERE_PROCESSES = 1
except:
    IONOSPHERE_PROCESSES = 1

# @added 20190524 - Bug #3050: Ionosphere - Skyline and Graphite feedback
# Do not run checks if the namespace has matched multiple times in the
# last 10 minutes.  However it is quite difficult to ascertain which
# Skyline related metrics are feeding back, so use the ionosphere_busy
# logic again, use or find the Skyline host namespace and do not analyse
# the Skyline host namespace while Ionosphere is busy.
try:
    SKYLINE_FEEDBACK_NAMESPACES = settings.SKYLINE_FEEDBACK_NAMESPACES
except:
    # Let us take a guess
    try:
        graphite_host = settings.GRAPHITE_HOST
        graphite_hostname = graphite_host.split('.', -1)[0]
        SKYLINE_FEEDBACK_NAMESPACES = [settings.SERVER_METRICS_NAME, graphite_hostname]
    except:
        SKYLINE_FEEDBACK_NAMESPACES = [this_host]
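
# An illustrative example of the fallback guess above (hypothetical values):
# with settings.SERVER_METRICS_NAME = 'skyline-1' and
# settings.GRAPHITE_HOST = 'graphite.example.com', the first hostname label
# is taken, giving:
#
#     SKYLINE_FEEDBACK_NAMESPACES = ['skyline-1', 'graphite']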

skyline_app_graphite_namespace = 'skyline.%s%s' % (skyline_app, SERVER_METRIC_PATH)

max_age_seconds = settings.IONOSPHERE_CHECK_MAX_AGE

# Database configuration
config = {'user': settings.PANORAMA_DBUSER,
          'password': settings.PANORAMA_DBUSERPASS,
          'host': settings.PANORAMA_DBHOST,
          'port': settings.PANORAMA_DBPORT,
          'database': settings.PANORAMA_DATABASE,
          'raise_on_warnings': True}

failed_checks_dir = '%s_failed' % settings.IONOSPHERE_CHECK_PATH
last_purge_key = '%s.last_purge_ts' % skyline_app

LOCAL_DEBUG = False


class Ionosphere(Thread):
    """
    The Ionosphere class which controls the ionosphere thread and spawned
    processes.
    """

    def __init__(self, parent_pid):
        """
        Initialize Ionosphere

        Define Redis and memcached connections
        """
        super(Ionosphere, self).__init__()
        # @modified 20180519 - Feature #2378: Add redis auth to Skyline and rebrow
        if settings.REDIS_PASSWORD:
            self.redis_conn = StrictRedis(
                password=settings.REDIS_PASSWORD,
                unix_socket_path=settings.REDIS_SOCKET_PATH)
        else:
            self.redis_conn = StrictRedis(unix_socket_path=settings.REDIS_SOCKET_PATH)
        self.daemon = True
        self.parent_pid = parent_pid
        self.current_pid = getpid()
        self.mysql_conn = mysql.connector.connect(**config)
        # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
        #                      Task #3032: Debug number of Python processes and memory use
        #                      Branch #3002: docker
        # Reduce the number of Manager instances that are used, as each
        # requires a copy of the entire memory to be copied into each
        # subprocess, resulting in a Python process per Manager instance
        # using as much memory as the parent.  OK on a server, not so much
        # in a container.  Disabled all the Manager().list() below and
        # replaced with Redis sets
        # self.anomalous_metrics = Manager().list()
        # self.not_anomalous = Manager().list()
        # self.features_profiles_checked = Manager().list()
        # self.training_metrics = Manager().list()
        # self.sent_to_panorama = Manager().list()
        # @added 20170108 - Feature #1830: Ionosphere alerts
        # Added lists of ionosphere_smtp_alerter_metrics and
        # ionosphere_non_smtp_alerter_metrics
        # self.ionosphere_smtp_alerter_metrics = Manager().list()
        # self.ionosphere_non_smtp_alerter_metrics = Manager().list()
        # @added 20170306 - Feature #1960: ionosphere_layers
        # self.layers_checked = Manager().list()
        # @added 20170809 - Task #2132: Optimise Ionosphere DB usage
        if settings.MEMCACHE_ENABLED:
            self.memcache_client = pymemcache_Client(
                (settings.MEMCACHED_SERVER_IP, settings.MEMCACHED_SERVER_PORT),
                connect_timeout=0.1, timeout=0.2)
        else:
            self.memcache_client = None
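
    # A hypothetical usage sketch (the agent wiring is not shown in this
    # module): the Ionosphere thread is created with the pid of its parent
    # process and started, along the lines of:
    #
    #     ionosphere = Ionosphere(getpid())
    #     ionosphere.start()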
    def check_if_parent_is_alive(self):
        """
        Self explanatory
        """
        try:
            kill(self.current_pid, 0)
            kill(self.parent_pid, 0)
        except:
            exit(0)
""" These are the ionosphere mysql functions used to surface and input ionosphere data for timeseries. """
    def mysql_insert(self, insert):
        """
        Insert data into mysql table

        :param insert: the insert string
        :type insert: str
        :return: int
        :rtype: int or boolean

        - **Example usage**::

            query = 'insert into host (host) VALUES (\'this_host\')'
            result = self.mysql_insert(query)

        .. note::
            - If the MySQL query fails a boolean will be returned not a tuple
                * ``False``
                * ``None``

        """
        try:
            cnx = mysql.connector.connect(**config)
            if ENABLE_IONOSPHERE_DEBUG:
                logger.info('debug :: connected to mysql')
        except mysql.connector.Error as err:
            logger.error('error :: mysql error - %s' % str(err))
            logger.error('error :: failed to connect to mysql')
            raise

        if cnx:
            try:
                cursor = cnx.cursor()
                cursor.execute(insert)
                inserted_id = cursor.lastrowid
                # Make sure data is committed to the database
                cnx.commit()
                cursor.close()
                cnx.close()
                return inserted_id
            except mysql.connector.Error as err:
                logger.error('error :: mysql error - %s' % str(err))
                logger.error('Failed to insert record')
                cnx.close()
                raise
        else:
            cnx.close()
            return False

        return False
    def purge_old_data_dirs(self, dir_path, older_than):
        time_now = time()
        logger.info(
            'Cleaning old training data from %s older than %s seconds' % (
                dir_path, str(older_than)))
        try:
            for path, folders, files in os.walk(dir_path):
                for folder in folders[:]:
                    folder_path = os.path.join(path, folder)
                    # Only timestamped directories are removed
                    if re.match(r'\d{10}', folder):
                        if ENABLE_IONOSPHERE_DEBUG:
                            logger.info('debug :: matched - %s' % folder_path)
                        if (time_now - os.path.getmtime(folder_path)) > older_than:
                            try:
                                rmtree(folder_path)
                                logger.info('removed - %s' % folder_path)
                            except:
                                logger.error('error :: failed to rmtree %s' % folder_path)
        except:
            logger.info(traceback.format_exc())
            logger.error('error :: purge_old_data_dirs - os.walk')

        last_purge_ts = int(time())
        try:
            self.redis_conn.setex(last_purge_key, 1800, last_purge_ts)
            logger.info('updated Redis key for %s' % last_purge_key)
        except:
            logger.error('error :: failed to update Redis key for %s' % last_purge_key)

        backup_purge_ts_file = '%s/last_purge_ts.txt' % (settings.IONOSPHERE_DATA_FOLDER)
        try:
            write_data_to_file(skyline_app, backup_purge_ts_file, 'w', last_purge_ts)
            logger.info('updated the backup_purge_ts_file with %s' % str(last_purge_ts))
        except:
            logger.error('error :: failed to update the backup_purge_ts_file - %s' % backup_purge_ts_file)
        return
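
    # An illustrative sketch of the directory layout that purge_old_data_dirs
    # above walks, where only the 10 digit timestamped directories are
    # candidates for removal (the metric path is hypothetical):
    #
    #     <IONOSPHERE_DATA_FOLDER>/1548000000/stats/example/requests/
    #
    # dir_path is a data directory such as settings.IONOSPHERE_DATA_FOLDER
    # and older_than is an age in seconds.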
    def remove_metric_check_file(self, metric_check_file):
        if os.path.isfile(str(metric_check_file)):
            try:
                os.remove(str(metric_check_file))
                logger.info('metric_check_file removed - %s' % str(metric_check_file))
            except OSError:
                pass
        return
    # @added 20161228 - Feature #1828: ionosphere - mirage Redis data features
    #                   Branch #922: Ionosphere
    # Bringing Ionosphere online - do alert on Ionosphere metrics
    def manage_ionosphere_unique_metrics(self):
        """
        Create a Redis set of all Ionosphere enabled metrics.

        :return: returns True
        """
        def get_an_engine():
            try:
                engine, log_msg, trace = get_engine(skyline_app)
                return engine, log_msg, trace
            except:
                trace = traceback.format_exc()
                logger.error('%s' % trace)
                log_msg = 'error :: failed to get MySQL engine for manage_ionosphere_unique_metrics'
                logger.error('%s' % log_msg)
                return None, log_msg, trace

        ionosphere_unique_metrics_count = 0
        redis_ionosphere_unique_metrics = None
        ionosphere_unique_metrics = []
        try:
            # ionosphere_unique_metrics = list(self.redis_conn.smembers('ionosphere.unique_metrics'))
            redis_ionosphere_unique_metrics = self.redis_conn.smembers('ionosphere.unique_metrics')
        except:
            logger.error(traceback.format_exc())
            logger.error('error :: failed to get ionosphere.unique_metrics from Redis')
            # ionosphere_unique_metrics = []

        if redis_ionosphere_unique_metrics is not None:
            ionosphere_unique_metrics = list(redis_ionosphere_unique_metrics)
            ionosphere_unique_metrics_count = len(ionosphere_unique_metrics)
            logger.info('Redis ionosphere.unique_metrics set has %s metrics' % (str(ionosphere_unique_metrics_count)))
        else:
            logger.info('Redis ionosphere.unique_metrics unknown setting to []')
            ionosphere_unique_metrics = []

        manage_ionosphere_unique_metrics = True
        manage_ionosphere_unique_metrics_key = []
        try:
            manage_ionosphere_unique_metrics_key = self.redis_conn.get('ionosphere.manage_ionosphere_unique_metrics')
        except Exception as e:
            if LOCAL_DEBUG:
                logger.error('error :: could not query Redis for ionosphere.manage_ionosphere_unique_metrics key: %s' % str(e))

        if manage_ionosphere_unique_metrics_key is not None:
            manage_ionosphere_unique_metrics = False

        logger.info('getting MySQL engine for ionosphere_enabled_metrics')
        try:
            engine, log_msg, trace = get_an_engine()
            logger.info(log_msg)
        except:
            logger.error(traceback.format_exc())
            logger.error('error :: could not get a MySQL engine for ionosphere_enabled_metrics')
            return False

        if not engine:
            logger.error('error :: MySQL engine not obtained for ionosphere_enabled_metrics')
            return False

        # Determine the metrics that have ionosphere_enabled
        # @added 20170103 - Task #1658: Patterning Skyline Ionosphere
        # TODO: We need 2 sets not just ionosphere.unique_metrics, otherwise
        # if a metric is switched from Analyzer to Mirage it will send all
        # matched anomalies to Ionosphere even if there is no features
        # profile at the specified duration.
        # ionosphere.analyzer.unique_metrics (at FULL_DURATION)
        # ionosphere.mirage.unique_metrics (NOT at FULL_DURATION)
        # @modified 20170108 - Feature #1852: Ionosphere - features_profile matched graphite graphs
        # Yes those ^^ are needed, MySQL join?
        ionosphere_enabled_metrics = []
        ionosphere_metrics_count = 0
        query_ok = False
        try:
            stmt = 'select metric from metrics where ionosphere_enabled=1'
            connection = engine.connect()
            for row in engine.execute(stmt):
                metric_basename = row['metric']
                metric_name = '%s%s' % (str(settings.FULL_NAMESPACE), str(metric_basename))
                ionosphere_enabled_metrics.append(metric_name)
            connection.close()
            query_ok = True
        except:
            logger.error(traceback.format_exc())
            logger.error('error :: could not determine ionosphere_enabled metrics from the DB to manage ionosphere.unique_metrics Redis set')

        ionosphere_metrics_count = len(ionosphere_enabled_metrics)
        logger.info('db has %s ionosphere_enabled metrics' % (str(ionosphere_metrics_count)))

        # @added 20190528 - Branch #3002: docker
        if ionosphere_metrics_count == 0:
            ionosphere_enabled_metrics = ['none']

        if manage_ionosphere_unique_metrics:
            # Testing the query was fine and Ionosphere metrics can go to 0 if
            # all were disabled
            if query_ok:
                manage_ionosphere_unique_metrics = True
            else:
                manage_ionosphere_unique_metrics = False

        if manage_ionosphere_unique_metrics:
            for metric_name in ionosphere_enabled_metrics:
                try:
                    self.redis_conn.sadd('ionosphere.new_unique_metrics', metric_name)
                    # logger.info('added %s to ionosphere.new_unique_metrics Redis set' % metric_name)
                except:
                    logger.error(traceback.format_exc())
                    logger.info('error :: failed to add %s to ionosphere.new_unique_metrics Redis set' % metric_name)
            try:
                self.redis_conn.setex('ionosphere.manage_ionosphere_unique_metrics', 300, time())
            except:
                logger.error('error :: failed to set key :: ionosphere.manage_ionosphere_unique_metrics')
            try:
                logger.info('replacing Redis ionosphere.unique_metrics via rename of ionosphere.new_unique_metrics')
                self.redis_conn.rename('ionosphere.new_unique_metrics', 'ionosphere.unique_metrics')
                manage_ionosphere_unique_metrics = False
                ionosphere_unique_metrics = []
            except Exception as e:
                if str(e) == 'no such key':
                    logger.info('could not rename Redis set ionosphere.new_unique_metrics to ionosphere.unique_metrics: %s' % str(e))
                else:
                    logger.error('error :: could not rename Redis set ionosphere.new_unique_metrics to ionosphere.unique_metrics: %s' % str(e))
            try:
                self.redis_conn.setex('ionosphere.manage_ionosphere_unique_metrics', 300, time())
            except:
                logger.error('error :: failed to set key :: ionosphere.manage_ionosphere_unique_metrics')

        redis_ionosphere_unique_metrics = []
        try:
            # ionosphere_unique_metrics = list(self.redis_conn.smembers('ionosphere.unique_metrics'))
            redis_ionosphere_unique_metrics = self.redis_conn.smembers('ionosphere.unique_metrics')
        except:
            logger.error(traceback.format_exc())
            logger.error('error :: failed to get ionosphere.unique_metrics from Redis')
            # ionosphere_unique_metrics = []

        if redis_ionosphere_unique_metrics is not None:
            ionosphere_unique_metrics = list(redis_ionosphere_unique_metrics)
            ionosphere_unique_metrics_count = len(ionosphere_unique_metrics)
            logger.info('the new Redis ionosphere.unique_metrics set has %s metrics' % (str(ionosphere_unique_metrics_count)))
        else:
            logger.info('Redis ionosphere.unique_metrics unknown setting to []')
            ionosphere_unique_metrics = []

        if engine:
            try:
                engine.dispose()
            except:
                logger.error(traceback.format_exc())
                logger.error('error :: calling engine.dispose()')

        return True
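
    # A note on the pattern used by manage_ionosphere_unique_metrics above:
    # the set is rebuilt in ionosphere.new_unique_metrics and then renamed
    # over ionosphere.unique_metrics.  Redis RENAME is atomic, so consumers
    # of ionosphere.unique_metrics never observe a partially populated set,
    # and the ionosphere.manage_ionosphere_unique_metrics key with its 300
    # second TTL rate limits how often the rebuild runs.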
    # @added 20161230 - Feature #1830: Ionosphere alerts
    #                   Bug #1460: panorama check file fails
    #                   Panorama check file fails #24
    # Get rid of the skyline_functions imp as imp is deprecated in py3 anyway
    def new_load_metric_vars(self, metric_vars_file):
        """
        Load the metric variables for a check from a metric check variables file

        :param metric_vars_file: the path and filename to the metric variables files
        :type metric_vars_file: str
        :return: the metric_vars list or ``False``
        :rtype: list

        """
        if os.path.isfile(metric_vars_file):
            logger.info(
                'loading metric variables from metric_check_file - %s' % (
                    str(metric_vars_file)))
        else:
            logger.error(
                'error :: loading metric variables from metric_check_file - file not found - %s' % (
                    str(metric_vars_file)))
            return False

        metric_vars = []
        with open(metric_vars_file) as f:
            for line in f:
                no_new_line = line.replace('\n', '')
                no_equal_line = no_new_line.replace(' = ', ',')
                array = str(no_equal_line.split(',', 1))
                add_line = literal_eval(array)
                metric_vars.append(add_line)

        string_keys = ['metric', 'anomaly_dir', 'added_by', 'app', 'source']
        float_keys = ['value']
        # @modified 20170127 - Feature #1886: Ionosphere learn - child like parent with evolutionary maturity
        # Added ionosphere_parent_id, always zero from Analyzer and Mirage
        int_keys = [
            'from_timestamp', 'metric_timestamp', 'added_at', 'full_duration',
            'ionosphere_parent_id']
        array_keys = ['algorithms', 'triggered_algorithms']
        boolean_keys = ['graphite_metric', 'run_crucible_tests']

        metric_vars_array = []
        for var_array in metric_vars:
            key = None
            value = None
            if var_array[0] in string_keys:
                key = var_array[0]
                value_str = str(var_array[1]).replace("'", '')
                value = str(value_str)
                if var_array[0] == 'metric':
                    metric = value
            if var_array[0] in float_keys:
                key = var_array[0]
                value_str = str(var_array[1]).replace("'", '')
                value = float(value_str)
            if var_array[0] in int_keys:
                key = var_array[0]
                value_str = str(var_array[1]).replace("'", '')
                value = int(value_str)
            if var_array[0] in array_keys:
                key = var_array[0]
                value = literal_eval(str(var_array[1]))
            if var_array[0] in boolean_keys:
                key = var_array[0]
                if str(var_array[1]) == 'True':
                    value = True
                else:
                    value = False
            if key:
                metric_vars_array.append([key, value])

        if len(metric_vars_array) == 0:
            logger.error(
                'error :: no metric variables were loaded from %s' % (
                    str(metric_vars_file)))
            return False

        logger.info('debug :: metric_vars for %s' % str(metric))
        logger.info('debug :: %s' % str(metric_vars_array))

        return metric_vars_array
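
    # A minimal sketch of a metric check variables file that
    # new_load_metric_vars above parses, one ``key = value`` pair per line
    # (the metric name and values here are hypothetical):
    #
    #     metric = 'stats.example.requests'
    #     value = '123.0'
    #     from_timestamp = '1548000000'
    #     metric_timestamp = '1548086400'
    #     algorithms = ['histogram_bins', 'ks_test']
    #     triggered_algorithms = ['histogram_bins']
    #     added_by = 'mirage'
    #     added_at = '1548086400'
    #     full_duration = '86400'
    #     ionosphere_parent_id = 0
    #
    # which would be returned as a list of [key, value] pairs, e.g.
    # [['metric', 'stats.example.requests'], ['value', 123.0], ...]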
    # @added 20170109 - Feature #1854: Ionosphere learn
    # Added the spawn_learn_process after determining it is not fit to bolt
    # learn inside of ionosphere.py in its entirety, no point in more
    # conditional nesting and bulking up ionosphere.py with more learn
    # parameters to spin_process etc.  ionosphere.py works, as good as it
    # gets, so extended with learn.py.  This uses the same no memory leak
    # pattern that was adopted for smtp_alerts.
    def spawn_learn_process(self, i, timestamp):
        """
        Spawn a process to learn.

        This is used for Ionosphere to learn if anomalous metrics remain
        anomalous over time, as the resolution decreases.  It follows the
        multiprocessing methodology that was introduced in Analyzer and
        Mirage in the context of the process objects being cleared down.
        The learn processes cannot create memory leaks, as the process
        always terminates or is terminated, which prevents any memory leaks
        in the parent.
        """
        # @modified 20170117 - Feature #1854: Ionosphere learn - generations
        # Renamed the function from simple learn to the meme it has become
        # learn(timestamp)
        ionosphere_learn(timestamp)
    # @added 20190326 - Feature #2484: FULL_DURATION feature profiles
    def process_ionosphere_echo(self, i, metric_check_file):
        """
        Spawn a process_ionosphere_echo check to create features profiles at
        settings.FULL_DURATION for Mirage metrics

        :param i: python process id
        :param metric_check_file: full path to the metric check file
        :type i: object
        :type metric_check_file: str
        :return: boolean
        :rtype: boolean

        """
        try:
            # Load and validate metric variables
            metric_vars_array = self.new_load_metric_vars(str(metric_check_file))
        except:
            logger.info(traceback.format_exc())
            logger.error('error :: process_ionosphere_echo :: failed to load metric variables from check file - %s' % (metric_check_file))
            return

        added_by = None
        try:
            key = 'added_by'
            value_list = [var_array[1] for var_array in metric_vars_array if var_array[0] == key]
            added_by = str(value_list[0])
            if settings.ENABLE_IONOSPHERE_DEBUG:
                logger.info('debug :: metric variable - added_by - %s' % added_by)
        except:
            logger.error('error :: process_ionosphere_echo failed to read added_by variable from check file - %s' % (metric_check_file))
            added_by = None
        if not added_by:
            return
        if added_by != 'mirage':
            logger.info('process_ionosphere_echo :: only mirage metrics are processed not metrics added_by %s' % added_by)
            return

        metric = None
        try:
            # metric_vars.metric
            key = 'metric'
            value_list = [var_array[1] for var_array in metric_vars_array if var_array[0] == key]
            metric = str(value_list[0])
            if settings.ENABLE_IONOSPHERE_DEBUG:
                logger.info('debug :: metric variable - metric - %s' % metric)
        except:
            logger.info(traceback.format_exc())
            logger.error('error :: failed to read metric variable from check file - %s' % (metric_check_file))
            metric = None
        if not metric:
            logger.error('error :: process_ionosphere_echo failed to load metric variable from check file - %s' % (metric_check_file))
            return

        # @added 20190413 - Feature #2484: FULL_DURATION feature profiles
        # Only process if it is an ionosphere enabled metric
        try:
            ionosphere_unique_metrics = list(self.redis_conn.smembers('ionosphere.unique_metrics'))
        except:
            logger.error(traceback.format_exc())
            logger.error('error :: failed to get ionosphere.unique_metrics from Redis')
            ionosphere_unique_metrics = []
        if ionosphere_unique_metrics:
            # @modified 20190413 - Bug #2942: process_ionosphere_echo metric mismatch
            #                      Feature #2484: FULL_DURATION feature profiles
            # Matching bug, for not in a list comprehension it must be an
            # absolute match
            # if not metric in ionosphere_unique_metrics:
            metric_name = '%s%s' % (str(settings.FULL_NAMESPACE), str(metric))
            # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
            # if not metric_name in ionosphere_unique_metrics:
            if metric_name not in ionosphere_unique_metrics:
                logger.info('process_ionosphere_echo :: only ionosphere enabled metrics are processed, skipping %s' % metric)
                return

        full_duration = None
        try:
            # metric_vars.full_duration
            key = 'full_duration'
            value_list = [var_array[1] for var_array in metric_vars_array if var_array[0] == key]
            full_duration = int(value_list[0])
            if settings.ENABLE_IONOSPHERE_DEBUG:
                logger.info('debug :: metric variable - full_duration - %s' % str(full_duration))
        except:
            logger.error('error :: process_ionosphere_echo failed to read full_duration variable from check file - %s' % (metric_check_file))
            full_duration = None
        if not full_duration:
            return

        logger.info('process_ionosphere_echo :: processing - %s' % (metric))
        ionosphere_echo(metric, full_duration)
    # @modified 20190404 - Bug #2904: Initial Ionosphere echo load and Ionosphere feedback
    #                      Feature #2484: FULL_DURATION feature profiles
    # Added the ionosphere_busy parameter
    # def spin_process(self, i, metric_check_file):
    def spin_process(self, i, metric_check_file, ionosphere_busy):
        """
        Assign an anomalous metric to check against features profiles.

        :param i: python process id
        :param metric_check_file: full path to the metric check file
        :param ionosphere_busy: whether Ionosphere should manage and alternate
            between normal Ionosphere and echo analysis
        :type i: object
        :type metric_check_file: str
        :type ionosphere_busy: boolean
        :return: int
        :rtype: int or boolean

        """
        def get_an_engine():
            try:
                engine, log_msg, trace = get_engine(skyline_app)
                return engine, log_msg, trace
            except:
                logger.error(traceback.format_exc())
                log_msg = 'error :: failed to get MySQL engine in spin_process'
                logger.error('error :: failed to get MySQL engine in spin_process')
                return None, log_msg, trace

        def engine_disposal(engine):
            if engine:
                try:
                    engine.dispose()
                except:
                    logger.error(traceback.format_exc())
                    logger.error('error :: calling engine.dispose()')
            return

        child_process_pid = os.getpid()
        logger.info('child_process_pid - %s' % str(child_process_pid))

        try:
            ionosphere_max_runtime = settings.IONOSPHERE_MAX_RUNTIME
        except:
            ionosphere_max_runtime = 120

        if settings.ENABLE_IONOSPHERE_DEBUG:
            logger.info('debug :: processing metric check - %s' % metric_check_file)

        if not os.path.isfile(str(metric_check_file)):
            logger.error('error :: file not found - metric_check_file - %s' % (str(metric_check_file)))
            return

        engine = None
        anomalous_timeseries = False

        check_file_name = os.path.basename(str(metric_check_file))
        if settings.ENABLE_IONOSPHERE_DEBUG:
            logger.info('debug :: check_file_name - %s' % check_file_name)
        check_file_timestamp = check_file_name.split('.', 1)[0]
        if settings.ENABLE_IONOSPHERE_DEBUG:
            logger.info('debug :: check_file_timestamp - %s' % str(check_file_timestamp))
        check_file_metricname_txt = check_file_name.split('.', 1)[1]
        if settings.ENABLE_IONOSPHERE_DEBUG:
            logger.info('debug :: check_file_metricname_txt - %s' % check_file_metricname_txt)
        check_file_metricname = check_file_metricname_txt.replace('.txt', '')
        if settings.ENABLE_IONOSPHERE_DEBUG:
            logger.info('debug :: check_file_metricname - %s' % check_file_metricname)
        check_file_metricname_dir = check_file_metricname.replace('.', '/')
        if settings.ENABLE_IONOSPHERE_DEBUG:
            logger.info('debug :: check_file_metricname_dir - %s' % check_file_metricname_dir)

        metric_failed_check_dir = '%s/%s/%s' % (failed_checks_dir, check_file_metricname_dir, check_file_timestamp)
        failed_check_file = '%s/%s' % (metric_failed_check_dir, check_file_name)
        if settings.ENABLE_IONOSPHERE_DEBUG:
            logger.info('debug :: failed_check_file - %s' % failed_check_file)

        # @added 20170307 - Feature #1960: ionosphere_layers - ionosphere_check_cache_key
        # This Redis cache key check was added to prevent Ionosphere from
        # running riot on checks if for some reason the check_file is not
        # removed, which happens if some exception is not handled, as found
        # out again during yesterday's development of run_layer_algorithms.
        # It was a good reminder of how fast Skyline can iterate.
        ionosphere_check_cache_key = 'ionosphere.check.%s' % check_file_name
        check_done = False
        try:
            check_done = self.redis_conn.get(ionosphere_check_cache_key)
        except Exception as e:
            logger.error('error :: could not query Redis for cache_key: %s' % e)

        if not check_done:
            logger.info('check done check - no check cache key - %s' % ionosphere_check_cache_key)
        else:
            # @modified 20181113 - Task #2680: Remove Ionosphere check files if key exists
            # This was here for initial debugging, no longer needed
            # logger.error('error :: a check cache key exists - %s' % ionosphere_check_cache_key)
            # logger.error('error :: failing check to prevent multiple iterations over this check')
            # fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
            logger.info('a check cache key exists - %s' % (ionosphere_check_cache_key))
            logger.info('to prevent multiple iterations over this check removing %s' % (
                str(metric_check_file)))
            self.remove_metric_check_file(str(metric_check_file))
            return

        try:
            check_process_start = int(time())
            # @modified 20190412 - Task #2824: Test redis-py upgrade
            #                      Task #2926: Update dependencies
            # redis-py 3.x only accepts user data as bytes, strings or
            # numbers (ints, longs and floats).  All 2.X users should
            # make sure that the keys and values they pass into redis-py
            # are either bytes, strings or numbers.  Added cache_key_value
            # self.redis_conn.setex(
            #     ionosphere_check_cache_key, 300, [check_process_start])
            self.redis_conn.setex(
                ionosphere_check_cache_key, 300, check_process_start)
            logger.info(
                'added Redis check key - %s' % (ionosphere_check_cache_key))
        except:
            logger.error(traceback.format_exc())
            logger.error(
                'error :: failed to add Redis check key - %s' % (ionosphere_check_cache_key))
            logger.error('error :: failing check to prevent multiple iterations over this check')
            fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
            return

        try:
            # Load and validate metric variables
            # @modified 20161231 - Feature #1830: Ionosphere alerts
            #                      Bug #1460: panorama check file fails
            #                      Panorama check file fails #24
            # Get rid of the skyline_functions imp as imp is deprecated in py3 anyway
            # Use def new_load_metric_vars(self, metric_vars_file):
            # metric_vars = load_metric_vars(skyline_app, str(metric_check_file))
            metric_vars_array = self.new_load_metric_vars(str(metric_check_file))
        except:
            logger.info(traceback.format_exc())
            logger.error('error :: failed to load metric variables from check file - %s' % (metric_check_file))
            fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
            return

        # Test metric variables
        # We use a pythonic methodology to test if the variables are defined,
        # this ensures that if any of the variables are not set for some reason
        # we can handle unexpected data or situations gracefully and try and
        # ensure that the process does not hang.
        metric = None
        try:
            # metric_vars.metric
            # metric = str(metric_vars.metric)
            key = 'metric'
            value_list = [var_array[1] for var_array in metric_vars_array if var_array[0] == key]
            metric = str(value_list[0])
            base_name = metric
            if settings.ENABLE_IONOSPHERE_DEBUG:
                logger.info('debug :: metric variable - metric - %s' % metric)
        except:
            logger.info(traceback.format_exc())
            logger.error('error :: failed to read metric variable from check file - %s' % (metric_check_file))
            metric = None

        if not metric:
            logger.error('error :: failed to load metric variable from check file - %s' % (metric_check_file))
            fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
            return

        value = None
        try:
            # metric_vars.value
            # value = str(metric_vars.value)
            key = 'value'
            value_list = [var_array[1] for var_array in metric_vars_array if var_array[0] == key]
            value = float(value_list[0])
            anomalous_value = value
            if settings.ENABLE_IONOSPHERE_DEBUG:
                logger.info('debug :: metric variable - value - %s' % str(value))
        except:
            logger.error('error :: failed to read value variable from check file - %s' % (metric_check_file))
            value = None

        if not value:
            # @modified 20181119 - Bug #2708: Failing to load metric vars
            if value == 0.0:
                pass
            else:
                logger.error('error :: failed to load value variable from check file - %s' % (metric_check_file))
                fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
                return

        from_timestamp = None
        try:
            # metric_vars.from_timestamp
            # from_timestamp = str(metric_vars.from_timestamp)
            key = 'from_timestamp'
            value_list = [var_array[1] for var_array in metric_vars_array if var_array[0] == key]
            from_timestamp = int(value_list[0])
            if settings.ENABLE_IONOSPHERE_DEBUG:
                logger.info('debug :: metric variable - from_timestamp - %s' % str(from_timestamp))
        except:
            # @added 20160822 - Bug #1460: panorama check file fails
            # Added exception handling here
            logger.info(traceback.format_exc())
            logger.error('error :: failed to read from_timestamp variable from check file - %s' % (metric_check_file))
            fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
            return

        if not from_timestamp:
            logger.error('error :: failed to load from_timestamp variable from check file - %s' % (metric_check_file))
            fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
            return

        metric_timestamp = None
        try:
            # metric_vars.metric_timestamp
            # metric_timestamp = str(metric_vars.metric_timestamp)
            key = 'metric_timestamp'
            value_list = [var_array[1] for var_array in metric_vars_array if var_array[0] == key]
            metric_timestamp = int(value_list[0])
            if settings.ENABLE_IONOSPHERE_DEBUG:
                logger.info('debug :: metric variable - metric_timestamp - %s' % str(metric_timestamp))
        except:
            logger.error('error :: failed to read metric_timestamp variable from check file - %s' % (metric_check_file))
            metric_timestamp = None

        if not metric_timestamp:
            logger.error('error :: failed to load metric_timestamp variable from check file - %s' % (metric_check_file))
            fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
            return

        try:
            # metric_vars.algorithms
            # algorithms = metric_vars.algorithms
            key = 'algorithms'
            value_list = [var_array[1] for var_array in metric_vars_array if var_array[0] == key]
            algorithms = value_list[0]
            if settings.ENABLE_IONOSPHERE_DEBUG:
                logger.info('debug :: metric variable - algorithms - %s' % str(algorithms))
        except:
            logger.error('error :: failed to read algorithms variable from check file setting to all - %s' % (metric_check_file))
            algorithms = 'all'

        try:
            # metric_vars.triggered_algorithms
            # triggered_algorithms = metric_vars.triggered_algorithms
            key = 'triggered_algorithms'
            value_list = [var_array[1] for var_array in metric_vars_array if var_array[0] == key]
            triggered_algorithms = value_list[0]
            if settings.ENABLE_IONOSPHERE_DEBUG:
                logger.info('debug :: metric variable - triggered_algorithms - %s' % str(triggered_algorithms))
        except:
            logger.error('error :: failed to read triggered_algorithms variable from check file setting to all - %s' % (metric_check_file))
            triggered_algorithms = 'all'

        added_by = None
        try:
            # metric_vars.added_by
            # added_by = str(metric_vars.added_by)
            key = 'added_by'
            value_list = [var_array[1] for var_array in metric_vars_array if var_array[0] == key]
            added_by = str(value_list[0])
            if settings.ENABLE_IONOSPHERE_DEBUG:
                logger.info('debug :: metric variable - added_by - %s' % added_by)
        except:
            logger.error('error :: failed to read added_by variable from check file - %s' % (metric_check_file))
            added_by = None

        if not added_by:
            fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
            return

        # @added 20170117 - Feature #1854: Ionosphere learn - generations
        if str(added_by) == 'ionosphere_learn':
            logger.info('debug :: metric variable - added_by - %s' % added_by)

        try:
            # metric_vars.added_at
            # added_at = str(metric_vars.added_at)
            key = 'added_at'
            value_list = [var_array[1] for var_array in metric_vars_array if var_array[0] == key]
            added_at = int(value_list[0])
            if settings.ENABLE_IONOSPHERE_DEBUG:
                logger.info('debug :: metric variable - added_at - %s' % str(added_at))
        except:
            logger.error('error :: failed to read added_at variable from check file - setting to metric_timestamp - %s' % (metric_check_file))
            added_at = metric_timestamp

        # @added 20161228 - Feature #1828: ionosphere - mirage Redis data features
        # Added full_duration which needs to be recorded to allow Mirage metrics
        # to be profiled on Redis timeseries data at FULL_DURATION
        full_duration = None
        try:
            # metric_vars.full_duration
            # full_duration = str(metric_vars.full_duration)
            key = 'full_duration'
            value_list = [var_array[1] for var_array in metric_vars_array if var_array[0] == key]
            full_duration = int(value_list[0])
            if settings.ENABLE_IONOSPHERE_DEBUG:
                logger.info('debug :: metric variable - full_duration - %s' % str(full_duration))
        except:
            logger.error('error :: failed to read full_duration variable from check file - %s' % (metric_check_file))
            full_duration = None

        if not full_duration:
            fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
            return

        # @added 20170127 - Feature #1886: Ionosphere learn - child like parent with evolutionary maturity
        # Added ionosphere_parent_id, always zero from Analyzer and Mirage
        ionosphere_parent_id = None
        ionosphere_parent_id_determined = False
        try:
            key = 'ionosphere_parent_id'
            value_list = [var_array[1] for var_array in metric_vars_array if var_array[0] == key]
            ionosphere_parent_id = int(value_list[0])
            ionosphere_parent_id_determined = True
            if settings.ENABLE_IONOSPHERE_DEBUG:
                logger.info('debug :: metric variable - ionosphere_parent_id - %s' % str(ionosphere_parent_id))
        except:
            logger.error('error :: failed to read ionosphere_parent_id variable from check file - %s' % (metric_check_file))
            ionosphere_parent_id = None

        if not ionosphere_parent_id_determined:
            logger.error('error :: failed to determine ionosphere_parent_id variable from check file - %s' % (metric_check_file))
            fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
            return

        # @modified 20170116 - Feature #1854: Ionosphere learn
        # Do not check the cache key or anomaly age if added by ionosphere_learn
        if added_by != 'ionosphere_learn':
            # @added 20170101 - Feature #1830: Ionosphere alerts
            # Remove check file if an alert key exists
            cache_key = 'ionosphere.%s.alert.%s.%s' % (added_by, metric_timestamp, base_name)
            last_alert = False
            try:
                last_alert = self.redis_conn.get(cache_key)
            except Exception as e:
                logger.error('error :: could not query Redis for cache_key: %s' % e)
            if not last_alert:
                logger.info('debug :: no alert cache key - %s' % cache_key)
            else:
                logger.info('debug :: removing check - alert cache key exists - %s' % cache_key)
                self.remove_metric_check_file(str(metric_check_file))
                return

            now = time()
            anomaly_age = int(now) - int(metric_timestamp)
            if anomaly_age > max_age_seconds:
                logger.info(
                    'Ionosphere check max age exceeded - %s - %s seconds old, older than %s seconds discarding' % (
                        metric, str(anomaly_age), str(max_age_seconds)))
                with open(metric_check_file, 'rt') as fr:
                    metric_check_file_contents = fr.readlines()
                    logger.info(
                        'debug :: metric check file contents\n%s' % (str(metric_check_file_contents)))
                self.remove_metric_check_file(str(metric_check_file))
                return
        else:
            logger.info('processing check_file for ionosphere_learn - %s' % str(metric_check_file))

        # @added 20161222 - ionosphere should extract features for every anomaly
        # check that is sent through and calculate a feature_profile ready for
        # submission by the user if they so choose.  Further ionosphere could
        # make itself more useful by comparing any training data profiles to
        # further anomalies, however the feature profiles for subsequent
        # anomalies may be similar enough to match a few times and each a closer
        # match to the next.
        training_metric = False
        metrics_id = None
        metric_ionosphere_enabled = None

        # @added 20170115 - Feature #1854: Ionosphere learn - generations
        # Create the metrics_db_object so it is available to determine all
        # the details of all features profiles for the metric, this has all
        # the generations values available in it.  Here we go! Learn!
        metrics_db_object = None
        # @modified 20190325 - Feature #2484: FULL_DURATION feature profiles
        # Moved get_metrics_db_object block to common_functions.py
        try:
            metrics_db_object = get_metrics_db_object(base_name)
        except:
            logger.error(traceback.format_exc())
            logger.error('error :: could not determine metrics_db_object from get_metrics_db_object for %s' % base_name)

        if metrics_db_object:
            metrics_id = None
            try:
                metrics_id = int(metrics_db_object['id'])
            except:
                # @added 20190509 - Bug #2984: Ionosphere - could not determine values from metrics_db_object
                # Added a traceback here to debug an issue
                logger.error(traceback.format_exc())
                logger.error('error :: could not determine id from metrics_db_object for %s' % base_name)
                metrics_id = None
                metric_ionosphere_enabled = None
                training_metric = True
            if metrics_id:
                # @modified 20190510 - Bug #2984: Ionosphere - could not determine values from metrics_db_object
                # metric_ionosphere_enabled = int(metrics_db_object['ionosphere_enabled'])
                metric_ionosphere_enabled = None
                try:
                    metric_ionosphere_enabled = int(metrics_db_object['ionosphere_enabled'])
                except:
                    logger.error(traceback.format_exc())
                    logger.error('error :: could not determine ionosphere_enabled from metrics_db_object for %s' % base_name)
                if metric_ionosphere_enabled is not None:
                    training_metric = False
                else:
                    training_metric = True
                if metric_ionosphere_enabled == 1:
                    training_metric = False
                if metric_ionosphere_enabled == 0:
                    training_metric = True
        else:
            metrics_id = None
            metric_ionosphere_enabled = None
            training_metric = True
            logger.error('error :: could not determine metric id from memcache or metrics tables for %s' % base_name)
            fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
            return

        # @added 20190524 - Bug #3050: Ionosphere - Skyline and Graphite feedback
        # Do not run checks if the namespace has matched multiple times in the
        # last 10 minutes.  However it is quite difficult to ascertain which
        # Skyline related metrics are feeding back, so use the ionosphere_busy
        # logic again, use or find the Skyline host namespace and do not
        # analyse the Skyline host namespace while Ionosphere is busy.
        feedback_metric = False
        if ionosphere_busy:
            metric_namespace_elements = base_name.split('.')
            for to_skip in SKYLINE_FEEDBACK_NAMESPACES:
                if to_skip in base_name:
                    feedback_metric = True
                    break
                to_skip_namespace_elements = to_skip.split('.')
                elements_matched = set(metric_namespace_elements) & set(to_skip_namespace_elements)
                if len(elements_matched) == len(to_skip_namespace_elements):
                    feedback_metric = True
                    break
        if feedback_metric:
            cache_key = 'ionosphere.feedback_metric.checked.%s' % (base_name)
            logger.info('feedback metric identified adding Redis key with 600 TTL - %s' % cache_key)
            try:
                self.redis_conn.setex(cache_key, 600, int(time()))
            except:
                logger.info(traceback.format_exc())
                logger.error('error :: failed to add %s key to Redis' % (
                    str(cache_key)))
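
        # An illustrative example of the feedback matching above (hypothetical
        # names): with SKYLINE_FEEDBACK_NAMESPACES = ['skyline-1', 'graphite'],
        # a base_name of 'stats.skyline-1.redis.used_memory' is identified as
        # a feedback metric by the substring match, and
        # 'carbon.agents.graphite.cpuUsage' by the namespace element match.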
        # @added 20170116 - Feature #1854: Ionosphere learn - generations
        # If this is added_by ionosphere_learn the id is only added if the
        # use_full_duration_days features profile is less than max_generations,
        # as if it is at the max then a new features profile cannot be created
        # from it, even if it is a match.
        metric_max_generations = None
        if added_by == 'ionosphere_learn':
            try:
                metric_max_generations = int(metrics_db_object['max_generations'])
                logger.info('determining max_generations for ionosphere_learn check - %s - %s' % (str(metric_max_generations), base_name))
            except:
                logger.error(traceback.format_exc())
                logger.error('error :: ionosphere_learn check could not determine the metric max_generations from the metrics_db_object for %s' % base_name)
            if not metric_max_generations:
                logger.error('error :: ionosphere_learn check cannot continue without max_generations for %s' % base_name)
                fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
                if engine:
                    engine_disposal(engine)
                return

        # @added 20190522 - Task #3034: Reduce multiprocessing Manager list usage
        # The Redis ionosphere.ionosphere_non_smtp_alerter_metrics set is
        # created here to replace the self.ionosphere_non_smtp_alerter_metrics
        # Manager.list in the below section
        ionosphere_non_smtp_alerter_metrics = []
        try:
            ionosphere_non_smtp_alerter_metrics = list(self.redis_conn.smembers('ionosphere.ionosphere_non_smtp_alerter_metrics'))
        except:
            logger.info(traceback.format_exc())
            logger.error('error :: failed to generate a list from the ionosphere.ionosphere_non_smtp_alerter_metrics Redis set')
            ionosphere_non_smtp_alerter_metrics = []

        # @added 20170108 - Feature #1830: Ionosphere alerts
        # Only process smtp_alerter_metrics
        if training_metric:
            # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
            # if base_name in self.ionosphere_non_smtp_alerter_metrics:
            if base_name in ionosphere_non_smtp_alerter_metrics:
                logger.error('error :: Ionosphere does not handle metrics that do not have a smtp alert context removing check for %s' % (base_name))
                self.remove_metric_check_file(str(metric_check_file))
                if engine:
                    engine_disposal(engine)
                return
            else:
                # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                # self.training_metrics.append(base_name)
                redis_set = 'ionosphere.training_metrics'
                data = str(base_name)
                try:
                    self.redis_conn.sadd(redis_set, data)
                except:
                    logger.info(traceback.format_exc())
                    logger.error('error :: failed to add %s to Redis set %s' % (
                        str(data), str(redis_set)))

        logger.info(
            'ionosphere_enabled is %s for metric id %s - %s' % (
                str(metric_ionosphere_enabled), str(metrics_id),
                base_name))

        if training_metric:
            logger.info('Ionosphere is not enabled on %s' % (base_name))
        else:
            logger.info('Ionosphere is enabled on %s' % (base_name))

        # @added 20161210 - Branch #922: ionosphere
        #                   Task #1658: Patterning Skyline Ionosphere
        # Only continue if there is a training data json timeseries file
        metric_timeseries_dir = base_name.replace('.', '/')

        # @modified 20170115 - Feature #1854: Ionosphere learn
        # Allowing the bifurcation of the metric_training_data_dir based on
        # whether added_by is ionosphere_learn or not, this allows Ionosphere to
        # be brought online to start evaluating the learn features profiles at
        # 30 days, or whatever the learn_full_duration_days is for the metric
        # that is being automatically learnt, and uses these fuller duration
        # features to determine if a new training data set has been created for
        # an ionosphere_enabled metric.  Here Ionosphere starts to try and get
        # clever, let us hope not too clever, but this is where the
        # max_percent_diff_from_origin and max_generations comes in.  So ...
        # here we go, a really "Crazy feedback loop" @astanway :) I would say
        # that this is going to be way more useful than the last referenced one
        # in https://github.com/etsy/skyline/pull/90#r13592782 ;) This is it
        # 20170115202500 UTC Ionosphere really is now really going to begin.
        # Here we go! Learn!
        # metric_training_data_dir = '%s/%s/%s' % (
        #     settings.IONOSPHERE_DATA_FOLDER, metric_timestamp,
        #     metric_timeseries_dir)
        if added_by != 'ionosphere_learn':
            metric_training_data_dir = '%s/%s/%s' % (
                settings.IONOSPHERE_DATA_FOLDER, metric_timestamp,
                metric_timeseries_dir)
        else:
            # Here we go! Learn you bugger!  SUCH A BIG THANKS TO tsfresh!
            # And flowjob and The White Stripes, @matzhouse, her and the Dude.
            metric_training_data_dir = '%s/%s/%s' % (
                settings.IONOSPHERE_LEARN_FOLDER, metric_timestamp,
                metric_timeseries_dir)

        anomaly_json = '%s/%s.json' % (metric_training_data_dir, base_name)
        if os.path.isfile(anomaly_json):
            logger.info('training data ts json available - %s' % (anomaly_json))
        else:
            logger.error('error :: training data ts json was not found - %s' % (anomaly_json))
            fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
            if engine:
                engine_disposal(engine)
            return

        # @added 20161228 - Feature #1828: ionosphere - mirage Redis data features
        # The timeseries full_duration needs to be recorded to allow Mirage metrics to
        # be profiled on Redis timeseries data at FULL_DURATION
        # e.g. mirage.redis.24h.json
        if training_metric:
            logger.info('training metric - %s' % (base_name))

        redis_anomaly_json = False
        if added_by == 'mirage':
            logger.info('checking training data Redis json is available')
            # Always calculate features for both the SECOND_ORDER_RESOLUTION_SECONDS
            # timeseries data and the FULL_DURATION Redis timeseries data.
            # It is always preferable to create a features profile on a FULL_DURATION
            # data set, unless the user is flagging the actual Mirage timeseries as
            # not anomalous.  In the Mirage context the not anomalous may often be more
            # "visible" in the FULL_DURATION view and if so should be matched on the
            # FULL_DURATION timeseries data, even if it is a Mirage metric.
            # Features profiles can be created for a Mirage metric on both the
            # FULL_DURATION and the SECOND_ORDER_RESOLUTION_SECONDS data sets, however
            # only one should be needed.
            # A features profile should always be created at the highest resolution
            # possible, FULL_DURATION data, wherever possible.
            try:
                full_duration_hours = str(int(settings.FULL_DURATION / 3600))
                redis_anomaly_json = '%s/%s.mirage.redis.%sh.json' % (metric_training_data_dir, base_name, full_duration_hours)
                if os.path.isfile(redis_anomaly_json):
                    logger.info('training data Redis full duration ts json available - %s' % (redis_anomaly_json))
                else:
                    logger.info('training data Redis full duration json was not found - %s' % (redis_anomaly_json))
            except:
                logger.error(traceback.format_exc())
                logger.error('error :: training data Redis full duration json was not found - %s' % (redis_anomaly_json))

        # @added 20161209 - Branch #922: ionosphere
        #                   Task #1658: Patterning Skyline Ionosphere
        # Use SQLAlchemy, mysql.connector is still upstairs ^^ but starting the
        # move to SQLAlchemy now that all the webapp Ionosphere SQLAlchemy
        # patterns work and the database layout is defined, we can begin on the
        # data side.  Ionosphere was put together backwards, like tsfresh was
        # learnt.  It was the people input first here in many ways, which is
        # exactly how it was supposed to be.
        # This is now the Ionosphere meat.
        # Get a MySQL engine only if not training_metric
        if not training_metric:
            if not metrics_id:
                logger.error('error :: metric id not known')
                fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
                if engine:
                    engine_disposal(engine)
                return False

            # @added 20170101 - Feature #1836: ionosphere - local features profiles disk cache
            # Cache fp ids for 300 seconds?

            # @added 20170804 - Bug #2130: MySQL - Aborted_clients
            # Set a conditional here to only get_an_engine if no engine, this
            # is probably responsible for the Aborted_clients, as it would have
            # left the acquired engine orphaned
            # Testing on skyline-dev-3-40g-gra1 Fri Aug  4 16:08:14 UTC 2017
            if not engine:
                logger.info('getting MySQL engine')
                try:
                    engine, log_msg, trace = get_an_engine()
                    logger.info(log_msg)
                except:
                    logger.error(traceback.format_exc())
                    logger.error('error :: could not get a MySQL engine to get fp_ids')

            if not engine:
                logger.error('error :: engine not obtained to get fp_ids')

            try:
                ionosphere_table, log_msg, trace = ionosphere_table_meta(skyline_app, engine)
                logger.info(log_msg)
                logger.info('ionosphere_table OK')
            except:
                logger.error(traceback.format_exc())
                logger.error('error :: failed to get ionosphere_table meta for %s' % base_name)

            # Determine the fp_ids that exist for the metric
            fp_ids = []
            fp_ids_found = False

            # @added 20170108 - Feature #1842: Ionosphere - Graphite now graphs
            # Added all_fp_ids so that we can handle multiple durations and not
            # error, and reminds me of the needed metrics by FULL_DURATION
            # ionosphere.analyzer.unique_metrics (at FULL_DURATION)
            # ionosphere.mirage.unique_metrics (NOT at FULL_DURATION)
            all_fp_ids = []

            # @added 20170115 - Feature #1854: Ionosphere learn - generations
            # Create the fp_ids_db_object so it is available to determine all
            # the details of all features profiles for the metric, this has all
            # the generations values available in it.
            # Here we go! Learn!
            # @modified 20170308 - Feature #1960: ionosphere_layers
            # Not currently used - fp_ids_db_object
            # fp_ids_db_object = None

            # @added 20170306 - Feature #1960: ionosphere_layers
            # Here we go, let us TEACH you properly.
            # Set result to None here to fix an interpolation error below
            result = None
            fp_layers_ids = []
            fp_layers_present = False

            # @added 20190326 - Feature #2484: FULL_DURATION feature profiles
            # After the features profile evaluations this fps_db_object will
            # be used to determine what settings.FULL_DURATION features
            # profiles need to be created for ionosphere_echo
            fps_db_object = None

            # @added 20190919 - Feature #2484: FULL_DURATION feature profiles
            # Set both fp_count_with_echo and fp_count to 0 initially so that
            # if there are echo fps, then the database can be updated with the
            # fp_count_with_echo value for fp_count in the ionosphere_matched
            # table
            fp_count = 0
            fp_count_with_echo = 0

            try:
                connection = engine.connect()
                # @modified 20180715 - Task #2446: Optimize Ionosphere
                #                      Branch #2270: luminosity
                # Order by the latest features profile, this also results in the
                # layers ids being ordered by latest too.
                # stmt = select([ionosphere_table]).where(ionosphere_table.c.metric_id == metrics_id)
                stmt = select([ionosphere_table]).where(
                    ionosphere_table.c.metric_id == metrics_id).order_by(
                        desc(ionosphere_table.c.id))
                result = connection.execute(stmt)

                # @added 20190326 - Feature #2484: FULL_DURATION feature profiles
                # To be used for ionosphere_echo
                fps_db_object = [{column: value for column, value in rowproxy.items()} for rowproxy in result]

                # for row in result:
                for row in fps_db_object:
                    if row['enabled'] != 1:
                        continue
                    if row['deleted'] == 1:
                        continue
                    fp_id = row['id']

                    # @added 20170306 - Feature #1960: ionosphere_layers
                    # Here we go, let us TEACH you properly
                    fp_layers_id = int(row['layers_id'])
                    if fp_layers_id > 0:
                        fp_layers_present = True

                    # @modified 20181013 - Feature #2430: Ionosphere validate learnt features profiles page
                    # Only add the fp_layers_id if > 0
                    # fp_layers_ids.append(fp_layers_id)
                    if fp_layers_id > 0:
                        if fp_layers_id not in fp_layers_ids:
                            fp_layers_ids.append(fp_layers_id)

                    # @added 20170108 - Feature #1842: Ionosphere - Graphite now graphs
                    # Added all_fp_ids
                    all_fp_ids.append(int(fp_id))

                    if int(row['full_duration']) == int(full_duration):
                        # @modified 20170116 - Feature #1854: Ionosphere learn - generations
                        # Handle ionosphere_learn
                        if added_by != 'ionosphere_learn':
                            fp_ids.append(int(fp_id))
                            logger.info('using fp id %s matched full_duration %s - %s' % (str(fp_id), str(full_duration), base_name))
                        else:
                            # @added 20170116 - Feature #1854: Ionosphere learn - generations
                            # If this is added_by ionosphere_learn the id is only
                            # added if the use_full_duration_days features profile
                            # is less than max_generations, as if it is at the max
                            # then a new features profile cannot be created from it
                            # even if it were to match.  Ionosphere learn is
                            # limited here on generation.
                            # Set the default as max e.g. not allowed
                            current_fp_generation = int(metric_max_generations)
                            try:
                                current_fp_generation = row['generation']
                                if int(current_fp_generation) < int(metric_max_generations):
                                    fp_ids.append(int(fp_id))
                                    logger.info(
                                        'valid ionosphere_learn generation %s - fp id %s matched full_duration %s - %s' % (
                                            str(current_fp_generation), str(fp_id),
                                            str(full_duration), base_name))
                                else:
                                    logger.info(
                                        'ionosphere_learn cannot check as the max_generations of %s would be exceeded, current generation %s - fp id %s matched full_duration %s - %s' % (
                                            str(metric_max_generations),
                                            str(current_fp_generation), str(fp_id),
                                            str(full_duration), base_name))
                            except:
                                logger.error(traceback.format_exc())
                                logger.error(
                                    'error :: ionosphere_learn check could not determine the fp generation of fp id %s from the row object for %s' % (
                                        str(fp_id), base_name))
                    else:
                        logger.info('not using fp id %s not matched full_duration %s - %s' % (str(fp_id), str(full_duration), base_name))

                    # @added 20170115 - Feature #1854: Ionosphere learn - generations
                    # Create the fp_ids_db_object so it is available throughout
                    # Here we go! Learn!
                    # @modified 20170308 - Feature #1960: ionosphere_layers
                    # Not currently used - fp_ids_db_object
                    # fp_ids_db_object = row

                connection.close()
                fp_count = len(fp_ids)
                logger.info('determined %s fp ids for %s' % (str(fp_count), base_name))

                # @added 20170309 - Feature #1960: ionosphere_layers
                fp_layers_count = len(fp_layers_ids)
                logger.info('determined %s layers ids for %s' % (str(fp_layers_count), base_name))
            except:
                logger.error(traceback.format_exc())
                logger.error('error :: could not determine fp ids from DB for %s' % base_name)
                fp_count = 0
                # @added 20170309 - Feature #1960: ionosphere_layers
                fp_layers_count = 0

            # @added 20170306 - Feature #1960: ionosphere_layers
            # Corrected the interpolation of the fp_ids_db_object above where it
            # was set to the last row only, however it was not used anyway.
            # Here we go, let us TEACH you properly.  We only evaluate
            # @modified 20170308 - Feature #1960: ionosphere_layers
            # Not currently used - fp_ids_db_object
            # if result:
            #     fp_ids_db_object = result

            if len(fp_ids) == 0:
                logger.info('there are no fp ids that match full duration for %s' % base_name)
            else:
                fp_ids_found = True

            if not fp_ids_found:
                logger.info('no fp ids were found for %s at %s' % (base_name, str(full_duration)))
                # @modified 20170108 - Feature #1842: Ionosphere - Graphite now graphs
                # Use all_fp_ids so that we can handle multiple durations
                # fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
                if len(all_fp_ids) == 0:
                    logger.error('error :: Ionosphere is enabled on %s but has no feature_profiles' % (base_name))
                    fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
                else:
                    self.remove_metric_check_file(str(metric_check_file))
                if engine:
                    engine_disposal(engine)
                return

        # @added 20161221 - TODO: why not calculate the features of every
        # anomaly so that the user does not have to do it and wait for the
        # features to be calculated.
        # Check the features were calculated by the webapp
        calculated_feature_file = '%s/%s.tsfresh.input.csv.features.transposed.csv' % (metric_training_data_dir, base_name)
        calculated_feature_file_found = False
        if os.path.isfile(calculated_feature_file):
            logger.info('calculated features available - %s' % (calculated_feature_file))
            calculated_feature_file_found = True
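
        # A hypothetical example of the transposed tsfresh features file path
        # checked above, for a training data dir of
        # <IONOSPHERE_DATA_FOLDER>/1548086400/stats/example/requests:
        #
        #     .../stats/example/requests/stats.example.requests.tsfresh.input.csv.features.transposed.csv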
        if added_by == 'ionosphere_learn':
            if not calculated_feature_file_found:
                logger.error('error :: no ionosphere_learn calculated_feature_file found - %s' % calculated_feature_file)
                fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
                if engine:
                    engine_disposal(engine)
                return

        if not calculated_feature_file_found:
            if training_metric:
                # Allow time for the anomaly Graphite alert resources to be
                # created.  If an alert was not sent, the features do not
                # need to be calculated.
                check_time = int(time())
                check_age = check_time - int(added_at)
                if check_age < 5:
                    sleep(5)
                graphite_file_count = len([f for f in os.listdir(metric_training_data_dir)
                                           if f.endswith('.png') and
                                           os.path.isfile(os.path.join(metric_training_data_dir, f))])
                if graphite_file_count == 0:
                    logger.info('not calculating features - no anomaly Graphite alert resources created in %s' % (metric_training_data_dir))
                    self.remove_metric_check_file(str(metric_check_file))
                    if engine:
                        engine_disposal(engine)
                    return
                else:
                    logger.info('anomaly Graphite alert resources found in %s' % (metric_training_data_dir))

        context = skyline_app
        f_calc = None
        if not calculated_feature_file_found:
            try:
                fp_csv, successful, fp_exists, fp_id, log_msg, traceback_format_exc, f_calc = calculate_features_profile(skyline_app, metric_timestamp, base_name, context)
            except:
                logger.error(traceback.format_exc())
                logger.error('error :: failed to calculate features')
                fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
                if engine:
                    engine_disposal(engine)
                return

        if os.path.isfile(calculated_feature_file):
            logger.info('calculated features available - %s' % (calculated_feature_file))
            calculated_feature_file_found = True
            if f_calc:
                send_metric_name = '%s.features_calculation_time' % skyline_app_graphite_namespace
                f_calc_time = '%.2f' % float(f_calc)
                try:
                    send_graphite_metric(skyline_app, send_metric_name, f_calc_time)
                except:
                    logger.error(traceback.format_exc())
                    logger.error('error :: failed to send the features calculation time to Graphite')

        if training_metric:
            logger.info('training metric done')
            self.remove_metric_check_file(str(metric_check_file))
            # TODO: make ionosphere more useful, compare any other
            # available training_metric profiles here and match, not in the
            # db context, in the training context.
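            # Illustrative example (metric name hypothetical, path pattern
            # from the code above): for a base_name of 'stats.web01.cpu.user'
            # the calculated_feature_file resolves to
            # <metric_training_data_dir>/stats.web01.cpu.user.tsfresh.input.csv.features.transposed.csv
            # and f_calc, when returned by calculate_features_profile, is the
            # features calculation time in seconds, shipped to Graphite under
            # the skyline_app_graphite_namespace.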
            if engine:
                engine_disposal(engine)
            return

        if not calculated_feature_file_found:
            logger.error('error :: calculated features file not available - %s' % (calculated_feature_file))
            fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
            if engine:
                engine_disposal(engine)
            return

        # @modified 20161213 - Branch #1790: test_tsfresh
        # TODO: Match the test_tsfresh method
        # Create an array of the calculated features
        calculated_features = []
        if calculated_feature_file_found:
            calculated_features = get_calculated_features(calculated_feature_file)
        if len(calculated_features) == 0:
            logger.error('error :: no calculated features were determined from - %s' % (calculated_feature_file))
            fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
            if engine:
                engine_disposal(engine)
            return
        else:
            logger.info('%s calculated features determined' % (str(len(calculated_features))))

        # @added 20180715 - Task #2446: Optimize Ionosphere
        #                   Branch #2270: luminosity
        fp_checked = 0
        # @modified 20181014 - Feature #2430: Ionosphere validate learnt features profiles page
        # layers_checked = 0
        layers_checked_count = 0

        # @added 20190314 - Feature #2484: FULL_DURATION feature profiles
        # Here we add the bifurcation to also create a features profile at
        # FULL_DURATION for all Mirage metrics, with a view to increasing the
        # number of matches trained metrics achieve by also allowing for the
        # creation and comparison of the FULL_DURATION features profiles as
        # well.
        echo_check = False
        echo_calculated_feature_file = False
        echo_calculated_feature_file_found = False
        echo_calculated_features = []
        echo_fp_ids = []
        echo_anomalous_timeseries = None
        fp_count_with_echo = fp_count
        if added_by == 'mirage':
            try:
                echo_enabled = settings.IONOSPHERE_ECHO_ENABLED
            except:
                echo_enabled = False
            if echo_enabled:
                echo_check = True

        # @added 20190403 - Bug #2904: Initial Ionosphere echo load and Ionosphere feedback
        #                   Feature #2484: FULL_DURATION feature profiles
        # If there are more than 4 metric check files, alternate between normal
        # Ionosphere Mirage features profile checks and Ionosphere echo features
        # profile checks.
        if echo_check:
            if ionosphere_busy:
                # Check the ionosphere_echo metric Redis keys to see which check
                # to run, ionosphere or ionosphere_echo.  If Ionosphere is busy,
                # Ionosphere will alternate between the normal Ionosphere
                # features profiles (Mirage duration) and the Ionosphere echo
                # features profiles (FULL_DURATION) comparison.
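                # Illustrative summary of the alternation implemented below
                # (key names from the code, behaviour paraphrased):
                #   neither key exists         -> run Mirage fp checks only, create the ionosphere key
                #   ionosphere_echo key exists -> run Mirage fp checks only, create the ionosphere key, delete the echo key
                #   ionosphere key exists      -> run echo fp checks only, create the echo key, delete the ionosphere key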
                echo_ionosphere_check_cache_key = 'ionosphere_echo.ionosphere.check.%s' % base_name
                echo_ionosphere_check_key = False
                try:
                    echo_ionosphere_check_key = self.redis_conn.get(echo_ionosphere_check_cache_key)
                except Exception as e:
                    logger.error('error :: could not query Redis for cache_key: %s' % e)
                echo_ionosphere_echo_check_cache_key = 'ionosphere_echo.echo.check.%s' % base_name
                echo_ionosphere_echo_check_key = False
                try:
                    echo_ionosphere_echo_check_key = self.redis_conn.get(echo_ionosphere_echo_check_cache_key)
                except Exception as e:
                    logger.error('error :: could not query Redis for cache_key: %s' % e)
                create_ionosphere_echo_check_key = False
                remove_ionosphere_echo_check_key = False
                # If neither the ionosphere nor the ionosphere_echo key
                # exists, only check ionosphere
                if not echo_ionosphere_check_key:
                    if not echo_ionosphere_echo_check_key:
                        echo_check = False
                        logger.info('ionosphere_busy - only running normal Mirage feature profiles checks, skipping ionosphere_echo checks')
                        create_ionosphere_echo_check_key = echo_ionosphere_check_cache_key
                # If the ionosphere_echo key exists, only check ionosphere
                if echo_ionosphere_echo_check_key:
                    echo_check = False
                    logger.info('ionosphere_busy - only running normal Mirage feature profiles checks, skipping ionosphere_echo checks')
                    create_ionosphere_echo_check_key = echo_ionosphere_check_cache_key
                    remove_ionosphere_echo_check_key = echo_ionosphere_echo_check_cache_key
                # If the ionosphere key exists, only check ionosphere_echo
                if echo_ionosphere_check_key:
                    echo_check = True
                    logger.info('ionosphere_busy - skipping the normal Mirage feature profiles checks as they were run last time, running ionosphere_echo checks this time')
                    # Remove the Mirage features profiles from the fp_ids
                    fp_ids = []
                    logger.info('ionosphere_busy - removed %s Mirage feature profile ids from fp_ids' % str(fp_count))
                    create_ionosphere_echo_check_key = echo_ionosphere_echo_check_cache_key
                    remove_ionosphere_echo_check_key = echo_ionosphere_check_cache_key
                if remove_ionosphere_echo_check_key:
                    try:
                        self.redis_conn.delete(remove_ionosphere_echo_check_key)
                        logger.info(
                            'deleted Redis check key - %s' % (remove_ionosphere_echo_check_key))
                    except:
                        logger.error(traceback.format_exc())
                        logger.error(
                            'error :: failed to delete Redis check key - %s' % (remove_ionosphere_echo_check_key))
                if create_ionosphere_echo_check_key:
                    try:
                        key_created_at = int(time())
                        self.redis_conn.setex(
                            # @modified 20190412 - Task #2824: Test redis-py upgrade
                            #                      Task #2926: Update dependencies
                            # create_ionosphere_echo_check_key, 300, [key_created_at])
                            create_ionosphere_echo_check_key, 300, key_created_at)
                        logger.info(
                            'created Redis check key - %s' % (create_ionosphere_echo_check_key))
                    except:
                        logger.error(traceback.format_exc())
                        logger.error(
                            'error :: failed to create Redis check key - %s' % (create_ionosphere_echo_check_key))

        if echo_check:
            try:
                if fps_db_object:
                    for row in fps_db_object:
                        if int(row['full_duration']) == int(settings.FULL_DURATION):
                            fp_ids.append(int(row['id']))
                            echo_fp_ids.append(int(row['id']))
                            logger.info('appending ionosphere_echo fp id %s matched full_duration of %s - %s' % (str(row['id']), str(settings.FULL_DURATION), base_name))
                fp_count_with_echo = len(fp_ids)
                echo_fp_count = len(echo_fp_ids)
                if echo_fp_count == 0:
                    echo_check = False
                if echo_fp_count > 0:
                    logger.info('added an additional %s echo fp ids for %s' % (str(echo_fp_count), base_name))
                    logger.info('determined a total of %s fp ids (incl. echo) for %s' % (str(fp_count_with_echo), base_name))
                echo_calculated_feature_file = '%s/%s.echo.tsfresh.input.csv.features.transposed.csv' % (metric_training_data_dir, base_name)
                if os.path.isfile(echo_calculated_feature_file):
                    logger.info('echo calculated features available - %s' % (echo_calculated_feature_file))
                    echo_calculated_feature_file_found = True
                else:
                    use_context = 'ionosphere_echo_check'
                    f_calc = None
                    try:
                        fp_csv, successful, fp_exists, fp_id, log_msg, traceback_format_exc, f_calc = calculate_features_profile(skyline_app, metric_timestamp, base_name, use_context)
                    except:
                        logger.error(traceback.format_exc())
                        logger.error('error :: failed to calculate features')
                    if os.path.isfile(echo_calculated_feature_file):
                        logger.info('echo calculated features available - %s' % (echo_calculated_feature_file))
                        echo_calculated_feature_file_found = True
                echo_calculated_features = []
                if echo_calculated_feature_file_found:
                    try:
                        echo_calculated_features = get_calculated_features(echo_calculated_feature_file)
                    except:
                        # 20190412 - just for debug
                        logger.error(traceback.format_exc())
                        logger.error('error :: ionosphere_echo_check no echo_calculated_features were determined')
                        echo_calculated_features = False
            except:
                logger.error(traceback.format_exc())
                logger.error('error :: failed to process echo')

        # Compare the calculated features to the feature values for each fp id
        not_anomalous = False
        if calculated_feature_file_found:
            for fp_id in fp_ids:
                if not metrics_id:
                    logger.error('error :: metric id not known')
                    fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))
                    if engine:
                        engine_disposal(engine)
                    return False

                # @added 20190404 - Bug #2904: Initial Ionosphere echo load and Ionosphere feedback
                #                   Feature #2484: FULL_DURATION feature profiles
                # If the Ionosphere features profile checks are approaching the
                # ionosphere_max_runtime, skip the remaining checks.
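                # Illustrative example (runtime value assumed, logic from the
                # code below): with an ionosphere_max_runtime of 120 seconds
                # the tolerance is 115 seconds, so a check that has already
                # been running for 116 seconds breaks out of the fp_ids loop
                # rather than starting another features comparison.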
                time_now_check = int(time())
                # Allow 5 seconds for layers checks to be done
                max_runtime_tolerance = ionosphere_max_runtime - 5
                running_for = time_now_check - check_process_start
                if running_for >= max_runtime_tolerance:
                    logger.info('features profile checks have been running for %s seconds, the ionosphere_max_runtime is about to be breached, skipping remaining features profile checks' % str(running_for))
                    break

                # @added 20190327 - Feature #2484: FULL_DURATION feature profiles
                check_type = 'ionosphere'
                if echo_check:
                    for echo_fp_id in echo_fp_ids:
                        if fp_id == echo_fp_id:
                            check_type = 'ionosphere_echo_check'
                if check_type == 'ionosphere_echo_check':
                    if not echo_calculated_features:
                        continue

                # @added 20180715 - Task #2446: Optimize Ionosphere
                #                   Branch #2270: luminosity
                fp_checked += 1

                # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                # Use a Redis set instead of Manager().list to reduce memory
                # self.features_profiles_checked.append(fp_id)
                redis_set = 'ionosphere.features_profiles_checked'
                data = str(fp_id)
                try:
                    self.redis_conn.sadd(redis_set, data)
                except:
                    logger.info(traceback.format_exc())
                    logger.error('error :: failed to add %s to Redis set %s' % (
                        str(data), str(redis_set)))

                features_count = None
                fp_features = []
                # Get the features for the fp_id from the z_fp_<metric_id>
                # table where the features profile has the same full_duration
                metric_fp_table = 'z_fp_%s' % str(metrics_id)

                # @added 20170804 - Bug #2130: MySQL - Aborted_clients
                # Set a conditional here to only get_an_engine if no engine, this
                # is probably responsible for the Aborted_clients, as it would have
                # left the acquired engine orphaned
                # Testing on skyline-dev-3-40g-gra1 Fri Aug 4 16:08:14 UTC 2017
                if not engine:
                    try:
                        engine, log_msg, trace = get_an_engine()
                    except:
                        logger.error(traceback.format_exc())
                        logger.error('error :: could not get a MySQL engine for feature_id and values from %s' % metric_fp_table)
                if not engine:
                    logger.error('error :: engine not obtained for feature_id and values from %s' % metric_fp_table)

                # @added 20170809 - Task #2132: Optimise Ionosphere DB usage
                # First check to determine if the fp_id has data in memcache
                # before querying the database
                fp_id_feature_values = None
                if settings.MEMCACHE_ENABLED:
                    fp_id_feature_values_key = 'fp.id.%s.feature.values' % str(fp_id)
                    try:
                        fp_id_feature_values = self.memcache_client.get(fp_id_feature_values_key)
                        # if memcache does not have the key the response to the
                        # client is None, it does not except
                    except:
                        logger.error('error :: failed to get %s from memcache' % fp_id_feature_values_key)
                        try:
                            self.memcache_client.close()
                        except:
                            # @modified 20170913 - Task #2160: Test skyline with bandit
                            # pass
                            logger.error('error :: failed to close memcache_client')
                    if fp_id_feature_values:
                        fp_features = literal_eval(fp_id_feature_values)
                        logger.info('using memcache %s key data' % fp_id_feature_values_key)

                if not fp_features:
                    try:
                        # @modified 20170913 - Task #2160: Test skyline with bandit
                        # Added nosec to exclude from bandit tests
                        stmt = 'SELECT feature_id, value FROM %s WHERE fp_id=%s' % (metric_fp_table, str(fp_id))  # nosec
                        connection = engine.connect()
                        for row in engine.execute(stmt):
                            fp_feature_id = int(row['feature_id'])
                            fp_value = float(row['value'])
                            fp_features.append([fp_feature_id, fp_value])
                        connection.close()
                        features_count = len(fp_features)
                        logger.info('determined %s features for fp_id %s' % (str(features_count), str(fp_id)))
                    except:
                        logger.error(traceback.format_exc())
                        logger.error('error :: could not determine feature_id, value from %s' % metric_fp_table)
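                # Illustrative sketch (key name from the code above, value
                # shape inferred from the literal_eval and append calls): the
                # memcache key 'fp.id.<fp_id>.feature.values' holds the string
                # representation of a list of [feature_id, value] pairs, e.g.
                # '[[1, 0.0], [2, 1024.5]]', so a cache hit avoids the SELECT
                # from the z_fp_<metric_id> table entirely.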
                if fp_features and settings.MEMCACHE_ENABLED:
                    fp_id_feature_values_key = 'fp.id.%s.feature.values' % str(fp_id)
                    try:
                        self.memcache_client.set(fp_id_feature_values_key, fp_features)
                        logger.info('populated memcache %s key' % fp_id_feature_values_key)
                    except:
                        logger.error('error :: failed to set %s in memcache' % fp_id_feature_values_key)

                # @added 20170809 - Task #2132: Optimise Ionosphere DB usage
                if settings.MEMCACHE_ENABLED:
                    try:
                        self.memcache_client.close()
                    except:
                        # @modified 20170913 - Task #2160: Test skyline with bandit
                        # pass
                        logger.error('error :: failed to close memcache_client')

                # @added 20170107 - Feature #1852: Ionosphere - features_profile matched graphite graphs
                #                   Feature #1844: ionosphere_matched DB table
                # Added the calculated features sum for verification purposes
                all_calc_features_sum_list = []

                # @added 20190327 - Feature #2484: FULL_DURATION feature profiles
                if check_type == 'ionosphere':
                    use_calculated_features = calculated_features
                if check_type == 'ionosphere_echo_check':
                    use_calculated_features = echo_calculated_features

                # @modified 20190327 - Feature #2484: FULL_DURATION feature profiles
                # Bifurcate for ionosphere_echo_check
                # for feature_name, calc_value in calculated_features:
                for feature_name, calc_value in use_calculated_features:
                    all_calc_features_sum_list.append(float(calc_value))
                all_calc_features_sum = sum(all_calc_features_sum_list)

                # Convert the feature names in calculated_features to their ids
                logger.info('converting tsfresh feature names to Skyline feature ids')
                calc_features_by_id = []
                # @modified 20190327 - Feature #2484: FULL_DURATION feature profiles
                # Bifurcate for ionosphere_echo_check
                # for feature_name, calc_value in calculated_features:
                for feature_name, calc_value in use_calculated_features:
                    for skyline_feature_id, name in TSFRESH_FEATURES:
                        if feature_name == name:
                            calc_features_by_id.append([skyline_feature_id, float(calc_value)])

                # Determine what features each data set has, extract only the
                # values for the common features.
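                # Illustrative sketch (id and name hypothetical):
                # TSFRESH_FEATURES maps tsfresh feature names to stable
                # Skyline feature ids, e.g. a (skyline_feature_id, name) pair
                # of (1, 'value__abs_energy'), so a calculated
                # ('value__abs_energy', 123.4) entry becomes [1, 123.4] in
                # calc_features_by_id.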
                logger.info('determining common features')
                relevant_fp_feature_values = []
                relevant_calc_feature_values = []
                for skyline_feature_id, calc_value in calc_features_by_id:
                    for fp_feature_id, fp_value in fp_features:
                        if skyline_feature_id == fp_feature_id:
                            relevant_fp_feature_values.append(fp_value)
                            relevant_calc_feature_values.append(calc_value)

                # Determine the sum of each set
                relevant_fp_feature_values_count = len(relevant_fp_feature_values)
                relevant_calc_feature_values_count = len(relevant_calc_feature_values)
                if relevant_fp_feature_values_count != relevant_calc_feature_values_count:
                    logger.error('error :: mismatch in number of common features')
                    logger.error('error :: relevant_fp_feature_values_count - %s' % str(relevant_fp_feature_values_count))
                    logger.error('error :: relevant_calc_feature_values_count - %s' % str(relevant_calc_feature_values_count))
                    continue
                else:
                    logger.info('comparing on %s common features' % str(relevant_fp_feature_values_count))

                if relevant_fp_feature_values_count == 0:
                    logger.error('error :: relevant_fp_feature_values_count is zero')
                    continue

                # Determine the sum of each set
                sum_fp_values = sum(relevant_fp_feature_values)
                sum_calc_values = sum(relevant_calc_feature_values)
                logger.info(
                    'sum of the values of the %s common features in features profile - %s' % (
                        str(relevant_fp_feature_values_count), str(sum_fp_values)))
                logger.info(
                    'sum of the values of the %s common features in the calculated features - %s' % (
                        str(relevant_calc_feature_values_count), str(sum_calc_values)))

                # Determine whether each set is positive or negative
                # # if the same carry on
                # # if both negative, make them both positive
                # Sum fp values, Sum calculated - handle negatives like
                # features_sum :: -3389570699080000.0000000000
                fp_sum_array = [sum_fp_values]
                calc_sum_array = [sum_calc_values]
                percent_different = 100
                sums_array = np.array([sum_fp_values, sum_calc_values], dtype=float)
                try:
                    calc_percent_different = np.diff(sums_array) / sums_array[:-1] * 100.
                    percent_different = calc_percent_different[0]
                    logger.info('percent_different between common features sums - %s' % str(percent_different))
                except:
                    logger.error(traceback.format_exc())
                    logger.error('error :: failed to calculate percent_different')
                    continue

                almost_equal = None
                try:
                    np.testing.assert_array_almost_equal(fp_sum_array, calc_sum_array)
                    almost_equal = True
                except:
                    almost_equal = False

                if almost_equal:
                    not_anomalous = True
                    # @modified 20170118 - Bug #1860: Debug learn not matched in ionosphere
                    # This broke it, no variable was interpolated
                    # logger.info('common features sums are almost equal, not anomalous' % str(relevant_fp_feature_values_count))
                    logger.info('common features sums are almost equal, not anomalous')

                # @added 20161229 - Feature #1830: Ionosphere alerts
                # Update the features profile checked count and time
                logger.info('updating checked details in db for %s' % (str(fp_id)))
                # update matched_count in ionosphere_table
                checked_timestamp = int(time())

                # @added 20170804 - Bug #2130: MySQL - Aborted_clients
                # Set a conditional here to only get_an_engine if no engine, this
                # is probably responsible for the Aborted_clients, as it would have
                # left the acquired engine orphaned
                # Testing on skyline-dev-3-40g-gra1 Fri Aug 4 16:08:14 UTC 2017
                if not engine:
                    try:
                        engine, log_msg, trace = get_an_engine()
                    except:
                        logger.error(traceback.format_exc())
                        logger.error('error :: could not get a MySQL engine to update checked details in db for %s' % (str(fp_id)))
                if not engine:
                    logger.error('error :: engine not obtained to update checked details in db for %s' % (str(fp_id)))

                try:
                    connection = engine.connect()
                    connection.execute(
                        ionosphere_table.update(
                            ionosphere_table.c.id == fp_id).
                        values(checked_count=ionosphere_table.c.checked_count + 1,
                               last_checked=checked_timestamp))
                    connection.close()
                    logger.info('updated checked_count for %s' % str(fp_id))
                except:
                    logger.error(traceback.format_exc())
                    logger.error('error :: could not update checked_count and last_checked for %s ' % str(fp_id))

                # if diff_in_sums <= 1%:
                if percent_different < 0:
                    new_pdiff = percent_different * -1
                    percent_different = new_pdiff

                # @added 20190327 - Feature #2484: FULL_DURATION feature profiles
                # Bifurcate for ionosphere_echo_check
                if check_type == 'ionosphere':
                    use_percent_similar = float(settings.IONOSPHERE_FEATURES_PERCENT_SIMILAR)
                if check_type == 'ionosphere_echo_check':
                    try:
                        use_percent_similar = float(settings.IONOSPHERE_ECHO_FEATURES_PERCENT_SIMILAR)
                    except:
                        use_percent_similar = 2.0

                # @modified 20190327 - Feature #2484: FULL_DURATION feature profiles
                # Bifurcate for ionosphere_echo_check
                # if percent_different < settings.IONOSPHERE_FEATURES_PERCENT_SIMILAR:
                if percent_different < use_percent_similar:
                    not_anomalous = True
                    # log
                    logger.info('not anomalous - features profile match - %s' % base_name)
                    logger.info(
                        'calculated features sum are within %s percent of fp_id %s with %s, not anomalous' % (
                            str(use_percent_similar), str(fp_id),
                            str(percent_different)))
                    if check_type == 'ionosphere_echo_check':
                        logger.info('ionosphere_echo_check - not anomalous with fp id %s for %s' % (str(fp_id), base_name))

                # @added 20180617 - Feature #2404: Ionosphere - fluid approximation
                # Now if not matched use Min-Max scaling as per
                # http://sebastianraschka.com/Articles/2014_about_feature_scaling.html#numpy
                # Min-Max scale the fp time series from the z_ts_<metric_id>
                # table SELECT WHERE fp_id, or from memcache, to create
                # minmax_fp_ts
                # Min-Max scale the current time series to create minmax_anomalous_ts
                # Create features profiles for minmax_fp_ts
                # Create features profiles for minmax_anomalous_ts
                try:
                    minmax_scaling_enabled = settings.IONOSPHERE_MINMAX_SCALING_ENABLED
                except:
                    minmax_scaling_enabled = False
                minmax_not_anomalous = False
                minmax_check = False
                minmax = 0
                if not not_anomalous:
                    if minmax_scaling_enabled:
                        minmax_check = True
                if added_by == 'ionosphere_learn' and minmax_check:
                    minmax_check = False
                    logger.info('ionosphere_learn job not minmax scaling')

                if minmax_check:
                    logger.info('running minmax scaling')
                    # First check to determine if the z_ts_<metric_id> for the fp
                    # has data in memcache before querying the database
                    metric_fp_ts_table = 'z_ts_%s' % str(metrics_id)
                    fp_id_metric_ts = []
                    if settings.MEMCACHE_ENABLED:
                        fp_id_metric_ts_key = 'fp.%s.%s.ts' % (str(fp_id), str(metrics_id))
                        try:
                            fp_id_metric_ts_object = self.memcache_client.get(fp_id_metric_ts_key)
                            # if memcache does not have the key the response to the
                            # client is None, it does not except
                        except:
                            logger.error('error :: failed to get %s from memcache' % fp_id_metric_ts_key)
                            try:
                                self.memcache_client.close()
                            except:
                                logger.error('error :: failed to close memcache_client')
                        if fp_id_metric_ts_object:
                            fp_id_metric_ts = literal_eval(fp_id_metric_ts_object)
                            logger.info('used memcache %s key data to populate fp_id_metric_ts with %s data points' % (fp_id_metric_ts_key, str(len(fp_id_metric_ts))))
                        else:
                            logger.info('no memcache %s key data, will use the database' % fp_id_metric_ts_key)

                    if not fp_id_metric_ts:
                        if LOCAL_DEBUG:
                            logger.debug('debug :: getting data from the %s database table for fp id %s to populate the fp_id_metric_ts list' % (metric_fp_ts_table, str(fp_id)))
                        try:
                            stmt = 'SELECT timestamp, value FROM %s WHERE fp_id=%s' % (metric_fp_ts_table, str(fp_id))  # nosec
                            connection = engine.connect()
                            for row in engine.execute(stmt):
                                fp_id_ts_timestamp = int(row['timestamp'])
                                fp_id_ts_value = float(row['value'])
                                fp_id_metric_ts.append([fp_id_ts_timestamp, fp_id_ts_value])
                            connection.close()
                            values_count = len(fp_id_metric_ts)
                            logger.info('determined %s values for the fp_id time series %s for %s' % (str(values_count), str(fp_id), str(base_name)))
                        except:
                            logger.error(traceback.format_exc())
                            logger.error('error :: could not determine timestamps and values from %s' % metric_fp_ts_table)
                        if fp_id_metric_ts and settings.MEMCACHE_ENABLED:
                            fp_id_metric_ts_key = 'fp.%s.%s.ts' % (str(fp_id), str(metrics_id))
                            try:
                                self.memcache_client.set(fp_id_metric_ts_key, fp_id_metric_ts)
                                logger.info('populated memcache %s key' % fp_id_metric_ts_key)
                            except:
                                logger.error('error :: failed to set %s in memcache' % fp_id_metric_ts_key)
                            try:
                                self.memcache_client.close()
                            except:
                                logger.error('error :: failed to close memcache_client')

                    # Get the anomalous time series
                    anomalous_ts_values_count = 0
                    if fp_id_metric_ts:
                        anomalous_timeseries_not_defined = True
                        try:
                            test_anomalous_timeseries = anomalous_timeseries
                            if len(test_anomalous_timeseries) > 0:
                                anomalous_timeseries_not_defined = False
                        except:
                            logger.info('anomalous_timeseries is not defined, loading from the anomaly json')
                        timeseries_dir = base_name.replace('.', '/')
                        metric_data_dir = '%s/%s/%s' % (
                            settings.IONOSPHERE_DATA_FOLDER, metric_timestamp,
                            timeseries_dir)
                        anomaly_json = '%s/%s.json' % (metric_data_dir, base_name)
                        # @added 20190327 - Feature #2484: FULL_DURATION feature profiles
                        # Bifurcate for ionosphere_echo_check
                        if check_type == 'ionosphere_echo_check':
                            anomaly_json = redis_anomaly_json
                            if not echo_anomalous_timeseries:
                                try:
                                    with open((redis_anomaly_json), 'r') as f:
                                        raw_timeseries = f.read()
                                    timeseries_array_str = str(raw_timeseries).replace('(', '[').replace(')', ']')
                                    del raw_timeseries
                                    echo_anomalous_timeseries = literal_eval(timeseries_array_str)
                                    del timeseries_array_str
                                    if len(echo_anomalous_timeseries) > 0:
                                        logger.info('echo_anomalous_timeseries was populated from the anomaly json %s with %s data points for creating the minmax_anomalous_ts' % (redis_anomaly_json, str(len(echo_anomalous_timeseries))))
                                    else:
                                        logger.error('error :: echo_anomalous_timeseries for minmax_anomalous_ts is not populated from the anomaly json - %s' % redis_anomaly_json)
                                except:
                                    logger.error(traceback.format_exc())
                                    logger.error('error :: could not create echo_anomalous_timeseries from the anomaly json %s' % redis_anomaly_json)
                            else:
                                logger.info('echo_anomalous_timeseries has %s data points for creating the minmax_anomalous_ts' % (str(len(echo_anomalous_timeseries))))

                        # @modified 20190327 - Feature #2484: FULL_DURATION feature profiles
                        # if anomalous_timeseries_not_defined:
                        if anomalous_timeseries_not_defined and check_type == 'ionosphere':
                            try:
                                with open((anomaly_json), 'r') as f:
                                    raw_timeseries = f.read()
                                timeseries_array_str = str(raw_timeseries).replace('(', '[').replace(')', ']')
                                del raw_timeseries
                                anomalous_timeseries = literal_eval(timeseries_array_str)
                                del timeseries_array_str
                                if len(anomalous_timeseries) > 0:
                                    logger.info('anomalous_timeseries was populated from the anomaly json %s with %s data points for creating the minmax_anomalous_ts' % (anomaly_json, str(len(anomalous_timeseries))))
                                else:
                                    logger.error('error :: anomalous_timeseries for minmax_anomalous_ts is not populated from the anomaly json - %s' % anomaly_json)
                            except:
                                logger.error(traceback.format_exc())
                                logger.error('error :: could not create anomalous_timeseries from the anomaly json %s' % anomaly_json)
                        else:
                            if check_type == 'ionosphere':
                                logger.info('anomalous_timeseries has %s data points for creating the minmax_anomalous_ts' % (str(len(anomalous_timeseries))))

                        # @added 20190327 - Feature #2484: FULL_DURATION feature profiles
                        if check_type == 'ionosphere':
                            use_anomalous_timeseries = anomalous_timeseries
                        if check_type == 'ionosphere_echo_check':
                            use_anomalous_timeseries = echo_anomalous_timeseries
                        anomalous_ts_values_count = len(use_anomalous_timeseries)

                    # @added 20180621 - Feature #2404: Ionosphere - fluid approximation
                    # Check the ranges and only Min-Max scale if the 2 time
                    # series are similar in range
                    # @added 20180819 - Bug #2534: Ionosphere - fluid approximation - IONOSPHERE_MINMAX_SCALING_RANGE_TOLERANCE on low ranges
                    # TODO
                    try:
                        range_tolerance = settings.IONOSPHERE_MINMAX_SCALING_RANGE_TOLERANCE
                    except:
                        range_tolerance = 0.15
                    range_tolerance_percentage = range_tolerance * 100
                    check_range = False
                    range_similar = False
                    if fp_id_metric_ts:
                        if anomalous_ts_values_count > 0:
                            check_range = True
                    lower_range_similar = False
                    upper_range_similar = False
                    if check_range:
                        try:
                            minmax_fp_values = [x[1] for x in fp_id_metric_ts]
                            min_fp_value = min(minmax_fp_values)
                            max_fp_value = max(minmax_fp_values)
                        except:
                            min_fp_value = False
                            max_fp_value = False
                        try:
                            minmax_anomalous_values = [x2[1] for x2 in use_anomalous_timeseries]
                            min_anomalous_value = min(minmax_anomalous_values)
                            max_anomalous_value = max(minmax_anomalous_values)
                        except:
                            min_anomalous_value = False
                            max_anomalous_value = False
                        lower_range_not_same = True
                        try:
                            try:
                                if int(min_fp_value) == int(min_anomalous_value):
                                    lower_range_not_same = False
                                    lower_range_similar = True
                                    logger.info('min value of fp_id_metric_ts (%s) and anomalous_timeseries (%s) are the same' % (
                                        str(min_fp_value), str(min_anomalous_value)))
                            except:
                                lower_range_not_same = True
                            if min_fp_value and min_anomalous_value and lower_range_not_same:
                                if int(min_fp_value) == int(min_anomalous_value):
                                    lower_range_similar = True
                                    logger.info('min value of fp_id_metric_ts (%s) and anomalous_timeseries (%s) are the same' % (
                                        str(min_fp_value), str(min_anomalous_value)))
                                else:
                                    lower_min_fp_value = int(min_fp_value - (min_fp_value * range_tolerance))
                                    upper_min_fp_value = int(min_fp_value + (min_fp_value * range_tolerance))
                                    if int(min_anomalous_value) in range(lower_min_fp_value, upper_min_fp_value):
                                        lower_range_similar = True
                                        logger.info('min value of fp_id_metric_ts (%s) and anomalous_timeseries (%s) are similar within %s percent of each other' % (
                                            str(min_fp_value),
                                            str(min_anomalous_value),
                                            str(range_tolerance_percentage)))
                            if not lower_range_similar:
                                logger.info('lower range of fp_id_metric_ts (%s) and anomalous_timeseries (%s) are not similar' % (
                                    str(min_fp_value), str(min_anomalous_value)))
                            upper_range_not_same = True
                            try:
                                if int(max_fp_value) == int(max_anomalous_value):
                                    upper_range_not_same = False
                                    upper_range_similar = True
                                    logger.info('max value of fp_id_metric_ts (%s) and anomalous_timeseries (%s) are the same' % (
                                        str(max_fp_value), str(max_anomalous_value)))
                            except:
                                upper_range_not_same = True
                            if max_fp_value and max_anomalous_value and lower_range_similar and upper_range_not_same:
                                # @added 20180717 - Task #2446: Optimize Ionosphere
                                #                   Feature #2404: Ionosphere - fluid approximation
                                # On low values such as 1 and 2, the range_tolerance
                                # should be adjusted to account for the very small
                                # range. TODO
                                lower_max_fp_value = int(max_fp_value - (max_fp_value * range_tolerance))
                                upper_max_fp_value = int(max_fp_value + (max_fp_value * range_tolerance))
                                if int(max_anomalous_value) in range(lower_max_fp_value, upper_max_fp_value):
                                    upper_range_similar = True
                                    logger.info('max value of fp_id_metric_ts (%s) and anomalous_timeseries (%s) are similar within %s percent of each other' % (
                                        str(max_fp_value), str(max_anomalous_value),
                                        str(range_tolerance_percentage)))
                                else:
                                    logger.info('max value of fp_id_metric_ts (%s) and anomalous_timeseries (%s) are not similar' % (
                                        str(max_fp_value), str(max_anomalous_value)))
                        except:
                            logger.error(traceback.format_exc())
                            logger.error('error :: could not calculate range similarity with the current anomalous_timeseries and the fp id %s time series' % (str(fp_id)))
                    if lower_range_similar and upper_range_similar:
                        range_similar = True
                    else:
                        logger.info('the ranges of fp_id_metric_ts and anomalous_timeseries differ significantly, Min-Max scaling will be skipped')

                    minmax_fp_ts = []
                    # if fp_id_metric_ts:
                    if range_similar:
                        if LOCAL_DEBUG:
                            logger.debug('debug :: creating minmax_fp_ts from minmax scaled fp_id_metric_ts')
                        try:
                            minmax_fp_values = [x[1] for x in fp_id_metric_ts]
                            x_np = np.asarray(minmax_fp_values)
                            # Min-Max scaling
                            np_minmax = (x_np - x_np.min()) / (x_np.max() - x_np.min())
                            for (ts, v) in zip(fp_id_metric_ts, np_minmax):
                                minmax_fp_ts.append([ts[0], v])
                            logger.info('minmax_fp_ts list populated with the minmax scaled time series with %s data points' % str(len(minmax_fp_ts)))
                        except:
                            logger.error(traceback.format_exc())
                            logger.error('error :: could not minmax scale fp id %s time series for %s' % (str(fp_id), str(base_name)))
                        if not minmax_fp_ts:
                            logger.error('error :: minmax_fp_ts list not populated')

                    minmax_anomalous_ts = []
                    if minmax_fp_ts:
                        # Only process if they are approximately the same length
                        minmax_fp_ts_values_count = len(minmax_fp_ts)
                        if minmax_fp_ts_values_count - anomalous_ts_values_count in range(-14, 14):
                            try:
                                minmax_anomalous_values = [x2[1] for x2 in use_anomalous_timeseries]
                                x_np = np.asarray(minmax_anomalous_values)
                                # Min-Max scaling
                                np_minmax = (x_np - x_np.min()) / (x_np.max() - x_np.min())
                                for (ts, v) in zip(fp_id_metric_ts, np_minmax):
                                    minmax_anomalous_ts.append([ts[0], v])
                            except:
                                logger.error(traceback.format_exc())
                                logger.error('error :: could not determine np_minmax with the current time series anomalous_timeseries and fp id %s time series' % (str(fp_id)))
                            if len(minmax_anomalous_ts) > 0:
                                logger.info('minmax_anomalous_ts is populated with %s data points' % str(len(minmax_anomalous_ts)))
                            else:
                                logger.error('error :: minmax_anomalous_ts is not populated')
                        else:
                            logger.info('minmax scaled check will be skipped - anomalous_ts_values_count is %s and minmax_fp_ts is %s' % (str(anomalous_ts_values_count), str(minmax_fp_ts_values_count)))

                    minmax_fp_ts_csv = '%s/fpid.%s.%s.minmax_fp_ts.tsfresh.input.std.csv' % (
                        settings.SKYLINE_TMP_DIR, str(fp_id), base_name)
                    minmax_fp_fname_out = minmax_fp_ts_csv + '.transposed.csv'
                    anomalous_ts_csv = '%s/%s.%s.minmax_anomalous_ts.tsfresh.std.csv' % (
                        settings.SKYLINE_TMP_DIR, metric_timestamp, base_name)
                    anomalous_fp_fname_out = anomalous_ts_csv + '.transposed.csv'

                    tsf_settings = ReasonableFeatureExtractionSettings()
                    tsf_settings.disable_progressbar = True
                    minmax_fp_features_sum = None
                    minmax_anomalous_features_sum = None
                    if minmax_anomalous_ts and minmax_fp_ts:
                        if LOCAL_DEBUG:
                            logger.debug('debug :: analyzing minmax_fp_ts and minmax_anomalous_ts')
                        if not os.path.isfile(minmax_fp_ts_csv):
                            if LOCAL_DEBUG:
                                logger.debug('debug :: creating %s from minmax_fp_ts' % minmax_fp_ts_csv)
                            datapoints = minmax_fp_ts
                            converted = []
                            for datapoint in datapoints:
                                try:
                                    new_datapoint = [float(datapoint[0]), float(datapoint[1])]
                                    converted.append(new_datapoint)
                                except:  # nosec
                                    continue
                            del datapoints
                            if LOCAL_DEBUG:
                                if len(converted) > 0:
                                    logger.debug('debug :: converted is populated')
                                else:
                                    logger.debug('debug :: error :: converted is not populated')
                            for ts, value in converted:
                                try:
                                    utc_ts_line = '%s,%s,%s\n' % (base_name, str(int(ts)), str(value))
                                    with open(minmax_fp_ts_csv, 'a') as fh:
                                        fh.write(utc_ts_line)
                                except:
                                    logger.error(traceback.format_exc())
                                    logger.error('error :: could not write to file %s' % (str(minmax_fp_ts_csv)))
                            del converted
                        else:
                            logger.info('file found %s, using for data' % minmax_fp_ts_csv)

                        if not os.path.isfile(minmax_fp_ts_csv):
                            logger.error('error :: file not found %s' % minmax_fp_ts_csv)
                        else:
                            logger.info('file exists to create the minmax_fp_ts data frame from - %s' % minmax_fp_ts_csv)

                        try:
                            df = pd.read_csv(minmax_fp_ts_csv, delimiter=',', header=None, names=['metric', 'timestamp', 'value'])
                            df.columns = ['metric', 'timestamp', 'value']
                        except:
                            logger.error(traceback.format_exc())
                            logger.error('error :: failed to create a data frame from %s' % (str(minmax_fp_ts_csv)))
                        try:
                            df_features = extract_features(
                                df, column_id='metric', column_sort='timestamp',
                                column_kind=None, column_value=None,
                                feature_extraction_settings=tsf_settings)
                        except:
                            logger.error(traceback.format_exc())
                            logger.error('error :: failed to create df_features from %s' % (str(minmax_fp_ts_csv)))
                        del df

                        # Create transposed features csv
                        if not os.path.isfile(minmax_fp_fname_out):
                            # Transpose
                            df_t = df_features.transpose()
                            df_t.to_csv(minmax_fp_fname_out)
                            del df_t
                        else:
                            if LOCAL_DEBUG:
                                logger.debug('debug :: file exists - %s' % minmax_fp_fname_out)
                        try:
                            # Calculate the count and sum of the features values
                            df_sum = pd.read_csv(
                                minmax_fp_fname_out, delimiter=',', header=0,
                                names=['feature_name', 'value'])
                            df_sum.columns = ['feature_name', 'value']
                            df_sum['feature_name'] = df_sum['feature_name'].astype(str)
                            df_sum['value'] = df_sum['value'].astype(float)
                            minmax_fp_features_count = len(df_sum['value'])
                            minmax_fp_features_sum = df_sum['value'].sum()
                            logger.info('minmax_fp_ts - features_count: %s, features_sum: %s' % (str(minmax_fp_features_count), str(minmax_fp_features_sum)))
                        except:
                            logger.error(traceback.format_exc())
                            logger.error('error :: failed to create df_sum from %s' % (str(minmax_fp_fname_out)))

                        if minmax_fp_features_count > 0:
                            if LOCAL_DEBUG:
                                logger.debug('debug :: minmax_fp_features_count of the minmax_fp_ts is %s' % str(minmax_fp_features_count))
                        else:
                            logger.error('error :: minmax_fp_features_count is %s' % str(minmax_fp_features_count))

                        if not os.path.isfile(anomalous_ts_csv):
                            datapoints = minmax_anomalous_ts
                            converted = []
                            for datapoint in datapoints:
                                try:
                                    new_datapoint = [float(datapoint[0]), float(datapoint[1])]
                                    converted.append(new_datapoint)
                                except:  # nosec
                                    continue
                            del datapoints
                            for ts, value in converted:
                                utc_ts_line = '%s,%s,%s\n' % (base_name, str(int(ts)), str(value))
                                with open(anomalous_ts_csv, 'a') as fh:
                                    fh.write(utc_ts_line)
                            del converted

                        df = pd.read_csv(anomalous_ts_csv, delimiter=',', header=None, names=['metric', 'timestamp', 'value'])
                        df.columns = ['metric', 'timestamp', 'value']
                        df_features_current = extract_features(
                            df, column_id='metric', column_sort='timestamp',
                            column_kind=None, column_value=None,
                            feature_extraction_settings=tsf_settings)
                        del df

                        # Create transposed features csv
                        if not os.path.isfile(anomalous_fp_fname_out):
                            # Transpose
                            df_t = df_features_current.transpose()
                            df_t.to_csv(anomalous_fp_fname_out)
                            del df_t

                        # Calculate the count and sum of the features values
                        df_sum_2 = pd.read_csv(
                            anomalous_fp_fname_out, delimiter=',', header=0,
                            names=['feature_name', 'value'])
                        df_sum_2.columns = ['feature_name', 'value']
                        df_sum_2['feature_name'] = df_sum_2['feature_name'].astype(str)
                        df_sum_2['value'] = df_sum_2['value'].astype(float)
                        minmax_anomalous_features_count = len(df_sum_2['value'])
                        minmax_anomalous_features_sum = df_sum_2['value'].sum()
                        logger.info('minmax_anomalous_ts - minmax_anomalous_features_count: %s, minmax_anomalous_features_sum: %s' % (
                            str(minmax_anomalous_features_count),
                            str(minmax_anomalous_features_sum)))

                    if minmax_fp_features_sum and minmax_anomalous_features_sum:
                        percent_different = None
                        try:
                            fp_sum_array = [minmax_fp_features_sum]
                            calc_sum_array = [minmax_anomalous_features_sum]
                            percent_different = 100
                            sums_array = np.array([minmax_fp_features_sum, minmax_anomalous_features_sum], dtype=float)
                            calc_percent_different = np.diff(sums_array) / sums_array[:-1] * 100.
                            percent_different = calc_percent_different[0]
                            logger.info('percent_different between minmax scaled features sums - %s' % str(percent_different))
                        except:
                            logger.error(traceback.format_exc())
                            logger.error('error :: failed to calculate percent_different from minmax scaled features sums')

                        if percent_different:
                            almost_equal = None
                            try:
                                np.testing.assert_array_almost_equal(fp_sum_array, calc_sum_array)
                                almost_equal = True
                            except:
                                almost_equal = False

                            if almost_equal:
                                minmax_not_anomalous = True
                                logger.info('minmax scaled common features sums are almost equal, not anomalous')

                            # if diff_in_sums <= 1%:
                            if percent_different < 0:
                                new_pdiff = percent_different * -1
                                percent_different = new_pdiff

                            # @added 20190327 - Feature #2484: FULL_DURATION feature profiles
                            # Bifurcate for ionosphere_echo_check
                            if check_type == 'ionosphere':
                                mm_use_percent_similar = float(settings.IONOSPHERE_FEATURES_PERCENT_SIMILAR)
                            if check_type == 'ionosphere_echo_check':
                                try:
                                    mm_use_percent_similar = float(settings.IONOSPHERE_ECHO_MINMAX_SCALING_FEATURES_PERCENT_SIMILAR)
                                except:
                                    mm_use_percent_similar = 3.5

                            # @modified 20190327 - Feature #2484: FULL_DURATION feature profiles
                            # if percent_different < settings.IONOSPHERE_FEATURES_PERCENT_SIMILAR:
                            if percent_different < mm_use_percent_similar:
                                minmax_not_anomalous = True
                                # log
                                logger.info('not anomalous - minmax scaled features profile match - %s - %s' % (base_name, str(minmax_not_anomalous)))
                                logger.info(
                                    'minmax scaled calculated features sum are within %s percent of fp_id %s with %s, not anomalous' % (
                                        str(mm_use_percent_similar), str(fp_id),
                                        str(percent_different)))
                                if check_type == 'ionosphere_echo_check':
                                    logger.info('ionosphere_echo_check :: not anomalous - minmax scaled features profile match - %s' % (base_name))

                            if minmax_not_anomalous:
                                not_anomalous = True
                                minmax = 1
                                # Created time series resources for graphing in
                                # the matched page

                    try:
                        if os.path.isfile(minmax_fp_ts_csv):
                            self.remove_metric_check_file(str(minmax_fp_ts_csv))
                    except:
                        pass
                    try:
                        if os.path.isfile(minmax_fp_fname_out):
                            self.remove_metric_check_file(str(minmax_fp_fname_out))
                    except:
                        pass

                # @added 20190327 - Feature #2484: FULL_DURATION feature profiles
                # Clean up the echo files
                if echo_check:
                    echo_calculated_feature_file = '%s/%s.echo.tsfresh.input.csv.features.transposed.csv' % (metric_training_data_dir, base_name)
                    try:
                        if os.path.isfile(echo_calculated_feature_file):
                            self.remove_metric_check_file(str(echo_calculated_feature_file))
                    except:
                        pass
                    echo_features_file = '%s/%s.%s.echo.fp.details.txt' % (metric_training_data_dir, str(metric_timestamp), base_name)
                    try:
                        if os.path.isfile(echo_features_file):
                            self.remove_metric_check_file(str(echo_features_file))
                    except:
                        pass

                # Clean up
                if minmax_check:
                    try:
                        clean_file = anomalous_ts_csv
                        if os.path.isfile(anomalous_ts_csv):
                            self.remove_metric_check_file(str(anomalous_ts_csv))
                        logger.info('cleaned up - %s' % clean_file)
                    except:
                        logger.info('no anomalous_ts_csv file to clean up')
                    try:
                        clean_file = anomalous_fp_fname_out
                        if os.path.isfile(anomalous_fp_fname_out):
                            self.remove_metric_check_file(str(anomalous_fp_fname_out))
                        logger.info('cleaned up - %s' % clean_file)
                    except:
                        logger.info('no anomalous_fp_fname_out file to clean up')

                # END - Feature #2404: Ionosphere - fluid approximation

                if not_anomalous:
                    # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                    # self.not_anomalous.append(base_name)
                    redis_set = 'ionosphere.not_anomalous'
                    data = base_name
                    try:
                        self.redis_conn.sadd(redis_set, data)
                    except:
                        logger.info(traceback.format_exc())
                        logger.error('error :: failed to add %s to Redis set %s' % (
                            str(data), str(redis_set)))

                    # update matched_count in ionosphere_table
                    matched_timestamp = int(time())
                    # @added 20170804 - Bug #2130: MySQL - Aborted_clients
                    # Set a conditional here to only get_an_engine if no engine, this
                    # is probably responsible for the Aborted_clients, as it would have
                    # left the acquired engine orphaned
                    # Testing on skyline-dev-3-40g-gra1 Fri Aug 4 16:08:14 UTC 2017
                    if not engine:
                        try:
                            engine, log_msg, trace = get_an_engine()
                        except:
                            logger.error(traceback.format_exc())
                            logger.error('error :: could not get a MySQL engine to update matched details in db for %s' % (str(fp_id)))
                    if not engine:
                        logger.error('error :: engine not obtained to update matched details in db for %s' % (str(fp_id)))
                    try:
                        connection = engine.connect()
                        connection.execute(
                            ionosphere_table.update(
                                ionosphere_table.c.id == fp_id).
                            values(matched_count=ionosphere_table.c.matched_count + 1,
                                   last_matched=matched_timestamp))
                        connection.close()
                        logger.info('updated matched_count for %s' % str(fp_id))
                    except:
                        logger.error(traceback.format_exc())
                        logger.error('error :: could not update matched_count and last_matched for %s ' % str(fp_id))

                    # @added 20170107 - Feature #1844: ionosphere_matched DB table
                    # Added ionosphere_matched update
                    # @modified 20170804 - Bug #2130: MySQL - Aborted_clients
                    # Set a conditional here to only get_an_engine if no engine, this
                    # is probably responsible for the Aborted_clients, as it would have
                    # left the acquired engine orphaned
                    # Testing on skyline-dev-3-40g-gra1 Fri Aug 4 16:08:14 UTC 2017
                    if not engine:
                        try:
                            engine, log_msg, trace = get_an_engine()
                        except:
                            logger.error(traceback.format_exc())
                            logger.error('error :: could not get a MySQL engine to update ionosphere_matched for %s' % (str(fp_id)))
                    if not engine:
                        logger.error('error :: engine not obtained to update ionosphere_matched for %s' % (str(fp_id)))
                    try:
                        ionosphere_matched_table, log_msg, trace = ionosphere_matched_table_meta(skyline_app, engine)
                        logger.info(log_msg)
                        logger.info('ionosphere_matched_table OK')
                    except:
                        logger.error(traceback.format_exc())
                        logger.error('error :: failed to get ionosphere_matched_table meta for %s' % base_name)

                    # @added 20180620 - Feature #2404: Ionosphere - fluid approximation
                    # Added minmax scaling values
                    if minmax_not_anomalous == 1:
                        minmax_fp_features_sum = float(minmax_fp_features_sum)
                        minmax_fp_features_count = int(minmax_fp_features_count)
                        minmax_anomalous_features_sum = float(minmax_anomalous_features_sum)
                        minmax_anomalous_features_count = int(minmax_anomalous_features_count)
                    else:
                        minmax_fp_features_sum = 0
                        minmax_fp_features_count = 0
                        minmax_anomalous_features_sum = 0
                        minmax_anomalous_features_count = 0

                    # @added 20190919 - Feature #2484: FULL_DURATION feature profiles
                    # If there are additional echo fps then the database can be
                    # updated with the fp_count_with_echo value for fp_count in
                    # the ionosphere_matched table
                    if fp_count_with_echo > fp_count:
                        fp_count = fp_count_with_echo

                    try:
                        connection = engine.connect()
                        # @modified 20170107 - Feature #1852: Ionosphere - features_profile matched graphite graphs
                        #                      Feature #1844: ionosphere_matched DB table
                        # Added all_calc_features_sum, all_calc_features_count,
                        # sum_calc_values, common_features_count, tsfresh_version
                        ins = ionosphere_matched_table.insert().values(
                            fp_id=int(fp_id),
                            metric_timestamp=int(metric_timestamp),
                            all_calc_features_sum=float(all_calc_features_sum),
                            all_calc_features_count=len(all_calc_features_sum_list),
                            sum_common_values=float(sum_calc_values),
                            common_features_count=int(relevant_calc_feature_values_count),
                            tsfresh_version=str(tsfresh_version),
                            # @added 20180620 - Feature #2404: Ionosphere - fluid approximation
                            # Added minmax scaling values
                            minmax=minmax,
                            minmax_fp_features_sum=minmax_fp_features_sum,
                            minmax_fp_features_count=minmax_fp_features_count,
                            minmax_anomalous_features_sum=minmax_anomalous_features_sum,
                            minmax_anomalous_features_count=minmax_anomalous_features_count,
                            # @added 20180715 - Task #2446: Optimize Ionosphere
                            #                   Branch #2270: luminosity
                            fp_count=fp_count, fp_checked=fp_checked)
                        result = connection.execute(ins)
                        connection.close()
                        new_matched_id = result.inserted_primary_key[0]
                        # @modified 20180620 - Feature #2404: Ionosphere - fluid approximation
                        # Added minmax
                        if minmax == 0:
                            logger.info('new ionosphere_matched id: %s' % str(new_matched_id))
                        else:
                            logger.info('new minmax scaled ionosphere_matched id: %s' % str(new_matched_id))
                    except:
                        logger.error(traceback.format_exc())
                        logger.error(
                            'error :: could not update ionosphere_matched for %s with timestamp %s' % (
                                str(fp_id), str(metric_timestamp)))

                    # @added 20170331 - Task #1988: Review - Ionosphere layers - always show layers
                    #                   Feature #1960: ionosphere_layers
                    # Added mirror functionality of the layers_id_matched_file
                    # for feature profile matches too as it has proved useful
                    # in the frontend with regards to training data sets being
                    # matched by layers, and can do the same in the frontend
                    # training data for feature profile matches too.
                    if not_anomalous:
                        profile_id_matched_file = '%s/%s.profile_id_matched.fp_id' % (
                            metric_training_data_dir, base_name)
                        if not os.path.isfile(profile_id_matched_file):
                            try:
                                write_data_to_file(skyline_app, profile_id_matched_file, 'w', str(fp_id))
                                logger.info('added matched fp_id %s - %s' % (
                                    str(fp_id), profile_id_matched_file))
                            except:
                                logger.info(traceback.format_exc())
                                logger.error('error :: failed to add matched fp_id %s - %s' % (
                                    str(fp_id), profile_id_matched_file))

                    # @added 20170115 - Feature #1854: Ionosphere learn - generations
                    # Stop on the first match
                    break

                # https://docs.scipy.org/doc/numpy/reference/generated/numpy.testing.assert_almost_equal.html
                # @added 20161214 - Add a between timeframe option, e.g. if
                # fp match, only see this as not anomalous if hour (and or min)
                # is between x and y - handle rollovers, cron log archives, etc.
                logger.info('debug :: %s is a features profile for %s' % (str(fp_id), base_name))
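        # Illustrative worked example of the comparison above (sums
        # hypothetical, formula from the code): for
        # sums_array = np.array([1000.0, 995.0]),
        #   np.diff(sums_array) / sums_array[:-1] * 100.  ->  [-0.5]
        # so percent_different is -0.5, which is negated to 0.5, and with an
        # IONOSPHERE_FEATURES_PERCENT_SIMILAR of e.g. 1.0 the features
        # profile is deemed a match and not_anomalous is set to True.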
        # @added 20170115 - Feature #1854: Ionosphere learn - generations
        # If this is an ionosphere_learn check then we handle it before
        # the others and exit, and ionosphere_learn uses the Redis work
        # queue.  Here we go! Learn!
        if added_by == 'ionosphere_learn':
            if not_anomalous:
                logger.info('an ionosphere_learn metric has been found to be not anomalous before')

                # @added 20170607 - Feature #2010: Ionosphere learn - rate limiting profile learning
                learning_rate_limited = False
                now = int(time())
                rate_limit_timestamp = now - 3600
                rate_limit_datetime = datetime.fromtimestamp(rate_limit_timestamp)
                f = '%Y-%m-%d %H:%M:%S'
                after_datetime = rate_limit_datetime.strftime(f)
                try:
                    connection = engine.connect()
                    # @modified 20170913 - Task #2160: Test skyline with bandit
                    # Added nosec to exclude from bandit tests
                    result = connection.execute(
                        'SELECT * FROM ionosphere WHERE metric_id=%s AND created_timestamp > \'%s\' AND generation > 1' % (str(metrics_id), str(after_datetime)))  # nosec
                    for row in result:
                        last_full_duration = row['full_duration']
                        if int(full_duration) <= int(last_full_duration):
                            learning_rate_limited = True
                            break
                except:
                    logger.error(traceback.format_exc())
                    logger.error('error :: could not determine whether learning should be rate limited')
                if learning_rate_limited:
                    logger.info('learning currently dynamically rate limited on %s' % str(base_name))
                    # Exit the ionosphere_learn check
                    self.remove_metric_check_file(str(metric_check_file))
                    if engine:
                        engine_disposal(engine)
                    return
                else:
                    logger.info('learning is not currently rate limited on %s' % str(base_name))

                # @added 20170605 - Bug #2038: Ionosphere learn parent generation incorrect
                # Determine the generation of the matched fp, not the last in
                # the list
                try:
                    # @modified 20170913 - Task #2160: Test skyline with bandit
                    # Added nosec to exclude from bandit tests
                    stmt = 'SELECT generation FROM ionosphere WHERE id=%s' % str(fp_id)  # nosec
                    connection = engine.connect()
                    for row in engine.execute(stmt):
                        matched_fp_generation = int(row['generation'])
                    connection.close()
                    logger.info(
                        'determined matched fp_id %s is a generation %s profile' % (
                            str(fp_id), str(matched_fp_generation)))
                    current_fp_generation = matched_fp_generation
                except:
                    logger.error(traceback.format_exc())
                    logger.error('error :: could not determine generation from ionosphere table for fp id %s' % str(fp_id))

                logger.info(
                    'ionosphere_learn metric matches the generation %s features profile id %s - %s' % (
                        str(current_fp_generation), str(fp_id), base_name))

                # Add to the Redis work set, learn will then go off and create
                # the features profile with the parent training data if less
                # than max_generations, although ionosphere_learn should not
                # send Ionosphere any work if the result would be greater than
                # max_generations
                logger.info('adding work item to Redis set ionosphere.learn.work')
                ionosphere_job = 'learn_fp_learnt'
                work_deadline = 'Soft'
                try:
                    logger.info(
                        'LEARNT :: adding work to Redis ionosphere.learn.work set - [\'%s\', \'%s\', %s, \'%s\', %s, %s] to create a learnt features profile' % (
                            work_deadline, str(ionosphere_job),
                            str(metric_timestamp), base_name, str(fp_id),
                            str(current_fp_generation)))
                    # @modified 20190412 - Task #2824: Test redis-py upgrade
                    #                      Task #2926: Update dependencies
                    # self.redis_conn.sadd('ionosphere.learn.work', ['Soft', str(ionosphere_job), int(metric_timestamp), base_name, int(fp_id), int(current_fp_generation)])
                    self.redis_conn.sadd('ionosphere.learn.work', str(['Soft', str(ionosphere_job), int(metric_timestamp), base_name, int(fp_id), int(current_fp_generation)]))
                except:
                    logger.error(traceback.format_exc())
                    logger.error(
                        'error :: failed adding work to Redis ionosphere.learn.work set - [\'%s\', \'%s\', %s, \'%s\', %s, %s] to make a learn features profile later' % (
                            work_deadline, str(ionosphere_job),
                            str(metric_timestamp), base_name, str(fp_id),
                            str(current_fp_generation)))

            # Exit the ionosphere_learn check
            self.remove_metric_check_file(str(metric_check_file))
            if engine:
                engine_disposal(engine)
            return

        # @added 20170306 - Feature #1960: ionosphere_layers
        # Here we go, let us TEACH you properly.  We only evaluate the
        # Ionosphere layers algorithms after Skyline has had an opportunity
        # to match the original and learnt features profiles.  This enables
        # the original, evolutionary, generations based learning to be
        # continually evaluated.  This needs to happen for any future
        # implementation of
        # Feature #1888: Ionosphere learn - evolutionary maturity forget
        logger.info('layers algorithms check')
        check_layers_algorithms = False
        if not not_anomalous:
            check_layers_algorithms = True
            if added_by == 'ionosphere_learn':
                check_layers_algorithms = False
                logger.info('ionosphere_learn - layers algorithms check - False')
            else:
                logger.info('layers algorithms check - True, %s layers to be checked' % str(fp_layers_count))
        else:
            logger.info('a features profile matched as not_anomalous - layers algorithms check - False')

        if check_layers_algorithms and fp_layers_present:
            full_duration_in_hours = int(settings.FULL_DURATION) / 3600
            mirage_full_duration_json_file = '%s/%s.mirage.redis.%sh.json' % (
                metric_training_data_dir, base_name,
                str(int(full_duration_in_hours)))
            if os.path.isfile(mirage_full_duration_json_file):
                full_duration_json_file = mirage_full_duration_json_file
            else:
                full_duration_json_file = '%s/%s.json' % (metric_training_data_dir, base_name)
            anomalous_timeseries = None
            if os.path.isfile(full_duration_json_file):
                logger.info('full duration ts json available for layers check - %s' % (full_duration_json_file))
                try:
                    # Read the timeseries json file
                    with open((full_duration_json_file), 'r') as f:
                        raw_timeseries = f.read()
                    timeseries_array_str = str(raw_timeseries).replace('(', '[').replace(')', ']')
                    anomalous_timeseries = literal_eval(timeseries_array_str)
                except:
                    logger.error(traceback.format_exc())
                    logger.error('error :: could not load json for layers check - %s' % (base_name))
                logger.info('data points surfaced for layers check - %s' % (len(anomalous_timeseries)))
            else:
                logger.error('error :: full duration ts json for layers was not found - %s' % (full_duration_json_file))

            matched_layers_id = None
            for layers_id in fp_layers_ids:
                if not not_anomalous:
                    logger.info('checking layers_id %s - %s layers profiles of %s possible layers' % (
                        str(layers_id), str(layers_checked_count), str(fp_layers_count)))
                if not_anomalous:
                    logger.info('skipping checking layers_id %s - %s layers profiles of %s possible layers as layer id %s already matched' % (
                        str(layers_id), str(layers_checked_count),
                        str(fp_layers_count), str(matched_layers_id)))
                    continue
                if int(layers_id) != 0:
                    # @added 20180715 - Task #2446: Optimize Ionosphere
                    #                   Branch #2270: luminosity
                    # @modified 20181014 - Feature #2430: Ionosphere validate learnt features profiles page
                    # layers_checked += 1
                    layers_checked_count += 1
                    # @added 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                    # Added to the Redis set here and commented out the
                    # self.layers_checked.append in the try below this
                    redis_set = 'ionosphere.layers_checked'
                    data = layers_id
                    try:
                        self.redis_conn.sadd(redis_set, data)
                    except:
                        logger.info(traceback.format_exc())
                        logger.error('error :: failed to add %s to Redis set %s' % (
                            str(data), str(redis_set)))
                    # Get the layers algorithms and run them on the timeseries
                    # @modified 20170307 - Feature #1960: ionosphere_layers
                    # Use except on everything, remember how fast Skyline can
                    # iterate
                    try:
                        # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                        # Added to the ionosphere.layers_checked Redis set
                        # above
                        # self.layers_checked.append(layers_id)
                        # @added 20180715 - Task #2446: Optimize Ionosphere
                        #                   Branch #2270: luminosity
                        # not_anomalous = run_layer_algorithms(base_name, layers_id, anomalous_timeseries)
                        # @modified 20181013 - Feature #2430: Ionosphere validate learnt features profiles page
                        # not_anomalous = run_layer_algorithms(base_name, layers_id, anomalous_timeseries, fp_layers_count, layers_checked)
                        not_anomalous = run_layer_algorithms(base_name, layers_id, anomalous_timeseries, fp_layers_count, layers_checked_count)
                        if not_anomalous:
                            matched_layers_id = layers_id
                    except:
                        logger.error(traceback.format_exc())
                        logger.error('error :: run_layer_algorithms failed for layers_id - %s' % (str(layers_id)))
                    if not_anomalous:
                        logger.info('not_anomalous :: layers_id %s was matched after checking %s layers profiles of %s possible layers' % (
                            str(layers_id), str(layers_checked_count), str(fp_layers_count)))
                    else:
                        logger.info('still anomalous :: layers_id %s was NOT matched after checking %s layers profiles of %s possible layers' % (
                            str(layers_id), str(layers_checked_count), str(fp_layers_count)))

            if not not_anomalous:
                logger.info('anomalous - no features profiles layers were matched - %s' % base_name)

            # @added 20170308 - Feature #1960: ionosphere_layers
            #                   Feature #1854: Ionosphere learn
            # Create a layer_id matched txt file in the training_data dir
            # to advise the operator if a training_data set has been matched
            # by a layer.  Further below, if the app is not ionosphere_learn,
            # a 'learn_fp_generation' ionosphere_job is added so
            # ionosphere_learn can still try and learn from the existing
            # features profiles even if a layer matched as not_anomalous.
            if not_anomalous:
                layers_id_matched_file = '%s/%s.layers_id_matched.layers_id' % (
                    metric_training_data_dir, base_name)
                if not os.path.isfile(layers_id_matched_file):
                    try:
                        write_data_to_file(skyline_app, layers_id_matched_file, 'w', str(matched_layers_id))
                        logger.info('added matched layers_id %s - %s' % (
                            str(matched_layers_id), layers_id_matched_file))
                    except:
                        logger.info(traceback.format_exc())
                        logger.error('error :: failed to add matched layers_id %s - %s' % (
                            str(matched_layers_id), layers_id_matched_file))
        else:
            logger.info('no layers algorithm check required')

        # Ionosphere layers DONE

        if not not_anomalous:
            logger.info('anomalous - no feature profiles were matched - %s' % base_name)
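        # Illustrative note (file name pattern from the code above, id
        # hypothetical): a match on layers_id 42 writes a
        # <metric_training_data_dir>/<base_name>.layers_id_matched.layers_id
        # file containing just '42', which advises the operator, via the
        # training data, that the training data set was matched by a layer.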
        # @added 20170116 - Feature #1854: Ionosphere learn
        # If this is an ionosphere_learn check an Ionosphere alert will
        # not be sent back to Analyzer, Mirage or the ionosphere.learn.work
        # Redis set.  We exit, work is done.
        if added_by == 'ionosphere_learn':
            logger.info('ionosphere_learn check complete - %s' % base_name)
            self.remove_metric_check_file(str(metric_check_file))
            if engine:
                engine_disposal(engine)
            return

        # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
        # self.anomalous_metrics.append(base_name)
        redis_set = 'ionosphere.anomalous_metrics'
        data = base_name
        try:
            self.redis_conn.sadd(redis_set, data)
        except:
            logger.info(traceback.format_exc())
            logger.error('error :: failed to add %s to Redis set %s' % (
                str(data), str(redis_set)))

        # Send to Panorama as Analyzer and Mirage will only alert on the
        # anomaly, they will not push it to Panorama
        if settings.PANORAMA_ENABLED:
            if not os.path.exists(settings.PANORAMA_CHECK_PATH):
                mkdir_p(settings.PANORAMA_CHECK_PATH)

            # Note:
            # The values are enclosed in single quotes intentionally
            # as the imp.load_source used results in a shift in the
            # decimal position when double quoted, e.g.
            # value = "5622.0" gets imported as
            # 2016-03-02 12:53:26 :: 28569 :: metric variable - value - 562.2
            # single quoting results in the desired,
            # 2016-03-02 13:16:17 :: 1515 :: metric variable - value - 5622.0
            added_at = str(int(time()))
            source = 'graphite'
            panaroma_anomaly_data = 'metric = \'%s\'\n' \
                                    'value = \'%s\'\n' \
                                    'from_timestamp = \'%s\'\n' \
                                    'metric_timestamp = \'%s\'\n' \
                                    'algorithms = %s\n' \
                                    'triggered_algorithms = %s\n' \
                                    'app = \'%s\'\n' \
                                    'source = \'%s\'\n' \
                                    'added_by = \'%s\'\n' \
                                    'added_at = \'%s\'\n' \
                % (base_name, str(anomalous_value), str(int(from_timestamp)),
                   str(int(metric_timestamp)), str(settings.ALGORITHMS),
                   str(triggered_algorithms), skyline_app, source,
                   this_host, added_at)

            # Create an anomaly file with details about the anomaly
            panaroma_anomaly_file = '%s/%s.%s.txt' % (
                settings.PANORAMA_CHECK_PATH, added_at, base_name)
            try:
                write_data_to_file(
                    skyline_app, panaroma_anomaly_file, 'w',
                    panaroma_anomaly_data)
                logger.info('added panorama anomaly file :: %s' % (panaroma_anomaly_file))
                # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                # Moved to the Redis set function below
                # self.sent_to_panorama.append(base_name)
            except:
                logger.error('error :: failed to add panorama anomaly file :: %s' % (panaroma_anomaly_file))
                logger.info(traceback.format_exc())

            # @added 20190522 - Task #3034: Reduce multiprocessing Manager list usage
            redis_set = 'ionosphere.sent_to_panorama'
            data = base_name
            try:
                self.redis_conn.sadd(redis_set, data)
            except:
                logger.info(traceback.format_exc())
                logger.error('error :: failed to add %s to Redis set %s' % (
                    str(data), str(redis_set)))
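        # For illustration only (hypothetical metric and values), the Panorama
        # check file written above looks like:
        #
        #   metric = 'stats.web01.requests'
        #   value = '5622.0'
        #   from_timestamp = '1546214400'
        #   metric_timestamp = '1546300800'
        #   algorithms = ['histogram_bins', 'ks_test']
        #   triggered_algorithms = ['ks_test']
        #   app = 'ionosphere'
        #   source = 'graphite'
        #   added_by = 'skyline-host-1'
        #   added_at = '1546300812'
        #
        # Panorama imports this file as a Python module, which is why the
        # string values are single quoted as per the note above.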
        # alert ... hmmm the harder part, maybe not all the resources
        # are already created, so just determining ALERTS and firing a
        # trigger_alert (pull in alerter.py and mirage_alerters.py?)
        # OR send back to app via Redis
        # @modified 20170116 - Feature #1854: Ionosphere learn
        # Only do the cache_key if not ionosphere_learn
        if added_by != 'ionosphere_learn':
            cache_key = 'ionosphere.%s.alert.%s.%s' % (added_by, metric_timestamp, base_name)
            # @added 20190412 - Task #2824: Test redis-py upgrade
            #                   Task #2926: Update dependencies
            # Added cache_key_value
            cache_key_value = [float(anomalous_value), base_name, int(metric_timestamp), triggered_algorithms, full_duration]
            try:
                self.redis_conn.setex(
                    cache_key, 300,
                    # @modified 20190412 - Task #2824: Test redis-py upgrade
                    #                      Task #2926: Update dependencies
                    # [float(anomalous_value), base_name, int(metric_timestamp), triggered_algorithms, full_duration])
                    str(cache_key_value))
                logger.info(
                    'add Redis alert key - %s - %s' % (
                        cache_key, str(cache_key_value)))
            except:
                logger.error(traceback.format_exc())
                logger.error(
                    'error :: failed to add Redis key - %s - [%s, \'%s\', %s, %s, %s]' % (
                        cache_key, str(anomalous_value), base_name,
                        str(int(metric_timestamp)),
                        str(triggered_algorithms), str(full_duration)))

        # @added 20170116 - Feature #1854: Ionosphere learn
        # Added an ionosphere_learn job for the timeseries that did not
        # match any profiles.  Here we go!  Learn!
        if added_by != 'ionosphere_learn':
            ionosphere_job = 'learn_fp_generation'
            logger.info(
                'adding an ionosphere_learn %s job for the timeseries that did not match any profiles - %s' % (
                    ionosphere_job, base_name))
            try:
                logger.info(
                    'adding work to Redis ionosphere.learn.work set - [\'Soft\', \'%s\', %s, \'%s\', None, None] to make a learn features profile later' % (
                        str(ionosphere_job), str(int(metric_timestamp)),
                        base_name))
                # @modified 20190412 - Task #2824: Test redis-py upgrade
                #                      Task #2926: Update dependencies
                # self.redis_conn.sadd('ionosphere.learn.work', ['Soft', str(ionosphere_job), int(metric_timestamp), base_name, None, None])
                self.redis_conn.sadd('ionosphere.learn.work', str(['Soft', str(ionosphere_job), int(metric_timestamp), base_name, None, None]))
            except:
                logger.error(traceback.format_exc())
                logger.error(
                    'error :: failed adding work to Redis ionosphere.learn.work set - [\'Soft\', \'%s\', %s, \'%s\', None, None] to make a learn features profile later' % (
                        str(ionosphere_job), str(int(metric_timestamp)),
                        base_name))

            self.remove_metric_check_file(str(metric_check_file))
            if engine:
                engine_disposal(engine)
            return

        self.remove_metric_check_file(str(metric_check_file))
        if engine:
            engine_disposal(engine)
        return
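    # Illustrative sketch (not called anywhere in this module): the alert key
    # set above stores the str() of a Python list, so a consumer such as
    # Analyzer or Mirage can recover it with ast.literal_eval, e.g. for a
    # hypothetical key name:
    #
    # >>> raw = redis_conn.get('ionosphere.mirage.alert.1546300800.stats.web01.requests')
    # >>> anomalous_value, base_name, metric_timestamp, triggered_algorithms, full_duration = literal_eval(raw)
    #
    # The 300 second TTL above means the consumer must poll for the key
    # within that window.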
    def run(self):
        """
        Called when the process initializes.
        """

        # Log management to prevent overwriting
        # Allow the bin/<skyline_app>.d to manage the log
        if os.path.isfile(skyline_app_logwait):
            try:
                logger.info('removing %s' % skyline_app_logwait)
                os.remove(skyline_app_logwait)
            except OSError:
                logger.error('error :: failed to remove %s, continuing' % skyline_app_logwait)
                pass

        now = time()
        log_wait_for = now + 5
        while now < log_wait_for:
            if os.path.isfile(skyline_app_loglock):
                sleep(.1)
                now = time()
            else:
                now = log_wait_for + 1

        logger.info('starting %s run' % skyline_app)
        if os.path.isfile(skyline_app_loglock):
            logger.error('error :: bin/%s.d log management seems to have failed, continuing' % skyline_app)
            try:
                os.remove(skyline_app_loglock)
                logger.info('log lock file removed')
            except OSError:
                logger.error('error :: failed to remove %s, continuing' % skyline_app_loglock)
                pass
        else:
            logger.info('bin/%s.d log management done' % skyline_app)

        # @added 20190524 - Bug #3050: Ionosphere - Skyline and Graphite feedback
        logger.info('SKYLINE_FEEDBACK_NAMESPACES is set to %s' % str(SKYLINE_FEEDBACK_NAMESPACES))

        while 1:
            now = time()

            # Make sure Redis is up
            try:
                self.redis_conn.ping()
                if ENABLE_IONOSPHERE_DEBUG:
                    logger.info('debug :: connected to Redis')
            except:
                logger.error('error :: cannot connect to redis at socket path %s' % (
                    settings.REDIS_SOCKET_PATH))
                sleep(30)
                # @modified 20180519 - Feature #2378: Add redis auth to Skyline and rebrow
                if settings.REDIS_PASSWORD:
                    self.redis_conn = StrictRedis(password=settings.REDIS_PASSWORD, unix_socket_path=settings.REDIS_SOCKET_PATH)
                else:
                    self.redis_conn = StrictRedis(unix_socket_path=settings.REDIS_SOCKET_PATH)
                continue

            # Report app up
            try:
                self.redis_conn.setex(skyline_app, 120, now)
                logger.info('updated Redis key for %s up' % skyline_app)
            except:
                logger.error('error :: failed to update Redis key for %s up' % skyline_app)
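            # Illustrative only (a hypothetical standalone probe, not part of
            # this loop): the app up key written above can be checked by any
            # process with access to the same Redis socket, e.g.
            #
            # >>> from redis import StrictRedis
            # >>> conn = StrictRedis(unix_socket_path=settings.REDIS_SOCKET_PATH)
            # >>> conn.get('ionosphere')  # a recent unix timestamp if up
            #
            # The 120 second TTL means the key expires if consecutive loop
            # iterations fail to refresh it.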
            # purge_old_data_dirs after every check file run, this takes less
            # than a second and keeps the purging somewhat consistent with
            # input rate.
            try:
                logger.info('purging any old training data')
                self.purge_old_data_dirs(
                    settings.IONOSPHERE_DATA_FOLDER,
                    settings.IONOSPHERE_KEEP_TRAINING_TIMESERIES_FOR)
            except:
                logger.error('error :: purge_old_data_dirs - %s' % traceback.format_exc())
                if ENABLE_IONOSPHERE_DEBUG:
                    logger.info(
                        'debug :: self.purge_old_data_dirs(%s, %s)' % (
                            settings.IONOSPHERE_DATA_FOLDER,
                            settings.IONOSPHERE_KEEP_TRAINING_TIMESERIES_FOR))

            # @added 20170110 - Feature #1854: Ionosphere learn
            # purge_old_data_dirs learn data
            if settings.IONOSPHERE_LEARN:
                try:
                    logger.info('purging any old learning data')
                    self.purge_old_data_dirs(
                        settings.IONOSPHERE_LEARN_FOLDER,
                        settings.IONOSPHERE_KEEP_TRAINING_TIMESERIES_FOR)
                except:
                    logger.error('error :: purge_old_data_dirs learn - %s' % traceback.format_exc())
                    if ENABLE_IONOSPHERE_DEBUG:
                        logger.info(
                            'debug :: self.purge_old_data_dirs(%s, %s)' % (
                                settings.IONOSPHERE_LEARN_FOLDER,
                                settings.IONOSPHERE_KEEP_TRAINING_TIMESERIES_FOR))

            # @added 20170916 - Feature #1996: Ionosphere - matches page
            # Create the ionosphere_summary_memcache_object
            # @modified 20180103 - Feature #1996: Ionosphere - matches page
            # The ionosphere_summary_list memcache object is not managed in
            # ionosphere.py and was an artefact of some dev work that may
            # resume at some point
            # if settings.MEMCACHE_ENABLED:
            #     try:
            #         logger.info('updating the ionosphere_summary_memcache_object')
            #         self.update_ionosphere_summary_memcache_object
            #     except:
            #         logger.error('error :: update_ionosphere_summary_memcache_object - %s' % traceback.print_exc())

            # self.populate the database metadata tables
            # What is my host id in the Skyline panorama DB?
            host_id = False
            # @added 20170825 - Task #2132: Optimise Ionosphere DB usage
            # Check memcached before MySQL
            if settings.MEMCACHE_ENABLED:
                hosts_id_key = 'hosts.id.%s' % this_host
                try:
                    host_id = self.memcache_client.get(hosts_id_key)
                    # if memcache does not have the key the response to the
                    # client is None, it does not except
                except:
                    logger.error('error :: failed to get %s from memcache' % hosts_id_key)
                try:
                    self.memcache_client.close()
                except:
                    # @modified 20170913 - Task #2160: Test skyline with bandit
                    # pass
                    logger.error('error :: failed to close memcache_client')
            if host_id:
                logger.info('using memcache %s key data' % hosts_id_key)
                logger.info('host_id: %s' % str(host_id))

            if not host_id:
                # @modified 20170913 - Task #2160: Test skyline with bandit
                # Added nosec to exclude from bandit tests
                query = 'select id FROM hosts WHERE host=\'%s\'' % this_host  # nosec
                results = mysql_select(skyline_app, query)
                if results:
                    host_id = results[0][0]
                    logger.info('host_id: %s' % str(host_id))
                else:
                    logger.info('failed to determine host id of %s' % this_host)

                if host_id and settings.MEMCACHE_ENABLED:
                    try:
                        self.memcache_client.set(hosts_id_key, int(host_id))
                        logger.info('populated memcache %s key' % hosts_id_key)
                    except:
                        logger.error('error :: failed to set %s in memcache' % hosts_id_key)
                    try:
                        self.memcache_client.close()
                    except:
                        # @modified 20170913 - Task #2160: Test skyline with bandit
                        # pass
                        logger.error('error :: failed to close memcache_client')

            # if not known - INSERT hostname INTO host
            if not host_id:
                logger.info('inserting %s into hosts table' % this_host)
                # @modified 20170913 - Task #2160: Test skyline with bandit
                # Added nosec to exclude from bandit tests
                query = 'insert into hosts (host) VALUES (\'%s\')' % this_host  # nosec
                host_id = self.mysql_insert(query)
                if host_id:
                    logger.info('new host_id: %s' % str(host_id))

            if not host_id:
                logger.error(
                    'error :: failed to determine and populate %s into the hosts table' % this_host)
                sleep(30)
                continue

            """
            Determine if any metric check files have been added
            """
            while True:
                metric_var_files = False
                try:
                    metric_var_files = [f for f in listdir(settings.IONOSPHERE_CHECK_PATH) if isfile(join(settings.IONOSPHERE_CHECK_PATH, f))]
                except:
                    logger.error('error :: failed to list files in check dir')
                    logger.info(traceback.format_exc())

                if not metric_var_files:
                    logger.info('sleeping 20 no metric check files')
                    sleep(20)
                    up_now = time()
                    # Report app up
                    try:
                        self.redis_conn.setex(skyline_app, 120, up_now)
                        logger.info('updated Redis key for %s up' % skyline_app)
                    except:
                        logger.error('error :: failed to update Redis key for %s up' % skyline_app)

                # @added 20161228 - Feature #1828: ionosphere - mirage Redis data features
                #                   Branch #922: Ionosphere
                # Bringing Ionosphere online - do alert on Ionosphere metrics
                # Manage the ionosphere.unique_metrics Redis set which is queried
                # by Analyzer and Mirage, yes and we use multiprocessing
                last_update = None
                try:
                    last_update = self.redis_conn.get('ionosphere.manage_ionosphere_unique_metrics')
                except Exception as e:
                    logger.error('error :: could not query Redis for ionosphere.manage_ionosphere_unique_metrics: %s' % e)
                if not last_update:
                    pids = []
                    now = time()
                    try:
                        logger.info('starting manage_ionosphere_unique_metrics process')
                        p = Process(target=self.manage_ionosphere_unique_metrics)
                        pids.append(p)
                        p.start()
                    except:
                        logger.info(traceback.format_exc())
                        logger.error('error :: failed to start manage_ionosphere_unique_metrics')

                    # Self monitor process and terminate if run for too long
                    p_starts = time()
                    while time() - p_starts <= 5:
                        if any(p.is_alive() for p in pids):
                            # Just to avoid hogging the CPU
                            sleep(.1)
                        else:
                            # All the processes are done, break now.
                            time_to_run = time() - p_starts
                            logger.info(
                                'manage_ionosphere_unique_metrics completed in %.2f seconds' % (
                                    time_to_run))
                            break
                    else:
                        # We only enter this if we didn't 'break' above.
                        logger.info('%s :: timed out, killing manage_ionosphere_unique_metrics process' % (skyline_app))
                        for p in pids:
                            try:
                                p.terminate()
                                # p.join()
                                logger.info('%s :: killed manage_ionosphere_unique_metrics process' % (skyline_app))
                            except:
                                logger.error(traceback.format_exc())
                                logger.error('error :: failed to kill all manage_ionosphere_unique_metrics processes')

                # Discover metric anomalies to insert
                metric_var_files = False
                try:
                    metric_var_files = [f for f in listdir(settings.IONOSPHERE_CHECK_PATH) if isfile(join(settings.IONOSPHERE_CHECK_PATH, f))]
                except:
                    logger.error('error :: failed to list files in check dir')
                    logger.info(traceback.format_exc())

                # @added 20170104 - Feature #1842: Ionosphere - Graphite now graphs
                #                   Task #1658: Patterning Skyline Ionosphere
                # Send Ionosphere metrics to Graphite every minute now that
                # Ionosphere is better tuned and Reset lists
                cache_key = '%s.sent_graphite_metrics' % skyline_app
                redis_sent_graphite_metrics = False
                try:
                    redis_sent_graphite_metrics = self.redis_conn.get(cache_key)
                except Exception as e:
                    logger.error('error :: could not query Redis for key %s: %s' % (cache_key, e))

                # Flush metrics to Graphite
                if not redis_sent_graphite_metrics:
                    try:
                        # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                        # not_anomalous = str(len(self.not_anomalous))
                        not_anomalous = str(len(list(self.redis_conn.smembers('ionosphere.not_anomalous'))))
                    except:
                        not_anomalous = '0'
                    logger.info('not_anomalous :: %s' % not_anomalous)
                    send_metric_name = '%s.not_anomalous' % skyline_app_graphite_namespace
                    send_graphite_metric(skyline_app, send_metric_name, not_anomalous)

                    try:
                        # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                        # Use Redis set instead of Manager() list
                        # total_anomalies = str(len(self.anomalous_metrics))
                        total_anomalies = str(len(list(self.redis_conn.smembers('ionosphere.anomalous_metrics'))))
                    except:
                        total_anomalies = '0'
                    logger.info('total_anomalies :: %s' % total_anomalies)
                    send_metric_name = '%s.total_anomalies' % skyline_app_graphite_namespace
                    send_graphite_metric(skyline_app, send_metric_name, total_anomalies)

                    try:
                        # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                        # training_metrics = str(len(self.training_metrics))
                        training_metrics = str(len(list(self.redis_conn.smembers('ionosphere.training_metrics'))))
                    except:
                        training_metrics = '0'
                    logger.info('training metrics :: %s' % training_metrics)
                    send_metric_name = '%s.training_metrics' % skyline_app_graphite_namespace
                    send_graphite_metric(skyline_app, send_metric_name, training_metrics)

                    try:
                        # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                        # features_profiles_checked = str(len(self.features_profiles_checked))
                        features_profiles_checked = str(len(list(self.redis_conn.smembers('ionosphere.features_profiles_checked'))))
                    except:
                        features_profiles_checked = '0'
                    logger.info('fps checked count :: %s' % features_profiles_checked)
                    send_metric_name = '%s.fps_checked' % skyline_app_graphite_namespace
                    # @modified 20170306 - Feature #1960: ionosphere_layers
                    # Corrected namespace
                    # send_graphite_metric(skyline_app, send_metric_name, not_anomalous)
                    send_graphite_metric(skyline_app, send_metric_name, features_profiles_checked)

                    # @added 20170306 - Feature #1960: ionosphere_layers
                    try:
                        # @modified 20181014 - Feature #2430: Ionosphere validate learnt features profiles page
                        # layers_checked = str(len(self.layers_checked))
                        # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                        # str_layers_checked = str(len(self.layers_checked))
                        str_layers_checked = str(len(list(self.redis_conn.smembers('ionosphere.layers_checked'))))
                    except:
                        str_layers_checked = '0'
                    logger.info('layers checked count :: %s' % str_layers_checked)
                    send_metric_name = '%s.layers_checked' % skyline_app_graphite_namespace
                    send_graphite_metric(skyline_app, send_metric_name, str_layers_checked)

                    if settings.PANORAMA_ENABLED:
                        try:
                            # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                            # sent_to_panorama = str(len(self.sent_to_panorama))
                            sent_to_panorama = str(len(list(self.redis_conn.smembers('ionosphere.sent_to_panorama'))))
                        except:
                            sent_to_panorama = '0'
                        logger.info('sent_to_panorama :: %s' % sent_to_panorama)
                        send_metric_name = '%s.sent_to_panorama' % skyline_app_graphite_namespace
                        send_graphite_metric(skyline_app, send_metric_name, sent_to_panorama)

                    sent_graphite_metrics_now = int(time())
                    try:
                        self.redis_conn.setex(cache_key, 59, sent_graphite_metrics_now)
                        logger.info('updated Redis key - %s' % cache_key)
                    except:
                        logger.error('error :: failed to update Redis key - %s up' % cache_key)

                    # Reset lists
                    # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                    # Use Redis sets instead of Manager().list()
                    # self.anomalous_metrics[:] = []
                    # self.not_anomalous[:] = []
                    # self.features_profiles_checked[:] = []
                    # self.training_metrics[:] = []
                    # self.sent_to_panorama[:] = []
                    # @added 20170306 - Feature #1960: ionosphere_layers
                    # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                    # Use Redis sets instead of Manager().list()
                    # self.layers_checked[:] = []
                    # @added 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                    # Use Redis sets instead of Manager().list()
                    delete_redis_sets = [
                        'ionosphere.anomalous_metrics',
                        'ionosphere.not_anomalous',
                        'ionosphere.features_profiles_checked',
                        'ionosphere.training_metrics',
                        'ionosphere.sent_to_panorama',
                        'ionosphere.layers_checked',
                    ]
                    for i_redis_set in delete_redis_sets:
                        redis_set_to_delete = i_redis_set
                        try:
                            self.redis_conn.delete(redis_set_to_delete)
                            logger.info('deleted Redis set - %s' % redis_set_to_delete)
                        except:
                            logger.error(traceback.format_exc())
                            logger.error('error :: failed to delete Redis set - %s' % redis_set_to_delete)

                ionosphere_job = False
                learn_job = False
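                # For illustration only (hypothetical values): the once per
                # minute flush above emits gauge style counts to Graphite,
                # e.g.
                #
                #   skyline.ionosphere.<host>.not_anomalous 3 1546300800
                #   skyline.ionosphere.<host>.total_anomalies 1 1546300800
                #
                # The 59 second TTL on the sent_graphite_metrics key is what
                # rate limits the flush to roughly once per minute, and the
                # Redis sets are deleted after each flush so every datapoint
                # is a per minute count rather than a running total.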
                # @added 20190524 - Bug #3050: Ionosphere - Skyline and Graphite feedback
                # Do not run checks on a metric in a declared
                # SKYLINE_FEEDBACK_NAMESPACES namespace if it has been checked
                # in the last 10 minutes and there are multiple checks to do.
                rate_limit_feedback_metrics = False
                if metric_var_files:
                    metric_var_files_sorted = sorted(metric_var_files)
                    metric_check_file = '%s/%s' % (settings.IONOSPHERE_CHECK_PATH, str(metric_var_files_sorted[0]))
                    metric_var_files_count = len(metric_var_files_sorted)
                    if metric_var_files_count > 2:
                        rate_limit_feedback_metrics = True
                    if rate_limit_feedback_metrics:
                        for i_metric_check_file in metric_var_files_sorted:
                            feedback_metric = False
                            check_metric_file_list = i_metric_check_file.split('.', -1)[1:]
                            last_name_element = len(check_metric_file_list) - 1
                            base_name = '.'.join(check_metric_file_list[0:last_name_element])
                            metric_namespace_elements = base_name.split('.')
                            for to_skip in SKYLINE_FEEDBACK_NAMESPACES:
                                if to_skip in base_name:
                                    feedback_metric = True
                                    logger.info('SKYLINE_FEEDBACK_NAMESPACES matched on to_skip %s in base_name %s' % (to_skip, base_name))
                                    break
                                to_skip_namespace_elements = to_skip.split('.')
                                elements_matched = set(metric_namespace_elements) & set(to_skip_namespace_elements)
                                if len(elements_matched) == len(to_skip_namespace_elements):
                                    feedback_metric = True
                                    logger.info('SKYLINE_FEEDBACK_NAMESPACES matched elements in %s' % base_name)
                                    break
                            if feedback_metric:
                                remove_feedback_metric_check = False
                                if metric_var_files_count > 4:
                                    logger.info('rate limiting feedback metric - removing check for %s as Ionosphere has %s pending checks' % (
                                        base_name, str(metric_var_files_count)))
                                    remove_feedback_metric_check = True
                                cache_key = 'ionosphere.feedback_metric.checked.%s' % (base_name)
                                check_done = False
                                try:
                                    check_done = self.redis_conn.get(cache_key)
                                except Exception as e:
                                    logger.error('error :: could not query Redis for cache_key: %s' % e)
                                if not check_done:
                                    logger.info('not removing feedback metric as no check has been done in last 600 seconds on %s' % base_name)
                                else:
                                    logger.info('rate limiting feedback metric - removing check as %s has been checked in the last 600 seconds' % (
                                        base_name))
                                    remove_feedback_metric_check = True
                                if remove_feedback_metric_check:
                                    metric_check_file = '%s/%s' % (settings.IONOSPHERE_CHECK_PATH, i_metric_check_file)
                                    self.remove_metric_check_file(str(metric_check_file))

                # Determine metric_var_files after possible feedback metric
                # removals
                metric_var_files = False
                try:
                    metric_var_files = [f for f in listdir(settings.IONOSPHERE_CHECK_PATH) if isfile(join(settings.IONOSPHERE_CHECK_PATH, f))]
                except:
                    logger.error('error :: failed to list files in check dir')
                    logger.info(traceback.format_exc())

                if metric_var_files:
                    ionosphere_job = True
                    break

                # @added 20170113 - Feature #1854: Ionosphere learn
                # Added the learn variable to spawn a spawn_learn_process when
                # required.
                work_queue_items = 0
                if settings.IONOSPHERE_LEARN:
                    learn_work = None
                    try:
                        learn_work = self.redis_conn.smembers('ionosphere.learn.work')
                    except Exception as e:
                        logger.error('error :: could not query Redis for ionosphere.learn.work - %s' % e)
                    if learn_work:
                        work_queue_items = len(learn_work)
                        if work_queue_items > 0:
                            learn_job = True
                if learn_job:
                    break
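                # Illustrative sketch (hypothetical values): with, say,
                # SKYLINE_FEEDBACK_NAMESPACES = ['skyline', 'carbon'], the two
                # tests above match either by substring or by whole namespace
                # elements, e.g.
                #
                # >>> base_name = 'stats.skyline-1.ionosphere.checks.done'
                # >>> 'skyline' in base_name
                # True                             # substring match
                # >>> set(base_name.split('.')) & set('carbon.relays'.split('.'))
                # set()                            # no element match
                #
                # so metrics Skyline itself generates do not flood Ionosphere
                # with feedback checks when a busy period makes them spike.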
            metric_var_files_count = 0
            ionosphere_busy = False

            if ionosphere_job:
                metric_var_files_sorted = sorted(metric_var_files)
                metric_check_file = '%s/%s' % (settings.IONOSPHERE_CHECK_PATH, str(metric_var_files_sorted[0]))

                # @added 20190403 - Bug #2904: Initial Ionosphere echo load and Ionosphere feedback
                #                   Feature #2484: FULL_DURATION feature profiles
                # Added a count of the number of checks to be done
                metric_var_files_count = len(metric_var_files)
                # If there are more than 4 metric check files set Ionosphere to
                # busy so that Ionosphere alternates between checking the normal
                # Ionosphere Mirage features profiles and the Ionosphere echo
                # features profiles on subsequent checks of a metric so that
                # when Ionosphere is busy it is not checking both sets of
                # features profiles on every run.
                if metric_var_files_count > 4:
                    ionosphere_busy = True

            # @added 20170108 - Feature #1830: Ionosphere alerts
            # Adding lists of smtp_alerter_metrics and ionosphere_non_smtp_alerter_metrics
            # Timed, this takes 0.013319 seconds on 689 unique_metrics
            unique_metrics = []
            try:
                unique_metrics = list(self.redis_conn.smembers(settings.FULL_NAMESPACE + 'unique_metrics'))
            except:
                logger.error(traceback.format_exc())
                logger.error('error :: could not get the unique_metrics list from Redis')
                unique_metrics = []

            # @added 20190522 - Task #3034: Reduce multiprocessing Manager list usage
            # The Redis ionosphere.ionosphere_smtp_alerter_metrics set is
            # created here to replace the self.ionosphere_smtp_alerter_metrics
            # Manager.list in the below section
            ionosphere_smtp_alerter_metrics = []
            try:
                ionosphere_smtp_alerter_metrics = list(self.redis_conn.smembers('ionosphere.ionosphere_smtp_alerter_metrics'))
            except:
                logger.info(traceback.format_exc())
                logger.error('error :: failed to generate a list from the ionosphere_smtp_alerter_metrics Redis set')
                ionosphere_smtp_alerter_metrics = []

            redis_sets_to_rename = [
                'ionosphere.ionosphere_smtp_alerter_metrics',
                'ionosphere.ionosphere_non_smtp_alerter_metrics'
            ]
            for current_redis_set in redis_sets_to_rename:
                new_redis_set = '%s.old' % current_redis_set
                try:
                    self.redis_conn.rename(current_redis_set, new_redis_set)
                except Exception as e:
                    if str(e) == 'no such key':
                        logger.info('could not rename Redis set %s to %s: %s' % (
                            current_redis_set, new_redis_set, str(e)))
                    else:
                        logger.error('error :: could not rename Redis set %s to %s: %s' % (
                            current_redis_set, new_redis_set, str(e)))

            for metric_name in unique_metrics:
                base_name = metric_name.replace(settings.FULL_NAMESPACE, '', 1)
                for alert in settings.ALERTS:
                    pattern_match = False
                    if str(alert[1]) == 'smtp':
                        ALERT_MATCH_PATTERN = alert[0]
                        METRIC_PATTERN = base_name
                        pattern_match = False
                        try:
                            # Match by regex
                            alert_match_pattern = re.compile(ALERT_MATCH_PATTERN)
                            pattern_match = alert_match_pattern.match(METRIC_PATTERN)
                            if pattern_match:
                                pattern_match = True
                                # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                                # if base_name not in self.ionosphere_smtp_alerter_metrics:
                                #     self.ionosphere_smtp_alerter_metrics.append(base_name)
                                if base_name not in ionosphere_smtp_alerter_metrics:
                                    redis_set = 'ionosphere.ionosphere_smtp_alerter_metrics'
                                    data = base_name
                                    try:
                                        self.redis_conn.sadd(redis_set, data)
                                    except:
                                        logger.info(traceback.format_exc())
                                        logger.error('error :: failed to add %s to Redis set %s' % (
                                            str(data), str(redis_set)))
                        except:
                            pattern_match = False
                        if not pattern_match:
                            # Match by substring
                            if alert[0] in base_name:
                                # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                                # if base_name not in self.ionosphere_smtp_alerter_metrics:
                                #     self.ionosphere_smtp_alerter_metrics.append(base_name)
                                if base_name not in ionosphere_smtp_alerter_metrics:
                                    redis_set = 'ionosphere.ionosphere_smtp_alerter_metrics'
                                    data = base_name
                                    try:
                                        self.redis_conn.sadd(redis_set, data)
                                    except:
                                        logger.info(traceback.format_exc())
                                        logger.error('error :: failed to add %s to Redis set %s' % (
                                            str(data), str(redis_set)))

                # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
                # if base_name not in self.ionosphere_smtp_alerter_metrics:
                #     self.ionosphere_non_smtp_alerter_metrics.append(base_name)
                if base_name not in ionosphere_smtp_alerter_metrics:
                    redis_set = 'ionosphere.ionosphere_non_smtp_alerter_metrics'
                    data = base_name
                    try:
                        self.redis_conn.sadd(redis_set, data)
                    except:
                        logger.info(traceback.format_exc())
                        logger.error('error :: failed to add %s to Redis set %s' % (
                            str(data), str(redis_set)))

            # @added 20190522 - Task #3034: Reduce multiprocessing Manager list usage
            # The Redis sets are used here to replace the self.ionosphere_
            # Manager().list() lists
            ionosphere_smtp_alerter_metrics = []
            try:
                ionosphere_smtp_alerter_metrics = list(self.redis_conn.smembers('ionosphere.ionosphere_smtp_alerter_metrics'))
            except:
                logger.info(traceback.format_exc())
                logger.error('error :: failed to generate a list from the ionosphere_smtp_alerter_metrics Redis set')
                ionosphere_smtp_alerter_metrics = []
            ionosphere_non_smtp_alerter_metrics = []
            try:
                ionosphere_non_smtp_alerter_metrics = list(self.redis_conn.smembers('ionosphere.ionosphere_non_smtp_alerter_metrics'))
            except:
                logger.info(traceback.format_exc())
                logger.error('error :: failed to generate a list from the ionosphere_non_smtp_alerter_metrics Redis set')
                ionosphere_non_smtp_alerter_metrics = []

            # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
            # logger.info('smtp_alerter_metrics :: %s' % str(len(self.ionosphere_smtp_alerter_metrics)))
            # logger.info('ionosphere_non_smtp_alerter_metrics :: %s' % str(len(self.ionosphere_non_smtp_alerter_metrics)))
            logger.info('smtp_alerter_metrics :: %s' % str(len(ionosphere_smtp_alerter_metrics)))
            logger.info('ionosphere_non_smtp_alerter_metrics :: %s' % str(len(ionosphere_non_smtp_alerter_metrics)))

            if ionosphere_job:
                # @added 20190326 - Feature #2484
                # First process ionosphere_echo to create any missing echo
                # features profiles
                try:
                    ionosphere_echo_enabled = settings.IONOSPHERE_ECHO_ENABLED
                except:
                    ionosphere_echo_enabled = False

                # @added 20190403 - Bug #2904: Initial Ionosphere echo load and Ionosphere feedback
                #                   Feature #2484: FULL_DURATION feature profiles
                # If there are more than 2 metric check files, do not run
                # process_ionosphere_echo to create echo features profiles
                run_process_ionosphere_echo = True
                if metric_var_files_count > 2:
                    run_process_ionosphere_echo = False
                    logger.info(
                        'not running process_ionosphere_echo as there are %s metric check files to be checked' % (
                            str(metric_var_files_count)))

                # @added 20190527 - Feature #2484: FULL_DURATION feature profiles
                #                   Branch #3002: docker
                # Only process if there is a ionosphere.unique_metrics Redis set
                if run_process_ionosphere_echo:
                    ionosphere_unique_metrics = []
                    try:
                        ionosphere_unique_metrics = self.redis_conn.smembers('ionosphere.unique_metrics')
                    except:
                        logger.error(traceback.format_exc())
                        logger.error('error :: failed to get Redis smembers ionosphere.unique_metrics')
                        ionosphere_unique_metrics = []
                    # @added 20190527 - Feature #2484: FULL_DURATION feature profiles
                    if not ionosphere_unique_metrics:
                        run_process_ionosphere_echo = False
                        logger.info('there are no metrics in the Redis ionosphere.unique_metrics set, skipping process_ionosphere_echo')

                if ionosphere_echo_enabled and run_process_ionosphere_echo:
                    # Spawn a single process_ionosphere_echo process
                    function_name = 'process_ionosphere_echo'
                    pids = []
                    spawned_pids = []
                    pid_count = 0
                    now = time()
                    for i in range(1, IONOSPHERE_PROCESSES + 1):
                        try:
                            p = Process(target=self.process_ionosphere_echo, args=(i, metric_check_file))
                            pids.append(p)
                            pid_count += 1
                            logger.info(
                                'starting %s of %s %s' % (
                                    str(pid_count),
                                    str(IONOSPHERE_PROCESSES),
                                    function_name))
                            p.start()
                            spawned_pids.append(p.pid)
                        except:
                            logger.error(traceback.format_exc())
                            logger.error('error :: failed to start %s' % function_name)
                            continue

                    # Self monitor the process and terminate it if
                    # process_ionosphere_echo has run for too long
                    try:
                        ionosphere_echo_max_fp_create_time = settings.IONOSPHERE_ECHO_MAX_FP_CREATE_TIME
                    except:
                        ionosphere_echo_max_fp_create_time = 55
                    p_starts = time()
                    while time() - p_starts <= ionosphere_echo_max_fp_create_time:
                        if any(p.is_alive() for p in pids):
                            # Just to avoid hogging the CPU
                            sleep(.1)
                        else:
                            # All the processes are done, break now.
                            time_to_run = time() - p_starts
                            logger.info(
                                '%s %s completed in %.2f seconds' % (
                                    str(IONOSPHERE_PROCESSES),
                                    function_name, time_to_run))
                            break
                    else:
                        # We only enter this if we didn't 'break' above.
                        logger.info('timed out, killing all %s processes' % (function_name))
                        for p in pids:
                            try:
                                p.terminate()
                                # p.join()
                                logger.info('killed %s process' % (function_name))
                            except:
                                logger.error(traceback.format_exc())
                                logger.error('error :: failed to kill all %s processes' % function_name)

                logger.info('processing - %s' % str(metric_var_files_sorted[0]))
                function_name = 'spin_process'

            # @added 20170109 - Feature #1854: Ionosphere learn
            # Added the learn variable to spawn a spawn_learn_process when
            # required.
            # @added 20170112 - Feature #1854: Ionosphere learn - Redis ionosphere.learn.work namespace
            # Ionosphere learn needs Redis work sets
            # When a features profile is created there needs to be work added
            # to a Redis set
            # When a human makes a features profile, we want Ionosphere to make a
            # use_full_duration_days features profile valid_learning_duration (e.g.
            # 3361) later.
            if learn_job:
                logger.info('processing - learn work queue - %s' % str(work_queue_items))
                function_name = 'spawn_learn_process'
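            # The spawn-and-monitor pattern used above and below, as a minimal
            # generic sketch (some_worker and max_runtime are hypothetical
            # placeholders, parameterised per function_name in the real code):
            #
            # from multiprocessing import Process
            # from time import sleep, time
            #
            # pids = [Process(target=some_worker, args=(1,))]
            # for p in pids:
            #     p.start()
            # p_starts = time()
            # while time() - p_starts <= max_runtime:
            #     if any(p.is_alive() for p in pids):
            #         sleep(.1)          # poll cheaply
            #     else:
            #         break              # all workers finished in time
            # else:
            #     for p in pids:
            #         p.terminate()      # the while...else: only runs on timeout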
            # Spawn processes
            pids = []
            spawned_pids = []
            pid_count = 0
            now = time()
            # @modified 20180819 - Task #2526: Hard code IONOSPHERE_PROCESSES to 1
            # for i in range(1, settings.IONOSPHERE_PROCESSES + 1):
            for i in range(1, IONOSPHERE_PROCESSES + 1):
                if ionosphere_job:
                    try:
                        # @modified 20190404 - Bug #2904: Initial Ionosphere echo load and Ionosphere feedback
                        #                      Feature #2484: FULL_DURATION feature profiles
                        # Added ionosphere_busy if there are queued checks
                        # to ensure that Ionosphere echo is rate limited if a
                        # lot of metrics become anomalous and that Ionosphere
                        # alternates between normal Mirage features profiles
                        # comparisons and Ionosphere echo features profiles
                        # during busy times.
                        # p = Process(target=self.spin_process, args=(i, metric_check_file))
                        p = Process(target=self.spin_process, args=(i, metric_check_file, ionosphere_busy))
                        pids.append(p)
                        pid_count += 1
                        logger.info(
                            'starting %s of %s %s' % (
                                str(pid_count),
                                # @modified 20180819 - Task #2526: Hard code IONOSPHERE_PROCESSES to 1
                                # str(settings.IONOSPHERE_PROCESSES),
                                str(IONOSPHERE_PROCESSES),
                                function_name))
                        p.start()
                        spawned_pids.append(p.pid)
                    except:
                        logger.error(traceback.format_exc())
                        logger.error('error :: failed to start %s' % function_name)
                        continue

                # @added 20170113 - Feature #1854: Ionosphere learn - Redis ionosphere.learn.work namespace
                if learn_job:
                    try:
                        p = Process(target=self.spawn_learn_process, args=(i, int(now)))
                        pids.append(p)
                        pid_count += 1
                        logger.info(
                            'starting %s of %s %s' % (
                                str(pid_count),
                                # @modified 20180819 - Task #2526: Hard code IONOSPHERE_PROCESSES to 1
                                # str(settings.IONOSPHERE_PROCESSES),
                                str(IONOSPHERE_PROCESSES),
                                function_name))
                        p.start()
                        spawned_pids.append(p.pid)
                    except:
                        logger.error(traceback.format_exc())
                        logger.error('error :: failed to start %s' % function_name)
                        continue

            # Self monitor processes and terminate if any spin_process has run
            # for too long
            p_starts = time()
            # @modified 20180621 - Feature #2404: Ionosphere - fluid approximation
            # Increase run time to 55 seconds to allow for Min-Max scaling
            # while time() - p_starts <= 20:
            # @modified 20190327 - Feature #2484: FULL_DURATION feature profiles
            # Added ionosphere_echo which takes more time
            # while time() - p_starts <= 55:
            try:
                ionosphere_max_runtime = settings.IONOSPHERE_MAX_RUNTIME
            except:
                ionosphere_max_runtime = 120
            while time() - p_starts <= ionosphere_max_runtime:
                if any(p.is_alive() for p in pids):
                    # Just to avoid hogging the CPU
                    sleep(.1)
                else:
                    # All the processes are done, break now.
                    time_to_run = time() - p_starts
                    logger.info(
                        '%s %s completed in %.2f seconds' % (
                            # @modified 20180819 - Task #2526: Hard code IONOSPHERE_PROCESSES to 1
                            # str(settings.IONOSPHERE_PROCESSES),
                            str(IONOSPHERE_PROCESSES),
                            function_name, time_to_run))
                    break
            else:
                # We only enter this if we didn't 'break' above.
                logger.info('timed out, killing all %s processes' % (function_name))
                for p in pids:
                    try:
                        p.terminate()
                        # p.join()
                        logger.info('killed %s process' % (function_name))
                    except:
                        logger.error(traceback.format_exc())
                        logger.error('error :: failed to kill all %s processes' % function_name)

                if ionosphere_job:
                    check_file_name = os.path.basename(str(metric_check_file))
                    if settings.ENABLE_IONOSPHERE_DEBUG:
                        logger.info('debug :: check_file_name - %s' % check_file_name)
                    check_file_timestamp = check_file_name.split('.', 1)[0]
                    if settings.ENABLE_IONOSPHERE_DEBUG:
                        logger.info('debug :: check_file_timestamp - %s' % str(check_file_timestamp))
                    check_file_metricname_txt = check_file_name.split('.', 1)[1]
                    if settings.ENABLE_IONOSPHERE_DEBUG:
                        logger.info('debug :: check_file_metricname_txt - %s' % check_file_metricname_txt)
                    check_file_metricname = check_file_metricname_txt.replace('.txt', '')
                    if settings.ENABLE_IONOSPHERE_DEBUG:
                        logger.info('debug :: check_file_metricname - %s' % check_file_metricname)
                    check_file_metricname_dir = check_file_metricname.replace('.', '/')
                    if settings.ENABLE_IONOSPHERE_DEBUG:
                        logger.info('debug :: check_file_metricname_dir - %s' % check_file_metricname_dir)

                    metric_failed_check_dir = '%s/%s/%s' % (failed_checks_dir, check_file_metricname_dir, check_file_timestamp)
                    fail_check(skyline_app, metric_failed_check_dir, str(metric_check_file))

            for p in pids:
                if p.is_alive():
                    logger.info('stopping %s - %s' % (function_name, str(p.is_alive())))
                    p.join()

            # @added 20170108 - Feature #1830: Ionosphere alerts
            # Reset added lists of ionosphere_smtp_alerter_metrics and
            # ionosphere_non_smtp_alerter_metrics
            # @modified 20190522 - Task #3034: Reduce multiprocessing Manager list usage
            # self.ionosphere_smtp_alerter_metrics[:] = []
            # self.ionosphere_non_smtp_alerter_metrics[:] = []
            # @added 20190522 - Task #3034: Reduce multiprocessing Manager list usage
            # Use Redis sets instead of Manager().list()
            # delete_redis_sets = [
            #     'ionosphere.ionosphere_smtp_alerter_metrics',
            #     'ionosphere.ionosphere_non_smtp_alerter_metrics',
            # ]
            delete_redis_sets = [
                'ionosphere.ionosphere_smtp_alerter_metrics.old',
                'ionosphere.ionosphere_non_smtp_alerter_metrics.old',
            ]
            for i_redis_set in delete_redis_sets:
                redis_set_to_delete = i_redis_set
                try:
                    self.redis_conn.delete(redis_set_to_delete)
                    logger.info('deleted Redis set - %s' % redis_set_to_delete)
                except:
                    logger.error(traceback.format_exc())
                    logger.error('error :: failed to delete Redis set - %s' % redis_set_to_delete)
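            # The rename-then-delete handling above gives readers of the
            # alerter metrics sets an uninterrupted view: the previous
            # generation is renamed to <set>.old before the new one is
            # rebuilt, and the .old copy is only deleted here once the new
            # set is fully populated.  A minimal generic sketch of the same
            # pattern (hypothetical set names and a placeholder generator):
            #
            # redis_conn.rename('myapp.current', 'myapp.current.old')
            # for item in rebuild_items():
            #     redis_conn.sadd('myapp.current', item)
            # redis_conn.delete('myapp.current.old')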