# hastic-server/analytics/analytics/utils/common.py

import numpy as np
import pandas as pd
import scipy.signal
from scipy.fftpack import fft
from scipy.signal import argrelextrema
from scipy.stats import gaussian_kde
from typing import Union
import utils

SHIFT_FACTOR = 0.05
CONFIDENCE_FACTOR = 0.2

def exponential_smoothing(series, alpha):
    """
    Apply simple exponential smoothing to a sequence of values.

    Every output value after the first is
    ``alpha * series[n] + (1 - alpha) * result[n - 1]``; the first output
    is ``series[0]``. NaN inputs are treated as 0.

    Parameters
    ----------
    series : sequence of numbers
        Values to smooth, accessed as ``series[n]``. It is not modified.
    alpha : float
        Weight given to the current value.

    Returns
    -------
    list
        Smoothed values, one per input value (empty for empty input).
    """
    if len(series) == 0:
        return []
    first = series[0]
    result = [0 if np.isnan(first) else first]
    for n in range(1, len(series)):
        value = series[n]
        # Substitute locally instead of writing the 0 back into the
        # caller's data.
        if np.isnan(value):
            value = 0
        result.append(alpha * value + (1 - alpha) * result[-1])
    return result

def find_steps(array, threshold):
    """
    Find the largest point inside every run that exceeds the threshold.

    The absolute value of the array is taken first, so upward and
    downward steps are not distinguished in the result. A run is only
    reported when both its rise above the threshold and its fall back
    below it lie inside the array; a run that is already above the
    threshold at the first sample, or still above it at the last one,
    is skipped.

    Parameters
    ----------
    array : numpy array
        1 dimensional array that represents time series of data points
    threshold : int / float
        Threshold value that defines a step

    Returns
    -------
    steps : list
        List of indices of the detected steps
    """
    steps = []
    array = np.abs(array)
    above_points = np.where(array > threshold, 1, 0)
    ap_dif = np.diff(above_points)
    cross_ups = np.where(ap_dif == 1)[0]
    cross_dns = np.where(ap_dif == -1)[0]
    # When the data starts above the threshold the first down-crossing has
    # no matching up-crossing; drop it so the pairs stay aligned.
    if len(cross_ups) > 0 and len(cross_dns) > 0 and cross_dns[0] < cross_ups[0]:
        cross_dns = cross_dns[1:]
    for upi, dni in zip(cross_ups, cross_dns):
        # Index k of the diff describes the transition k -> k + 1, so the
        # points above the threshold are upi + 1 .. dni inclusive.
        start = upi + 1
        steps.append(np.argmax(array[start:dni + 1]) + start)
    return steps

def anomalies_to_timestamp(anomalies):
    """
    Replace the 'from' and 'to' values of every anomaly with integer
    milliseconds, computed as ``int(value.timestamp() * 1000)``.

    The dictionaries are updated in place and the same ``anomalies``
    object is returned.
    """
    for entry in anomalies:
        for bound in ('from', 'to'):
            entry[bound] = int(entry[bound].timestamp() * 1000)
    return anomalies

def segments_box(segments):
    """
    Return the smallest 'from' and the largest 'to' over all segments,
    each converted with ``pd.to_datetime(..., unit='ms')``.

    The search starts from ``inf`` for the lower bound and ``0`` for the
    upper bound, so those are the values converted when ``segments`` is
    empty.
    """
    earliest = float("inf")
    latest = 0
    for seg in segments:
        if seg['from'] < earliest:
            earliest = seg['from']
        if seg['to'] > latest:
            latest = seg['to']
    return pd.to_datetime(earliest, unit='ms'), pd.to_datetime(latest, unit='ms')

def find_intersections(data: pd.Series, median: float) -> list:
    """
        Finds the positions where data rises through median.

        Position i is a candidate when data[i - 1] is below median and
        data[i + 1] is above it. When candidates are consecutive integers
        only the last one of each run is returned.
    """
    candidates = [
        pos for pos in range(1, len(data) - 1)
        if data[pos - 1] < median and data[pos + 1] > median
    ]
    last_rank = len(candidates) - 1
    # A candidate is dropped when the next candidate is its direct successor.
    return [
        pos for rank, pos in enumerate(candidates)
        if rank == last_rank or candidates[rank + 1] != pos + 1
    ]

def logistic_sigmoid_distribution(self, x1, x2, alpha, height):
    """
    Return a lazy ``map`` that applies ``logistic_sigmoid`` with the given
    ``alpha`` and ``height`` to every integer in ``range(x1, x2)``.

    NOTE(review): this is a module-level function, yet its first parameter
    is ``self``; the parameter is not used in the body.
    """
    def _sigmoid_at(x):
        return logistic_sigmoid(x, alpha, height)

    return map(_sigmoid_at, range(x1, x2))

def logistic_sigmoid(x, alpha, height):
    """
    Evaluate the logistic function ``height / (1 + exp(-x * alpha))``.

    Parameters
    ----------
    x : int / float
        Point at which the function is evaluated
    alpha : int / float
        Factor applied to ``x`` inside the exponent
    height : int / float
        Numerator of the expression

    Returns
    -------
    float
    """
    # The module-level imports of this file do not include math.
    import math

    return height / (1 + math.exp(-x * alpha))

def MyLogisticSigmoid(interval, alpha, heigh):
    """
    Evaluate ``heigh / (1 + exp(-i * alpha))`` for every integer ``i`` in
    ``range(-interval, interval)``.

    Parameters
    ----------
    interval : int
        Half-width of the integer range that is evaluated
    alpha : int / float
        Factor applied to ``i`` inside the exponent
    heigh : int / float
        Numerator of the expression (the parameter name is kept as it is
        for callers that pass it by keyword)

    Returns
    -------
    list
        ``2 * interval`` values, one per integer of the range
    """
    # The module-level imports of this file do not include math.
    import math

    return [heigh / (1 + math.exp(-i * alpha)) for i in range(-interval, interval)]

def find_one_jump(data, x, size, height, err):
    """
    Test whether a jump of at least ``height`` starts at position ``x``.

    Counts the positions strictly between ``x`` and ``x + size`` whose
    value is above ``data[x]`` while ``data[x + size]`` is more than
    ``height`` above ``data[x]``. Returns ``x`` when that count is greater
    than ``size * err`` and 0 otherwise, so a hit at ``x == 0`` cannot be
    told apart from a miss.
    """
    matches = sum(
        1 for pos in range(x + 1, x + size)
        if data[pos] > data[x] and data[x + size] > data[x] + height
    )
    return x if matches > size * err else 0

def find_all_jumps(data, size, height):
    """
    Collect every start position accepted by ``find_one_jump`` with an
    ``err`` of 0.9.

    Only start positions ``i`` with ``i + size`` inside ``data`` are
    tried. Position 0 is never reported because ``find_one_jump`` uses 0
    as its "no jump" result.

    Parameters
    ----------
    data : sequence of numbers
        Values to scan
    size : int
        Distance between the start of a jump and the point compared to it
    height : int / float
        Minimum rise passed on to ``find_one_jump``

    Returns
    -------
    list
        Accepted start positions in increasing order
    """
    possible_jump_list = []
    # The last start position must leave room for data[i + size].
    for i in range(len(data) - size):
        x = find_one_jump(data, i, size, height, 0.9)
        if x > 0:
            possible_jump_list.append(x)
    return possible_jump_list

def find_jump_center(cen_ind):
    """
    Pick one index out of ``cen_ind`` based on a convolution result.

    NOTE(review): ``pat_sigm``, ``flat_data``, ``WINDOW_SIZE`` and ``c`` are
    neither parameters nor module-level names visible in this file, so a
    call raises NameError unless they are provided as globals elsewhere --
    confirm whether this function is still used.
    """
    jump_center = cen_ind[0]
    for i in range(len(cen_ind)):
        x = cen_ind[i]
        # Convolve pat_sigm with the slice of flat_data that spans
        # WINDOW_SIZE positions on each side of x.
        cx = scipy.signal.fftconvolve(pat_sigm, flat_data[x - WINDOW_SIZE : x + WINDOW_SIZE])
        # Remember the convolution value at offset 2 * WINDOW_SIZE.
        c.append(cx[2 * WINDOW_SIZE])
        # NOTE(review): this compares the whole array cx, not the value just
        # stored in c, with the previous stored value -- presumably c[i] was
        # intended; confirm.
        if i > 0 and cx > c[i - 1]:
            jump_center = x
    return jump_center

def find_ind_median(median, segment_data):
    """
    Return the positions at which segment_data changes side relative to
    median.

    Position k is reported when the sign of ``median - segment_data[k]``
    differs from the sign of ``median - segment_data[k + 1]``.
    """
    values = np.array(list(segment_data))
    level = np.array([median] * len(segment_data))
    side = np.sign(level - values)
    side_changes = np.diff(side) != 0
    return np.argwhere(side_changes).ravel()

def find_jump_length(segment_data, min_line, max_line):
    """
    Measure how many points a jump takes to get from min_line to max_line.

    The length is the distance from the last position where the data
    changes side relative to ``min_line`` to the first position where it
    changes side relative to ``max_line``, plus one.

    Parameters
    ----------
    segment_data : iterable of numbers
        Values of the segment that contains the jump
    min_line : int / float
        Level before the jump
    max_line : int / float
        Level after the jump

    Returns
    -------
    int
        The length when it is positive; 0 when it is not positive or when
        one of the two lines is never crossed (a message is printed in
        both of these cases).
    """
    values = np.array(list(segment_data))
    count = len(values)
    min_crossings = np.flatnonzero(
        np.diff(np.sign(np.full(count, min_line) - values)) != 0)
    max_crossings = np.flatnonzero(
        np.diff(np.sign(np.full(count, max_line) - values)) != 0)
    # Without a crossing of each line there is nothing to measure.
    if len(min_crossings) > 0 and len(max_crossings) > 0:
        length = max_crossings[0] - min_crossings[-1] + 1
        if length > 0:
            return length
    print("find_jump_length: no rise from min_line to max_line found, returning 0")
    return 0

def find_jump(data, height, lenght):
    """
    List the start positions that are followed by a rise of more than
    ``height`` within the next ``lenght - 1`` points.

    A start position is added once for every following point that is high
    enough, so the same position can occur several times in the result.
    """
    return [
        start
        for start in range(len(data) - lenght - 1)
        for offset in range(1, lenght)
        if data[start + offset] > data[start] + height
    ]

def find_drop_length(segment_data, min_line, max_line):
    """
    Measure how many points a drop takes to get from max_line to min_line.

    The length is the distance from the last position where the data
    changes side relative to ``max_line`` to the first position where it
    changes side relative to ``min_line``, plus one.

    Parameters
    ----------
    segment_data : iterable of numbers
        Values of the segment that contains the drop
    min_line : int / float
        Level after the drop
    max_line : int / float
        Level before the drop

    Returns
    -------
    int
        The length when it is positive; 0 when it is not positive or when
        one of the two lines is never crossed (a message is printed in
        both of these cases).
    """
    values = np.array(list(segment_data))
    count = len(values)
    min_crossings = np.flatnonzero(
        np.diff(np.sign(np.full(count, min_line) - values)) != 0)
    max_crossings = np.flatnonzero(
        np.diff(np.sign(np.full(count, max_line) - values)) != 0)
    # Without a crossing of each line there is nothing to measure.
    if len(min_crossings) > 0 and len(max_crossings) > 0:
        length = min_crossings[0] - max_crossings[-1] + 1
        if length > 0:
            return length
    print("find_drop_length: no fall from max_line to min_line found, returning 0")
    return 0

def find_drop_intersections(segment_data: pd.Series, median_line: float) -> list:
    """
        Finds the positions where segment_data falls through median_line.

        Position i is a candidate when segment_data[i - 1] is above
        median_line and segment_data[i + 1] is below it. When candidates
        are consecutive integers only the last one of each run is returned.
    """
    candidates = []
    for pos in range(1, len(segment_data) - 1):
        before, after = segment_data[pos - 1], segment_data[pos + 1]
        if before > median_line and after < median_line:
            candidates.append(pos)

    kept = []
    for rank, pos in enumerate(candidates):
        has_direct_successor = (
            rank + 1 < len(candidates) and candidates[rank + 1] == pos + 1
        )
        if not has_direct_successor:
            kept.append(pos)
    return kept

def find_drop(data, height, length):
    """
    List the start positions that are followed by a fall of more than
    ``height`` within the next ``length - 1`` points.

    A start position is added once for every following point that is low
    enough, so the same position can occur several times in the result.
    """
    starts = []
    last_start = len(data) - length - 1
    for start in range(last_start):
        floor = data[start] - height
        starts.extend(
            start for offset in range(1, length) if data[start + offset] < floor
        )
    return starts

def timestamp_to_index(dataframe, timestamp):
    """
    Return the first i for which ``dataframe['timestamp'][i] >= timestamp``,
    or None when no entry qualifies.
    """
    column = dataframe['timestamp']
    positions = range(len(column))
    return next((pos for pos in positions if column[pos] >= timestamp), None)

def peak_finder(data, size):
    """
    Return every position i whose value equals the maximum of
    ``data[i - size: i + size]`` and is greater than ``data[i + 1]``.

    Only positions from ``size`` up to ``len(data) - size - 1`` are
    examined.
    """
    return [
        pos
        for pos in range(size, len(data) - size)
        if data[pos] == max(data[pos - size: pos + size])
        and data[pos] > data[pos + 1]
    ]

def ar_mean(numbers):
    """
    Return the arithmetic mean of numbers as a float; an empty input
    gives 0.0 because the divisor is never smaller than 1.
    """
    total = float(sum(numbers))
    count = len(numbers)
    divisor = count if count > 1 else 1
    return total / divisor

def get_av_model(patterns_list):
    """
    Average several equally long patterns position by position.

    Parameters
    ----------
    patterns_list : list
        Patterns to average; each one is read through ``len()`` and
        ``.values[i]``

    Returns
    -------
    list
        One float per position: the mean of the values all patterns have
        at that position. Empty when ``patterns_list`` is empty.

    Raises
    ------
    NameError
        If any pattern differs in length from the first one.
    """
    if len(patterns_list) == 0:
        return []

    x = len(patterns_list[0])
    # Every pattern is checked, not only the second one.
    if any(len(pattern) != x for pattern in patterns_list):
        raise NameError(
            'All elements of patterns_list should have same length')

    model_pat = []
    for i in range(x):
        column = [pattern.values[i] for pattern in patterns_list]
        # patterns_list is not empty here, so the divisor is at least 1.
        model_pat.append(float(sum(column)) / len(column))
    return model_pat

def close_filtering(pat_list, win_size):
    """
    Split pat_list into consecutive groups of values that lie close
    together.

    A value joins the current group when it is at most ``win_size`` above
    the last value of that group; otherwise it opens a new group. Returns
    a list of lists, or an empty list for empty input.
    """
    if len(pat_list) == 0:
        return []
    groups = [[pat_list[0]]]
    for pos in range(1, len(pat_list)):
        candidate = pat_list[pos]
        current = groups[-1]
        if candidate - win_size <= current[-1]:
            current.append(candidate)
        else:
            groups.append([candidate])
    return groups

def best_pat(pat_list, data, dir):
    """
    Choose one index from every group of indices in pat_list.

    With ``dir == 'max'`` the index with the largest ``data`` value is
    chosen, with any other ``dir`` the index with the smallest one. On
    ties the first such index of the group wins.
    """
    chosen = []
    for group in pat_list:
        best_index = group[0]
        best_value = data[best_index]
        for candidate in group:
            value = data[candidate]
            if dir == 'max':
                improved = value > best_value
            else:
                improved = value < best_value
            if improved:
                best_index, best_value = candidate, value
        chosen.append(best_index)
    return chosen

def find_nan_indexes(segment: pd.Series) -> list:
    """
    Return the positions, in iteration order, of the values of segment
    for which ``np.isnan`` is true.
    """
    return [pos for pos, is_nan in enumerate(np.isnan(segment)) if is_nan]

def check_nan_values(segment: Union[pd.Series, list]) -> Union[pd.Series, list]:
    """
    Return segment with its NaN values set to 0.

    The NaN positions come from ``utils.find_nan_indexes``; when there are
    none, segment is returned as it is, otherwise the result of
    ``utils.nan_to_zero`` is returned.
    """
    nan_positions = utils.find_nan_indexes(segment)
    if len(nan_positions) > 0:
        return utils.nan_to_zero(segment, nan_positions)
    return segment

def nan_to_zero(segment: Union[pd.Series, list], nan_list: list) -> Union[pd.Series, list]:
    """
    Write 0 at every position listed in nan_list and return segment.

    For an object whose type is exactly ``pd.Series`` the write goes
    through ``segment.values``; for anything else it goes through
    ``segment[position]``.
    """
    target = segment.values if type(segment) == pd.Series else segment
    for position in nan_list:
        target[position] = 0
    return segment

def find_confidence(segment: pd.Series) -> float:
    """
    Return CONFIDENCE_FACTOR times the difference between the largest and
    the smallest value of segment, after the segment has been passed
    through ``utils.check_nan_values``.
    """
    cleaned = utils.check_nan_values(segment)
    lowest = min(cleaned)
    highest = max(cleaned)
    value_range = highest - lowest
    return CONFIDENCE_FACTOR * value_range

def get_interval(data: pd.Series, center: int, window_size: int) -> pd.Series:
    """
    Return the slice of data from ``center - window_size`` up to and
    including ``center + window_size``, with both bounds clamped to the
    range ``0 .. len(data)``.
    """
    start = max(center - window_size, 0)
    stop = min(center + window_size + 1, len(data))
    return data[start: stop]

def subtract_min_without_nan(segment: pd.Series) -> pd.Series:
    """
    Shift segment so that its smallest value becomes 0.

    An empty segment gives an empty list. A segment for which
    ``utils.find_nan_indexes`` reports any position is returned
    unchanged.
    """
    if len(segment) == 0:
        return []
    if len(utils.find_nan_indexes(segment)) > 0:
        return segment
    return segment - min(segment)

def get_convolve(segments: list, av_model: list, data: pd.Series, window_size: int) -> list:
    """
    Compute two convolution maxima for the window around every segment.

    For each entry of segments, the window returned by
    ``utils.get_interval`` is passed through
    ``utils.subtract_min_without_nan`` and ``utils.check_nan_values``.
    The result list then receives, in this order, the maximum of the
    window convolved with itself and the maximum of the window convolved
    with av_model.
    """
    maxima = []
    for center in segments:
        window = utils.get_interval(data, center, window_size)
        window = utils.subtract_min_without_nan(window)
        window = utils.check_nan_values(window)
        self_convolution = scipy.signal.fftconvolve(window, window)
        model_convolution = scipy.signal.fftconvolve(window, av_model)
        maxima.extend((max(self_convolution), max(model_convolution)))
    return maxima

def find_jump_parameters(segment_data: pd.Series, segment_from_index: int):
    """
    Derive center index, height and length of the jump in segment_data.

    The median, upper and lower lines come from
    ``utils.get_distribution_density`` applied to the 5-point rolling mean
    of the segment (NaN values dropped). The height is the distance
    between the two lines scaled by ``1 - SHIFT_FACTOR``, the length comes
    from ``utils.find_jump_length`` and the center is the first result of
    ``utils.find_intersections`` with the median, offset by
    segment_from_index.

    Returns the tuple (center index, height, length).
    """
    smoothed = segment_data.rolling(window=5).mean().dropna()
    median_line, upper_line, lower_line = utils.get_distribution_density(smoothed)
    jump_height = (1 - SHIFT_FACTOR) * (upper_line - lower_line)
    jump_length = utils.find_jump_length(segment_data, lower_line, upper_line)
    # Positions where the raw data rises through the median line.
    crossings = utils.find_intersections(segment_data.tolist(), median_line)
    return crossings[0] + segment_from_index, jump_height, jump_length

def find_drop_parameters(segment_data: pd.Series, segment_from_index: int):
    """
    Derive center index, height and length of the drop in segment_data.

    The median, upper and lower lines come from
    ``utils.get_distribution_density`` applied to the 5-point rolling mean
    of the segment (NaN values dropped). The height is the distance
    between the two lines scaled by ``1 - SHIFT_FACTOR``, the length comes
    from ``utils.find_drop_length`` and the center is the first result of
    ``utils.find_drop_intersections`` with the median, offset by
    segment_from_index.

    Returns the tuple (center index, height, length).
    """
    smoothed = segment_data.rolling(window=5).mean().dropna()
    median_line, upper_line, lower_line = utils.get_distribution_density(smoothed)
    drop_height = (1 - SHIFT_FACTOR) * (upper_line - lower_line)
    drop_length = utils.find_drop_length(segment_data, lower_line, upper_line)
    # Positions where the raw data falls through the median line.
    crossings = utils.find_drop_intersections(segment_data.tolist(), median_line)
    return crossings[0] + segment_from_index, drop_height, drop_length

def get_distribution_density(segment: pd.Series) -> tuple:
    """
    Locate the two levels of a segment and the value that separates them,
    using a Gaussian kernel density estimate of the segment values.

    The density is evaluated on ``len(segment)`` evenly spaced points
    between ``segment.min() - 1`` and ``segment.max() + 1``. The first two
    local maxima of the density give the lower and the upper line, the
    first local minimum gives the median. When fewer than two maxima or no
    minimum are found, the lines fall back to the smallest and largest
    value scaled by ``1 - SHIFT_FACTOR`` and the median to the midpoint
    between the smallest and largest value.

    Parameters
    ----------
    segment : pd.Series
        Values of the segment

    Returns
    -------
    tuple
        (segment_median, segment_max_line, segment_min_line)
    """
    min_jump = min(segment)
    max_jump = max(segment)
    pdf = gaussian_kde(segment)
    x = np.linspace(segment.min() - 1, segment.max() + 1, len(segment))
    # Column 0 holds the grid position, column 1 the density; float32 is
    # the precision the extrema search has always worked with.
    grid = np.column_stack((x, pdf(x))).astype(np.float32)
    # Only the density can have extrema, the grid positions never decrease.
    density = grid[:, 1]
    antipeaks_kde = argrelextrema(density, np.less)[0]
    peaks_kde = argrelextrema(density, np.greater)[0]
    try:
        segment_min_line = grid[peaks_kde[0], 0]
        segment_max_line = grid[peaks_kde[1], 0]
        segment_median = grid[antipeaks_kde[0], 0]
    except IndexError:
        segment_max_line = max_jump * (1 - SHIFT_FACTOR)
        segment_min_line = min_jump * (1 - SHIFT_FACTOR)
        segment_median = (max_jump - min_jump) / 2 + min_jump
    return segment_median, segment_max_line, segment_min_line
Unit testing for analytics project #216 (#223) 6 years ago			`import numpy as np`
			`import pandas as pd`
Move repeating code from models to utils #270 (#272) peak / trough / jump / drop / general common code to and utils refactoring 6 years ago			`import scipy.signal`
			`from scipy.fftpack import fft`
			`from scipy.signal import argrelextrema`
			`from scipy.stats import gaussian_kde`
Add some sort of verification of incoming and outgoing data in analytics #227 (#281) * fix find_confidence * fix get_interval * fix subtract_min_without_nan * fix substract and get_convolve 6 years ago			`from typing import Union`
Move repeating code from models to utils #270 (#272) peak / trough / jump / drop / general common code to and utils refactoring 6 years ago			`import utils`
Models with filtering#186 (#218) 6 years ago
The center of drop and jump patterns is shifted from real value #291 (#292) * fix centers in jumps and drops * coeff * add simple docstring * fix utils * fix spaces * fix names 6 years ago			`SHIFT_FACTOR = 0.05`
			`CONFIDENCE_FACTOR = 0.2`

Unit testing for analytics project #216 (#223) 6 years ago			`def exponential_smoothing(series, alpha):`
			`result = [series[0]]`
Incorrect work of analytics with nan filled dataset #247 (#248) 6 years ago			`if np.isnan(result):`
			`result = [0]`
Unit testing for analytics project #216 (#223) 6 years ago			`for n in range(1, len(series)):`
Incorrect work of analytics with nan filled dataset #247 (#248) 6 years ago			`if np.isnan(series[n]):`
			`series[n] = 0`
Unit testing for analytics project #216 (#223) 6 years ago			`result.append(alpha * series[n] + (1 - alpha) * result[n - 1])`
			`return result`

			`def find_steps(array, threshold):`
			`"""`
			`Finds local maxima by segmenting array based on positions at which`
			`the threshold value is crossed. Note that this thresholding is`
			`applied after the absolute value of the array is taken. Thus,`
			`the distinction between upward and downward steps is lost. However,`
			`get_step_sizes can be used to determine directionality after the`
			`fact.`
			`Parameters`
			`----------`
			`array : numpy array`
			`1 dimensional array that represents time series of data points`
			`threshold : int / float`
			`Threshold value that defines a step`
			`Returns`
			`-------`
			`steps : list`
			`List of indices of the detected steps`
			`"""`
			`steps = []`
			`array = np.abs(array)`
			`above_points = np.where(array > threshold, 1, 0)`
			`ap_dif = np.diff(above_points)`
			`cross_ups = np.where(ap_dif == 1)[0]`
			`cross_dns = np.where(ap_dif == -1)[0]`
			`for upi, dni in zip(cross_ups,cross_dns):`
			`steps.append(np.argmax(array[upi:dni]) + upi)`
			`return steps`

			`def anomalies_to_timestamp(anomalies):`
			`for anomaly in anomalies:`
			`anomaly['from'] = int(anomaly['from'].timestamp() * 1000)`
			`anomaly['to'] = int(anomaly['to'].timestamp() * 1000)`
			`return anomalies`

			`def segments_box(segments):`
			`max_time = 0`
			`min_time = float("inf")`
			`for segment in segments:`
			`min_time = min(min_time, segment['from'])`
			`max_time = max(max_time, segment['to'])`
			`min_time = pd.to_datetime(min_time, unit='ms')`
			`max_time = pd.to_datetime(max_time, unit='ms')`
			`return min_time, max_time`

The center of drop and jump patterns is shifted from real value #291 (#292) * fix centers in jumps and drops * coeff * add simple docstring * fix utils * fix spaces * fix names 6 years ago			`def find_intersections(data: pd.Series, median: float) -> list:`
Unit testing for analytics project #216 (#223) 6 years ago			`"""`
The center of drop and jump patterns is shifted from real value #291 (#292) * fix centers in jumps and drops * coeff * add simple docstring * fix utils * fix spaces * fix names 6 years ago			`Finds all intersections between drop pattern data and median`
Unit testing for analytics project #216 (#223) 6 years ago			`"""`
			`cen_ind = []`
The center of drop and jump patterns is shifted from real value #291 (#292) * fix centers in jumps and drops * coeff * add simple docstring * fix utils * fix spaces * fix names 6 years ago			`for i in range(1, len(data) - 1):`
Unit testing for analytics project #216 (#223) 6 years ago			`if data[i - 1] < median and data[i + 1] > median:`
			`cen_ind.append(i)`
			`del_ind = []`
			`for i in range(1, len(cen_ind)):`
			`if cen_ind[i] == cen_ind[i - 1] + 1:`
			`del_ind.append(i - 1)`
trim trailing whitespaces 6 years ago
Unit testing for analytics project #216 (#223) 6 years ago			`return [x for (idx, x) in enumerate(cen_ind) if idx not in del_ind]`

			`def logistic_sigmoid_distribution(self, x1, x2, alpha, height):`
			`return map(lambda x: logistic_sigmoid(x, alpha, height), range(x1, x2))`

			`def logistic_sigmoid(x, alpha, height):`
			`return height / (1 + math.exp(-x * alpha))`

			`def MyLogisticSigmoid(interval, alpha, heigh):`
			`distribution = []`
			`for i in range(-interval, interval):`
			`F = height / (1 + math.exp(-i * alpha))`
			`distribution.append(F)`
			`return distribution`

			`def find_one_jump(data, x, size, height, err):`
			`l = []`
			`for i in range(x + 1, x + size):`
			`if (data[i] > data[x] and data[x + size] > data[x] + height):`
			`l.append(data[i])`
			`if len(l) > size * err:`
			`return x`
			`else:`
			`return 0`

			`def find_all_jumps(data, size, height):`
			`possible_jump_list = []`
			`for i in range(len(data - size)):`
			`x = find_one_jump(data, i, size, height, 0.9)`
			`if x > 0:`
			`possible_jump_list.append(x)`
			`return possible_jump_list`

			`def find_jump_center(cen_ind):`
			`jump_center = cen_ind[0]`
			`for i in range(len(cen_ind)):`
			`x = cen_ind[i]`
			`cx = scipy.signal.fftconvolve(pat_sigm, flat_data[x - WINDOW_SIZE : x + WINDOW_SIZE])`
			`c.append(cx[2 * WINDOW_SIZE])`
			`if i > 0 and cx > c[i - 1]:`
			`jump_center = x`
			`return jump_center`

			`def find_ind_median(median, segment_data):`
			`x = np.arange(0, len(segment_data))`
			`f = []`
			`for i in range(len(segment_data)):`
			`f.append(median)`
			`f = np.array(f)`
trim trailing whitespaces 6 years ago			`g = []`
Unit testing for analytics project #216 (#223) 6 years ago			`for i in segment_data:`
			`g.append(i)`
			`g = np.array(g)`
			`idx = np.argwhere(np.diff(np.sign(f - g)) != 0).reshape(-1) + 0`
			`return idx`

			`def find_jump_length(segment_data, min_line, max_line):`
			`x = np.arange(0, len(segment_data))`
			`f = []`
			`l = []`
			`for i in range(len(segment_data)):`
			`f.append(min_line)`
			`l.append(max_line)`
			`f = np.array(f)`
			`l = np.array(l)`
trim trailing whitespaces 6 years ago			`g = []`
Unit testing for analytics project #216 (#223) 6 years ago			`for i in segment_data:`
			`g.append(i)`
			`g = np.array(g)`
			`idx = np.argwhere(np.diff(np.sign(f - g)) != 0).reshape(-1) + 0`
			`idl = np.argwhere(np.diff(np.sign(l - g)) != 0).reshape(-1) + 0`
			`if (idl[0] - idx[-1] + 1) > 0:`
			`return idl[0] - idx[-1] + 1`
			`else:`
			`print("retard alert!")`
			`return 0`
trim trailing whitespaces 6 years ago
Unit testing for analytics project #216 (#223) 6 years ago			`def find_jump(data, height, lenght):`
			`j_list = []`
			`for i in range(len(data)-lenght-1):`
			`for x in range(1, lenght):`
			`if(data[i+x] > data[i] + height):`
			`j_list.append(i)`
			`return(j_list)`

			`def find_drop_length(segment_data, min_line, max_line):`
			`x = np.arange(0, len(segment_data))`
			`f = []`
			`l = []`
			`for i in range(len(segment_data)):`
			`f.append(min_line)`
			`l.append(max_line)`
			`f = np.array(f)`
			`l = np.array(l)`
trim trailing whitespaces 6 years ago			`g = []`
Unit testing for analytics project #216 (#223) 6 years ago			`for i in segment_data:`
			`g.append(i)`
			`g = np.array(g)`
			`idx = np.argwhere(np.diff(np.sign(f - g)) != 0).reshape(-1) + 0 #min_line`
			`idl = np.argwhere(np.diff(np.sign(l - g)) != 0).reshape(-1) + 0 #max_line`
			`if (idx[0] - idl[-1] + 1) > 0:`
			`return idx[0] - idl[-1] + 1`
			`else:`
			`print("retard alert!")`
			`return 0`

The center of drop and jump patterns is shifted from real value #291 (#292) * fix centers in jumps and drops * coeff * add simple docstring * fix utils * fix spaces * fix names 6 years ago			`def find_drop_intersections(segment_data: pd.Series, median_line: float) -> list:`
			`"""`
			`Finds all intersections between flatten data and median`
			`"""`
			`cen_ind = []`
			`for i in range(1, len(segment_data)-1):`
			`if segment_data[i - 1] > median_line and segment_data[i + 1] < median_line:`
			`cen_ind.append(i)`
			`# Delete close values except the last one`
			`del_ind = []`
			`for i in range(1, len(cen_ind)):`
			`if cen_ind[i] == cen_ind[i - 1] + 1:`
			`del_ind.append(i - 1)`

			`return [x for (idx, x) in enumerate(cen_ind) if idx not in del_ind]`
Unit testing for analytics project #216 (#223) 6 years ago
			`def find_drop(data, height, length):`
			`d_list = []`
			`for i in range(len(data)-length-1):`
			`for x in range(1, length):`
			`if(data[i+x] < data[i] - height):`
			`d_list.append(i)`
			`return(d_list)`

			`def timestamp_to_index(dataframe, timestamp):`
			`data = dataframe['timestamp']`

			`for i in range(len(data)):`
			`if data[i] >= timestamp:`
			`return i`

			`def peak_finder(data, size):`
			`all_max = []`
			`for i in range(size, len(data) - size):`
			`if data[i] == max(data[i - size: i + size]) and data[i] > data[i + 1]:`
			`all_max.append(i)`
			`return all_max`

			`def ar_mean(numbers):`
			`return float(sum(numbers)) / max(len(numbers), 1)`

			`def get_av_model(patterns_list):`
IndexError: list index out of range in get_av_model #239 (#241) 6 years ago			`if len(patterns_list) == 0:`
			`return []`

Unit testing for analytics project #216 (#223) 6 years ago			`x = len(patterns_list[0])`
Incorrect work of models with single patterns #234 (#235) add first value of patterns list = val[0] instead 0 6 years ago			`if len(patterns_list) > 1 and len(patterns_list[1]) != x:`
IndexError: list index out of range in get_av_model #239 (#241) 6 years ago			`raise NameError(`
			`'All elements of patterns_list should have same length')`

Unit testing for analytics project #216 (#223) 6 years ago			`model_pat = []`
			`for i in range(x):`
			`av_val = []`
			`for j in patterns_list:`
			`av_val.append(j.values[i])`
			`model_pat.append(ar_mean(av_val))`
			`return model_pat`
Models with filtering#186 (#218) 6 years ago
			`def close_filtering(pat_list, win_size):`
IndexError: list index out of range in close_filtering #240 (#243) 6 years ago			`if len(pat_list) == 0:`
			`return []`
Models with filtering#186 (#218) 6 years ago			`s = [[pat_list[0]]]`
			`k = 0`
			`for i in range(1, len(pat_list)):`
			`if pat_list[i] - win_size <= s[k][-1]:`
			`s[k].append(pat_list[i])`
			`else:`
			`k += 1`
			`s.append([pat_list[i]])`
			`return s`

			`def best_pat(pat_list, data, dir):`
			`new_pat_list = []`
			`for val in pat_list:`
			`max_val = data[val[0]]`
			`min_val = data[val[0]]`
Incorrect work of models with single patterns #234 (#235) add first value of patterns list = val[0] instead 0 6 years ago			`ind = val[0]`
Models with filtering#186 (#218) 6 years ago			`for i in val:`
			`if dir == 'max':`
			`if data[i] > max_val:`
			`max_val = data[i]`
			`ind = i`
			`else:`
			`if data[i] < min_val:`
			`min_val = data[i]`
			`ind = i`
			`new_pat_list.append(ind)`
			`return new_pat_list`
Proccesing for NaN values #231 (#236) 6 years ago
Add some sort of verification of incoming and outgoing data in analytics #227 (#281) * fix find_confidence * fix get_interval * fix subtract_min_without_nan * fix substract and get_convolve 6 years ago			`def find_nan_indexes(segment: pd.Series) -> list:`
Proccesing for NaN values #231 (#236) 6 years ago			`nan_list = np.isnan(segment)`
			`nan_indexes = []`
			`for i, val in enumerate(nan_list):`
			`if val:`
			`nan_indexes.append(i)`
			`return nan_indexes`

Add some sort of verification of incoming and outgoing data in analytics #227 (#281) * fix find_confidence * fix get_interval * fix subtract_min_without_nan * fix substract and get_convolve 6 years ago			`def check_nan_values(segment: Union[pd.Series, list]) -> Union[pd.Series, list]:`
			`nan_list = utils.find_nan_indexes(segment)`
			`if len(nan_list) > 0:`
			`segment = utils.nan_to_zero(segment, nan_list)`
			`return segment`

			`def nan_to_zero(segment: Union[pd.Series, list], nan_list: list) -> Union[pd.Series, list]:`
			`if type(segment) == pd.Series:`
			`for val in nan_list:`
			`segment.values[val] = 0`
			`else:`
			`for val in nan_list:`
			`segment[val] = 0`
Proccesing for NaN values #231 (#236) 6 years ago			`return segment`
Move repeating code from models to utils #270 (#272) peak / trough / jump / drop / general common code to and utils refactoring 6 years ago
			`def find_confidence(segment: pd.Series) -> float:`
Add some sort of verification of incoming and outgoing data in analytics #227 (#281) * fix find_confidence * fix get_interval * fix subtract_min_without_nan * fix substract and get_convolve 6 years ago			`segment = utils.check_nan_values(segment)`
Move repeating code from models to utils #270 (#272) peak / trough / jump / drop / general common code to and utils refactoring 6 years ago			`segment_min = min(segment)`
			`segment_max = max(segment)`
The center of drop and jump patterns is shifted from real value #291 (#292) * fix centers in jumps and drops * coeff * add simple docstring * fix utils * fix spaces * fix names 6 years ago			`return CONFIDENCE_FACTOR * (segment_max - segment_min)`
Move repeating code from models to utils #270 (#272) peak / trough / jump / drop / general common code to and utils refactoring 6 years ago
			`def get_interval(data: pd.Series, center: int, window_size: int) -> pd.Series:`
			`left_bound = center - window_size`
			`right_bound = center + window_size + 1`
Add some sort of verification of incoming and outgoing data in analytics #227 (#281) * fix find_confidence * fix get_interval * fix subtract_min_without_nan * fix substract and get_convolve 6 years ago			`if left_bound < 0:`
			`left_bound = 0`
			`if right_bound > len(data):`
			`right_bound = len(data)`
Move repeating code from models to utils #270 (#272) peak / trough / jump / drop / general common code to and utils refactoring 6 years ago			`return data[left_bound: right_bound]`

Add some sort of verification of incoming and outgoing data in analytics #227 (#281) * fix find_confidence * fix get_interval * fix subtract_min_without_nan * fix substract and get_convolve 6 years ago			`def subtract_min_without_nan(segment: pd.Series) -> pd.Series:`
			`if len(segment) == 0:`
			`return []`
			`nan_list = utils.find_nan_indexes(segment)`
			`if len(nan_list) > 0:`
			`return segment`
			`else:`
			`segment = segment - min(segment)`
Move repeating code from models to utils #270 (#272) peak / trough / jump / drop / general common code to and utils refactoring 6 years ago			`return segment`

			`def get_convolve(segments: list, av_model: list, data: pd.Series, window_size: int) -> list:`
			`labeled_segment = []`
			`convolve_list = []`
			`for segment in segments:`
			`labeled_segment = utils.get_interval(data, segment, window_size)`
			`labeled_segment = utils.subtract_min_without_nan(labeled_segment)`
Add some sort of verification of incoming and outgoing data in analytics #227 (#281) * fix find_confidence * fix get_interval * fix subtract_min_without_nan * fix substract and get_convolve 6 years ago			`labeled_segment = utils.check_nan_values(labeled_segment)`
Move repeating code from models to utils #270 (#272) peak / trough / jump / drop / general common code to and utils refactoring 6 years ago			`auto_convolve = scipy.signal.fftconvolve(labeled_segment, labeled_segment)`
			`convolve_segment = scipy.signal.fftconvolve(labeled_segment, av_model)`
			`convolve_list.append(max(auto_convolve))`
			`convolve_list.append(max(convolve_segment))`
			`return convolve_list`

			`def find_jump_parameters(segment_data: pd.Series, segment_from_index: int):`
			`flat_segment = segment_data.rolling(window=5).mean()`
			`flat_segment_dropna = flat_segment.dropna()`
			`segment_median, segment_max_line, segment_min_line = utils.get_distribution_density(flat_segment_dropna)`
The center of drop and jump patterns is shifted from real value #291 (#292) * fix centers in jumps and drops * coeff * add simple docstring * fix utils * fix spaces * fix names 6 years ago			`jump_height = (1 - SHIFT_FACTOR) * (segment_max_line - segment_min_line)`
Move repeating code from models to utils #270 (#272) peak / trough / jump / drop / general common code to and utils refactoring 6 years ago			`jump_length = utils.find_jump_length(segment_data, segment_min_line, segment_max_line) # finds all interseprions with median`
The center of drop and jump patterns is shifted from real value #291 (#292) * fix centers in jumps and drops * coeff * add simple docstring * fix utils * fix spaces * fix names 6 years ago			`cen_ind = utils.find_intersections(segment_data.tolist(), segment_median)`
Move repeating code from models to utils #270 (#272) peak / trough / jump / drop / general common code to and utils refactoring 6 years ago			`jump_center = cen_ind[0]`
The center of drop and jump patterns is shifted from real value #291 (#292) * fix centers in jumps and drops * coeff * add simple docstring * fix utils * fix spaces * fix names 6 years ago			`segment_cent_index = jump_center + segment_from_index`
Move repeating code from models to utils #270 (#272) peak / trough / jump / drop / general common code to and utils refactoring 6 years ago			`return segment_cent_index, jump_height, jump_length`

			`def find_drop_parameters(segment_data: pd.Series, segment_from_index: int):`
			`flat_segment = segment_data.rolling(window=5).mean()`
			`flat_segment_dropna = flat_segment.dropna()`
			`segment_median, segment_max_line, segment_min_line = utils.get_distribution_density(flat_segment_dropna)`
The center of drop and jump patterns is shifted from real value #291 (#292) * fix centers in jumps and drops * coeff * add simple docstring * fix utils * fix spaces * fix names 6 years ago			`drop_height = (1 - SHIFT_FACTOR) * (segment_max_line - segment_min_line)`
Move repeating code from models to utils #270 (#272) peak / trough / jump / drop / general common code to and utils refactoring 6 years ago			`drop_length = utils.find_drop_length(segment_data, segment_min_line, segment_max_line)`
The center of drop and jump patterns is shifted from real value #291 (#292) * fix centers in jumps and drops * coeff * add simple docstring * fix utils * fix spaces * fix names 6 years ago			`cen_ind = utils.find_drop_intersections(segment_data.tolist(), segment_median)`
Move repeating code from models to utils #270 (#272) peak / trough / jump / drop / general common code to and utils refactoring 6 years ago			`drop_center = cen_ind[0]`
The center of drop and jump patterns is shifted from real value #291 (#292) * fix centers in jumps and drops * coeff * add simple docstring * fix utils * fix spaces * fix names 6 years ago			`segment_cent_index = drop_center + segment_from_index`
Move repeating code from models to utils #270 (#272) peak / trough / jump / drop / general common code to and utils refactoring 6 years ago			`return segment_cent_index, drop_height, drop_length`

			`def get_distribution_density(segment: pd.Series) -> float:`
			`min_jump = min(segment)`
			`max_jump = max(segment)`
			`pdf = gaussian_kde(segment)`
			`x = np.linspace(segment.min() - 1, segment.max() + 1, len(segment))`
			`y = pdf(x)`
			`ax_list = list(zip(x, y))`
			`ax_list = np.array(ax_list, np.float32)`
			`antipeaks_kde = argrelextrema(np.array(ax_list), np.less)[0]`
			`peaks_kde = argrelextrema(np.array(ax_list), np.greater)[0]`
			`try:`
			`min_peak_index = peaks_kde[0]`
			`segment_min_line = ax_list[min_peak_index, 0]`
			`max_peak_index = peaks_kde[1]`
			`segment_max_line = ax_list[max_peak_index, 0]`
			`segment_median = ax_list[antipeaks_kde[0], 0]`
			`except IndexError:`
The center of drop and jump patterns is shifted from real value #291 (#292) * fix centers in jumps and drops * coeff * add simple docstring * fix utils * fix spaces * fix names 6 years ago			`segment_max_line = max_jump * (1 - SHIFT_FACTOR)`
			`segment_min_line = min_jump * (1 - SHIFT_FACTOR)`
Move repeating code from models to utils #270 (#272) peak / trough / jump / drop / general common code to and utils refactoring 6 years ago			`segment_median = (max_jump - min_jump) / 2 + min_jump`
			`return segment_median, segment_max_line, segment_min_line`