|
|
|
import models
|
|
|
|
import utils
|
|
|
|
|
|
|
|
# from grafana_data_provider import GrafanaDataProvider
|
|
|
|
|
|
|
|
import logging
|
|
|
|
from urllib.parse import urlparse
|
|
|
|
import os.path
|
|
|
|
import json
|
|
|
|
import config
|
|
|
|
|
|
|
|
import pandas as pd
|
|
|
|
|
|
|
|
from detectors import Detector
|
|
|
|
|
|
|
|
|
|
|
|
logger = logging.getLogger('analytic_toolset')
|
|
|
|
|
|
|
|
|
|
|
|
def resolve_model_by_pattern(pattern: str) -> models.Model:
|
|
|
|
if pattern == 'PEAK':
|
|
|
|
return models.PeaksModel()
|
|
|
|
if pattern == 'DROP':
|
|
|
|
return models.StepModel()
|
|
|
|
if pattern == 'JUMP':
|
|
|
|
return models.JumpModel()
|
|
|
|
if pattern == 'CUSTOM':
|
|
|
|
return models.CustomModel()
|
|
|
|
raise ValueError('Unknown pattern "%s"' % pattern)
|
|
|
|
|
|
|
|
|
|
|
|
class PatternDetector(Detector):
|
|
|
|
|
|
|
|
def __init__(self, pattern_type):
|
|
|
|
self.pattern_type = pattern_type
|
|
|
|
self.model = resolve_model_by_pattern(self.pattern_type)
|
|
|
|
window_size = 100
|
|
|
|
|
|
|
|
async def train(self, dataframe: pd.DataFrame, segments: list):
|
|
|
|
# TODO: pass only part of dataframe that has segments
|
|
|
|
self.model.fit(dataframe, data, segments)
|
|
|
|
self.__save_model()
|
|
|
|
return 0
|
|
|
|
|
|
|
|
async def predict(self, data):
|
|
|
|
|
|
|
|
start_index = self.data_prov.get_upper_bound(last_prediction_time)
|
|
|
|
start_index = max(0, start_index - window_size)
|
|
|
|
dataframe = self.data_prov.get_data_range(start_index)
|
|
|
|
|
|
|
|
predicted_indexes = self.model.predict(dataframe)
|
|
|
|
predicted_indexes = [(x, y) for (x, y) in predicted_indexes if x >= start_index and y >= start_index]
|
|
|
|
|
|
|
|
predicted_times = self.data_prov.inverse_transform_indexes(predicted_indexes)
|
|
|
|
segments = []
|
|
|
|
for time_value in predicted_times:
|
|
|
|
ts1 = int(time_value[0].timestamp() * 1000)
|
|
|
|
ts2 = int(time_value[1].timestamp() * 1000)
|
|
|
|
segments.append({
|
|
|
|
'start': min(ts1, ts2),
|
|
|
|
'finish': max(ts1, ts2)
|
|
|
|
})
|
|
|
|
|
|
|
|
last_dataframe_time = dataframe.iloc[-1]['timestamp']
|
|
|
|
last_prediction_time = int(last_dataframe_time.timestamp() * 1000)
|
|
|
|
return segments, last_prediction_time
|