# hastic-server/analytics/analytics/analytic_unit_manager.py

from typing import Dict
import pandas as pd
import numpy as np
import logging as log
import traceback
from concurrent.futures import Executor, ThreadPoolExecutor

import detectors
from analytic_unit_worker import AnalyticUnitWorker
from models import ModelCache


logger = log.getLogger('AnalyticUnitManager')
WORKERS_EXECUTORS = 20

AnalyticUnitId = str


def get_detector_by_type(detector_type: str, analytic_unit_type: str) -> detectors.Detector:
    """
        Builds a detector for the given detector type.

        - 'pattern' gives detectors.PatternDetector(analytic_unit_type),
        - 'threshold' gives detectors.ThresholdDetector()
          (analytic_unit_type is not used in this case).

        Raises ValueError for any other detector type.
    """
    # Reject unsupported types up front so only the two known cases remain.
    if detector_type not in ('pattern', 'threshold'):
        raise ValueError('Unknown detector type "%s"' % detector_type)

    if detector_type == 'threshold':
        return detectors.ThresholdDetector()
    return detectors.PatternDetector(analytic_unit_type)

def prepare_data(data: list) -> pd.DataFrame:
    """
        Takes list of [timestamp, value] rows and
        - converts it into pd.DataFrame with 'timestamp' and 'value' columns,
        - converts 'timestamp' column to pd.Datetime, reading the numbers
          as milliseconds since the epoch,
        - fills missing values (e.g. None) with NaN.

        The values themselves are left as they are: nothing is subtracted
        from them and they are not normalized here.

        Returns the resulting pd.DataFrame.
    """
    # Use a separate name so the `data` argument is not rebound to another type.
    frame = pd.DataFrame(data, columns=['timestamp', 'value'])
    frame['timestamp'] = pd.to_datetime(frame['timestamp'], unit='ms')
    frame.fillna(value=np.nan, inplace=True)
    return frame


class AnalyticUnitManager:
    """
        Dispatches analytic tasks to per-analytic-unit workers.

        Keeps one AnalyticUnitWorker per analytic unit id. Every worker is
        constructed with the same ThreadPoolExecutor, which is limited to
        WORKERS_EXECUTORS threads.
    """

    def __init__(self):
        self.analytic_workers: Dict[AnalyticUnitId, AnalyticUnitWorker] = dict()
        self.workers_executor = ThreadPoolExecutor(max_workers=WORKERS_EXECUTORS)

    def __ensure_worker(
        self,
        analytic_unit_id: AnalyticUnitId,
        detector_type: str,
        analytic_unit_type: str
    ) -> AnalyticUnitWorker:
        """
            Returns the worker registered for analytic_unit_id, creating and
            registering a new one if there is none yet.

            For an already registered id the existing worker is returned as is;
            detector_type and analytic_unit_type are ignored in that case.

            Raises ValueError (from get_detector_by_type) if a new worker is
            needed and detector_type is unknown.
        """
        if analytic_unit_id in self.analytic_workers:
            # TODO: check that type is the same
            return self.analytic_workers[analytic_unit_id]
        detector = get_detector_by_type(detector_type, analytic_unit_type)
        worker = AnalyticUnitWorker(analytic_unit_id, detector, self.workers_executor)
        self.analytic_workers[analytic_unit_id] = worker
        return worker

    async def __handle_analytic_task(self, task) -> dict:
        """
            Runs a single task and returns its payload.

            task is a dict with 'analyticUnitId' and 'type'; every type except
            'CANCEL' also needs 'payload' with 'detector', 'analyticUnitType',
            'data' and 'cache' keys.

            - 'CANCEL': cancels the worker of the analytic unit if there is one,
              returns None,
            - 'PUSH': passes data to the worker and adds 'analyticUnitId'
              to the result,
            - 'LEARN': trains using payload 'segments' or, if absent,
              payload 'threshold',
            - 'DETECT': runs detection.

            Raises ValueError for an unknown task type or for a LEARN payload
            with neither 'segments' nor 'threshold'; KeyError for missing keys.
        """
        analytic_unit_id: AnalyticUnitId = task['analyticUnitId']
        task_type = task['type']

        if task_type == 'CANCEL':
            if analytic_unit_id in self.analytic_workers:
                self.analytic_workers[analytic_unit_id].cancel()
            return

        # Reject unknown types before touching any state: otherwise a bogus
        # task would still register a worker and build a DataFrame.
        if task_type not in ('PUSH', 'LEARN', 'DETECT'):
            raise ValueError('Unknown task type "%s"' % task_type)

        payload = task['payload']
        worker = self.__ensure_worker(analytic_unit_id, payload['detector'], payload['analyticUnitType'])
        data = prepare_data(payload['data'])

        if task_type == 'PUSH':
            # TODO: do it a better way
            res = await worker.recieve_data(data, payload['cache'])
            res.update({ 'analyticUnitId': analytic_unit_id })
            return res

        if task_type == 'LEARN':
            # 'segments' takes precedence over 'threshold' when both are present.
            if 'segments' in payload:
                train_input = payload['segments']
            elif 'threshold' in payload:
                train_input = payload['threshold']
            else:
                raise ValueError('No segments or threshold in LEARN payload')
            return await worker.do_train(train_input, data, payload['cache'])

        # Only 'DETECT' is left at this point.
        return await worker.do_detect(data, payload['cache'])

    async def handle_analytic_task(self, task):
        """
            Runs the task and wraps the outcome into a result message.

            Returns { 'status': 'SUCCESS', 'payload': <payload or None> } when
            the task was handled, or { 'status': 'FAILED', 'error': <text> }
            when handling raised an Exception. Exceptions are not propagated
            to the caller; the traceback is written to the log instead.
        """
        try:
            result_payload = await self.__handle_analytic_task(task)
        except Exception as e:
            error_text = traceback.format_exc()
            # The message returned to the caller carries only str(e), so the
            # full traceback is logged here to keep failures debuggable.
            logger.error('Failed to handle analytic task: %s', error_text)
            # TODO: move result to a class which renders to json for messaging to analytics
            return {
                'status': 'FAILED',
                'error': str(e)
            }
        return {
            'status': 'SUCCESS',
            'payload': result_payload
        }
One panel - one worker #62 6 years ago			`from typing import Dict`
Fix learning (#116) 6 years ago			`import pandas as pd`
Incorrect work of analytics with nan filled dataset #247 (#248) 6 years ago			`import numpy as np`
Fix webhooks (#341) 5 years ago			`import logging as log`
			`import traceback`
Workers for analyticunits #203 (#265) * rm async from analytic_unit_worker + some refactorings in maager * AnalyticUnitManager * workers for analytic units 6 years ago			`from concurrent.futures import Executor, ThreadPoolExecutor`
One panel - one worker #62 6 years ago
			`import detectors`
			`from analytic_unit_worker import AnalyticUnitWorker`
Error: detect missing cache #299 (#302) * Pass cache to detect * rename AnalyticUnitCache to ModelCache * Send .data from cache * Drop nans from bucket && set window size from cache && check cache None * Read proper payload on DETECT message 6 years ago			`from models import ModelCache`
One panel - one worker #62 6 years ago
Workers for analyticunits #203 (#265) * rm async from analytic_unit_worker + some refactorings in maager * AnalyticUnitManager * workers for analytic units 6 years ago
Fix webhooks (#341) 5 years ago			`logger = log.getLogger('AnalyticUnitManager')`
Workers for analyticunits #203 (#265) * rm async from analytic_unit_worker + some refactorings in maager * AnalyticUnitManager * workers for analytic units 6 years ago			`WORKERS_EXECUTORS = 20`
analytics repair 6 years ago
analytics clearup 6 years ago			`AnalyticUnitId = str`
One panel - one worker #62 6 years ago
analytics clearup 6 years ago
Threshold detector #324 (#330) 6 years ago			`def get_detector_by_type(detector_type: str, analytic_unit_type: str) -> detectors.Detector:`
			`if detector_type == 'pattern':`
			`return detectors.PatternDetector(analytic_unit_type)`
			`elif detector_type == 'threshold':`
			`return detectors.ThresholdDetector()`

			`raise ValueError('Unknown detector type "%s"' % detector_type)`
One panel - one worker #62 6 years ago
Make all models work && add reverse peak model (#124) - Subtract min value from dataset before passing to model - Rename StepModel -> DropModel - Use cache to save state in all models - Return `Segment { 'from': <timestamp>, 'to': <timestamp>}` instead of `Segment { 'from': <index>, 'to': <index>}` in all models - Integrate new peaks model (from https://github.com/hastic/hastic-server/pull/123) - Integrate new reverse-peaks model (from https://github.com/hastic/hastic-server/pull/123) - Refactor: make `predict` method in `Model` not abstract and remove it from all children - Refactor: add abstract `do_predict` method to models 6 years ago			`def prepare_data(data: list):`
			`"""`
			`Takes list`
			`- converts it into pd.DataFrame,`
			`- converts 'timestamp' column to pd.Datetime,`
			`- subtracts min value from dataset`
			`"""`
			`data = pd.DataFrame(data, columns=['timestamp', 'value'])`
Convert timestamps from s to ms 6 years ago			`data['timestamp'] = pd.to_datetime(data['timestamp'], unit='ms')`
Convert None to NaN before sending data to model #333 (#334) 5 years ago			`data.fillna(value = np.nan, inplace = True)`
Make all models work && add reverse peak model (#124) - Subtract min value from dataset before passing to model - Rename StepModel -> DropModel - Use cache to save state in all models - Return `Segment { 'from': <timestamp>, 'to': <timestamp>}` instead of `Segment { 'from': <index>, 'to': <index>}` in all models - Integrate new peaks model (from https://github.com/hastic/hastic-server/pull/123) - Integrate new reverse-peaks model (from https://github.com/hastic/hastic-server/pull/123) - Refactor: make `predict` method in `Model` not abstract and remove it from all children - Refactor: add abstract `do_predict` method to models 6 years ago			`return data`
Workers for analyticunits #203 (#265) * rm async from analytic_unit_worker + some refactorings in maager * AnalyticUnitManager * workers for analytic units 6 years ago

			`class AnalyticUnitManager:`

			`def __init__(self):`
			`self.analytic_workers: Dict[AnalyticUnitId, AnalyticUnitWorker] = dict()`
			`self.workers_executor = ThreadPoolExecutor(max_workers=WORKERS_EXECUTORS)`

Threshold detector #324 (#330) 6 years ago			`def __ensure_worker(`
			`self,`
			`analytic_unit_id: AnalyticUnitId,`
			`detector_type: str,`
			`analytic_unit_type: str`
			`) -> AnalyticUnitWorker:`
Workers for analyticunits #203 (#265) * rm async from analytic_unit_worker + some refactorings in maager * AnalyticUnitManager * workers for analytic units 6 years ago			`if analytic_unit_id in self.analytic_workers:`
			`# TODO: check that type is the same`
			`return self.analytic_workers[analytic_unit_id]`
Threshold detector #324 (#330) 6 years ago			`detector = get_detector_by_type(detector_type, analytic_unit_type)`
Workers for analyticunits #203 (#265) * rm async from analytic_unit_worker + some refactorings in maager * AnalyticUnitManager * workers for analytic units 6 years ago			`worker = AnalyticUnitWorker(analytic_unit_id, detector, self.workers_executor)`
			`self.analytic_workers[analytic_unit_id] = worker`
			`return worker`

Analytic unit predict event #277 (#280) 6 years ago			`async def __handle_analytic_task(self, task) -> dict:`
			`"""`
			`returns payload or None`
			`"""`
			`analytic_unit_id: AnalyticUnitId = task['analyticUnitId']`

			`if task['type'] == 'CANCEL':`
			`if analytic_unit_id in self.analytic_workers:`
			`self.analytic_workers[analytic_unit_id].cancel()`
			`return`

			`payload = task['payload']`
Threshold detector #324 (#330) 6 years ago			`worker = self.__ensure_worker(analytic_unit_id, payload['detector'], payload['analyticUnitType'])`
Analytic unit predict event #277 (#280) 6 years ago			`data = prepare_data(payload['data'])`
Analytic unit worker bucket #273 (#297) 6 years ago			`if task['type'] == 'PUSH':`
Fix threshold detector (#331) 5 years ago			`# TODO: do it a better way`
			`res = await worker.recieve_data(data, payload['cache'])`
Fix webhooks (#341) 5 years ago			`res.update({ 'analyticUnitId': analytic_unit_id })`
			`return res`
Analytic unit worker bucket #273 (#297) 6 years ago			`elif task['type'] == 'LEARN':`
Threshold detector #324 (#330) 6 years ago			`if 'segments' in payload:`
			`return await worker.do_train(payload['segments'], data, payload['cache'])`
			`elif 'threshold' in payload:`
			`return await worker.do_train(payload['threshold'], data, payload['cache'])`
			`else:`
			`raise ValueError('No segments or threshold in LEARN payload')`
Rename predict to detect #279 (#284) * dummy rename * fixes * renaming in analytics 6 years ago			`elif task['type'] == 'DETECT':`
			`return await worker.do_detect(data, payload['cache'])`
Analytic unit predict event #277 (#280) 6 years ago
			`raise ValueError('Unknown task type "%s"' % task['type'])`

Workers for analyticunits #203 (#265) * rm async from analytic_unit_worker + some refactorings in maager * AnalyticUnitManager * workers for analytic units 6 years ago			`async def handle_analytic_task(self, task):`
			`try:`
Analytic unit predict event #277 (#280) 6 years ago			`result_payload = await self.__handle_analytic_task(task)`
Fix webhooks (#341) 5 years ago			`result_message = {`
Workers for analyticunits #203 (#265) * rm async from analytic_unit_worker + some refactorings in maager * AnalyticUnitManager * workers for analytic units 6 years ago			`'status': 'SUCCESS',`
			`'payload': result_payload`
			`}`
Fix webhooks (#341) 5 years ago			`return result_message`
Workers for analyticunits #203 (#265) * rm async from analytic_unit_worker + some refactorings in maager * AnalyticUnitManager * workers for analytic units 6 years ago			`except Exception as e:`
			`error_text = traceback.format_exc()`
			`# TODO: move result to a class which renders to json for messaging to analytics`
			`return {`
			`'status': 'FAILED',`
			`'error': str(e)`
			`}`