import datetime
import time
from collections import defaultdict

ONE_DAY = 60*60*24


def getZrange(serv_redis_db, keyCateg, date, topNum, endSubkey=""):
    """Return the top `topNum` [member, score] pairs of the sorted set for
    `keyCateg` on `date`, highest score first."""
    date_str = getDateStrFormat(date)
    keyname = "{}:{}{}".format(keyCateg, date_str, endSubkey)
    data = serv_redis_db.zrange(keyname, 0, topNum-1, desc=True, withscores=True)
    data = [[record[0], record[1]] for record in data]
    return data


def noSpaceLower(text):
    """Normalize a label: lowercase it and replace spaces with underscores."""
    return text.lower().replace(' ', '_')


def push_to_redis_zset(serv_redis_db, mainKey, toAdd, endSubkey="", count=1):
    """Increment the score of `toAdd` by `count` in today's sorted set for
    `mainKey` (key format: '<mainKey>:<YYYYMMDD><endSubkey>')."""
    now = datetime.datetime.now()
    today_str = getDateStrFormat(now)
    keyname = "{}:{}{}".format(mainKey, today_str, endSubkey)
    serv_redis_db.zincrby(keyname, count, toAdd)
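

# Hedged usage sketch (illustration only, key and label names are made up):
# assuming a redis-py connection with decode_responses=True, a daily counter
# can be bumped with push_to_redis_zset and read back with getZrange.
#
#   import redis
#   serv_redis_db = redis.StrictRedis(host='localhost', port=6379, db=1,
#                                     decode_responses=True)
#   push_to_redis_zset(serv_redis_db, 'TEST_CATEG', 'some_label')
#   top10 = getZrange(serv_redis_db, 'TEST_CATEG', datetime.datetime.now(), 10)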


def getMonthSpan(date):
    """Return a datetime for every day of the month containing `date`."""
    ds = datetime.datetime(date.year, date.month, 1)
    # roll over to January of the next year when `date` is in December
    dyear = 1 if ds.month+1 > 12 else 0
    dmonth = -12 if ds.month+1 > 12 else 0
    de = datetime.datetime(ds.year + dyear, ds.month+1 + dmonth, 1)

    delta = de - ds
    to_return = []
    for i in range(delta.days):
        to_return.append(ds + datetime.timedelta(days=i))
    return to_return


def getXPrevDaysSpan(date, days):
    """Return `days`+1 datetimes walking backwards from `date`, most recent first."""
    de = date
    ds = de - datetime.timedelta(days=days)

    delta = de - ds
    to_return = []
    for i in range(delta.days+1):
        to_return.append(de - datetime.timedelta(days=i))
    return to_return
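

# Hedged illustration (made-up dates): getMonthSpan covers a whole month,
# getXPrevDaysSpan walks backwards from the given date.
#
#   len(getMonthSpan(datetime.datetime(2018, 2, 14)))     # -> 28 entries
#   getXPrevDaysSpan(datetime.datetime(2018, 2, 14), 2)   # -> Feb 14, 13, 12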


def getXPrevHoursSpan(date, hours):
    """Return `hours`+1 datetimes, one per hour, walking backwards from `date`
    (truncated to the start of its hour), most recent first."""
    de = date
    de = de.replace(minute=0, second=0, microsecond=0)
    ds = de - datetime.timedelta(hours=hours)

    delta = de - ds
    to_return = []
    for i in range(0, int(delta.total_seconds()/3600)+1):
        to_return.append(de - datetime.timedelta(hours=i))
    return to_return


def getHoursSpanOfDate(date, adaptToFitCurrentTime=True, daySpanned=6):
    """Return the 24 hourly datetimes of the day containing `date`.
    When `adaptToFitCurrentTime` is True, hours in the future or older than
    `daySpanned` days are skipped so the span stays inside the charted window."""
    ds = date
    ds = ds.replace(hour=0, minute=0, second=0, microsecond=0)
    to_return = []
    now = datetime.datetime.now()
    for i in range(0, 24):
        the_date = ds + datetime.timedelta(hours=i)
        # avoid going outside the charted window
        if adaptToFitCurrentTime and (the_date > now or the_date < now - datetime.timedelta(days=daySpanned)):
            continue
        to_return.append(the_date)
    return to_return


def getDateStrFormat(date):
    """Format a datetime as 'YYYYMMDD', the day suffix used in the Redis key names."""
    return str(date.year)+str(date.month).zfill(2)+str(date.day).zfill(2)


def getDateHoursStrFormat(date):
    """Format a datetime as 'YYYYMMDD<hour>' (note: the hour is not zero-padded)."""
    return getDateStrFormat(date)+str(date.hour)


def getTimestamp(date):
    """Convert a (local-time) datetime to epoch seconds."""
    return int(time.mktime(date.timetuple()))
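

# Hedged example (made-up date) of the formatting helpers above:
#
#   d = datetime.datetime(2018, 3, 7, 9, 5)
#   getDateStrFormat(d)        # -> '20180307'
#   getDateHoursStrFormat(d)   # -> '201803079'
#   getTimestamp(d)            # -> epoch seconds for d, local timezone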


def sortByTrendingScore(toSort, topNum=5):
    """Given a list of [timestamp, dailyData] pairs, where dailyData is a list
    of [label, occurrence] pairs, keep only the `topNum` labels with the best
    decayed score. Earlier entries in `toSort` weigh more, since the decay
    factor shrinks with the index."""
    scoredLabels = defaultdict(float)
    numDay = len(toSort)
    baseDecay = 1.0
    decayRate = lambda x: baseDecay*((numDay-x**2)/numDay)

    # score every label across all days
    for i, arr in enumerate(toSort):
        timestamp = arr[0]
        dailyData = arr[1]
        for item in dailyData:
            label = item[0]
            occ = item[1]
            scoredLabels[label] += occ*decayRate(i)

    topList = [[l, s] for l, s in scoredLabels.items()]
    topList.sort(key=lambda x: x[1], reverse=True)
    topSet = [l for l, v in topList[:topNum]]

    # now that we have the top, filter out poorly scored elements
    topArray = []
    for arr in toSort:
        timestamp = arr[0]
        dailyData = arr[1]
        topDailyArray = list(filter(lambda item: (item[0] in topSet), dailyData))
        dailyCombi = [timestamp, topDailyArray]
        topArray.append(dailyCombi)

    return topArray
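

# Hedged illustration of the expected shape (example data, not from the
# project): two days of [label, occurrence] pairs, trimmed to the top 2 labels.
#
#   days = [
#       [1514764800, [['malware', 3], ['phishing', 1], ['scan', 1]]],
#       [1514851200, [['phishing', 5], ['scan', 2]]],
#   ]
#   sortByTrendingScore(days, topNum=2)
#   # -> same structure, each day's list filtered to the 2 best-scored labels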


def getFields(obj, fields):
    """Walk the nested dict `obj` following the dotted path in `fields`.
    A list encountered along the way is returned as {'name': key, 'data': list};
    a 'timestamp' key is converted to a 'YYYY-MM-DD HH:MM:SS' UTC string;
    a missing key returns None."""
    jsonWalker = fields.split('.')
    itemToExplore = obj
    lastName = ""
    try:
        for i in jsonWalker:
            itemToExplore = itemToExplore[i]
            lastName = i
            if isinstance(itemToExplore, list):
                return {'name': lastName, 'data': itemToExplore}
            else:
                if i == 'timestamp':
                    itemToExplore = datetime.datetime.utcfromtimestamp(
                        int(itemToExplore)).strftime('%Y-%m-%d %H:%M:%S')
        return itemToExplore
    except KeyError:
        return None
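

# Hedged example for getFields (made-up event structure):
#
#   event = {'Event': {'info': 'demo',
#                      'Attribute': [{'type': 'ip-dst'}],
#                      'timestamp': '1514764800'}}
#   getFields(event, 'Event.info')       # -> 'demo'
#   getFields(event, 'Event.Attribute')  # -> {'name': 'Attribute', 'data': [...]}
#   getFields(event, 'Event.timestamp')  # -> '2018-01-01 00:00:00'
#   getFields(event, 'Event.missing')    # -> None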