AIL-framework/bin/ZMQ_Sub_Curve.py

#!/usr/bin/env python2
# -*-coding:UTF-8 -*
"""
The ZMQ_Sub_Curve Module
============================

This module consumes the Redis list created by the ZMQ_Sub_Curve_Q module.

This module updates a .csv file used to draw curves representing selected words and their occurrences per day.

.. note:: The channel will have the name of the file created.

.. note:: Modules ZMQ_Something_Q and ZMQ_Something are closely bound; always
   use the same subscriber name in both of them.

Requirements
------------

* Running Redis instances are needed. (Redis)
* The category files of words in /files/ need to be created.
* The ZMQ_PubSub_Tokenize_Q module must be running for this module to work properly.

"""
import redis, argparse, zmq, ConfigParser, time
from packages import Paste as P
from packages import ZMQ_PubSub
from pubsublogger import publisher
from packages import lib_words

# Path of the configuration file read by main() and handed to
# ZMQ_PubSub.ZMQSub. It is relative, so it is resolved against the current
# working directory of the process.
configfile = './packages/config.cfg'

def main():
    """Consume word messages from the Redis queue and update word scores.

    The function reads ``configfile``, connects to the two Redis servers
    described in the "Redis_Queues" and "Redis_Level_DB" sections,
    subscribes to channel_0 of the "PubSub_Words" section and then loops:

    * Each message is expected to hold four whitespace-separated fields:
      channel, paste filename, word and score. Messages with another number
      of fields are logged and skipped instead of crashing the loop.
    * Whenever the paste filename differs from the one of the previous
      message, the paste is loaded and
      ``lib_words.create_curve_with_word_file`` is called for the year and
      month of the paste date.
    * The score is added to the value stored in the hash named after the
      lower-cased word, under the field given by the paste date.

    When no message is available, the "SHUTDOWN_FLAGS" set is checked for
    the "Curve" member: if present, the member is removed and the function
    returns; otherwise the function sleeps one second and polls again.
    """

    # CONFIG #
    cfg = ConfigParser.ConfigParser()
    cfg.read(configfile)

    # SCRIPT PARSER #
    parser = argparse.ArgumentParser(
        description='''This script is a part of the Analysis Information
    Leak framework.''',
        epilog='')

    parser.add_argument(
        '-l',
        type=str,
        default="../files/list_categ_files",
        help='Path to the list_categ_files (../files/list_categ_files)',
        action='store')

    # The parsed values are not used below, but parsing still validates the
    # command line and serves -h/--help.
    parser.parse_args()

    # REDIS #
    r_serv = redis.StrictRedis(
        host=cfg.get("Redis_Queues", "host"),
        port=cfg.getint("Redis_Queues", "port"),
        db=cfg.getint("Redis_Queues", "db"))

    # The port is read with getint so that both connections receive an
    # integer port (the original passed the raw string here).
    r_serv1 = redis.StrictRedis(
        host=cfg.get("Redis_Level_DB", "host"),
        port=cfg.getint("Redis_Level_DB", "port"),
        db=0)

    # LOGGING #
    publisher.channel = "Script"

    # ZMQ #
    channel = cfg.get("PubSub_Words", "channel_0")
    subscriber_name = "curve"
    subscriber_config_section = "PubSub_Words"

    Sub = ZMQ_PubSub.ZMQSub(configfile, subscriber_config_section, channel,
                            subscriber_name)

    # FUNCTIONS #
    publisher.info("Script Curve subscribed to channel {0}".format(channel))

    # FILE CURVE SECTION #
    csv_path = cfg.get("Directories", "wordtrending_csv")
    wordfile_path = cfg.get("Directories", "wordsfile")

    prec_filename = None
    PST = None
    while True:
        message = Sub.get_msg_from_queue(r_serv)

        if message is None:
            # Empty queue: stop if a shutdown was requested, else idle.
            if r_serv.sismember("SHUTDOWN_FLAGS", "Curve"):
                r_serv.srem("SHUTDOWN_FLAGS", "Curve")
                print("Shutdown Flag Up: Terminating")
                publisher.warning("Shutdown Flag Up: Terminating.")
                break
            publisher.debug("Script Curve is Idling")
            print("sleepin")
            time.sleep(1)
            continue

        fields = message.split()
        if len(fields) != 4:
            # A malformed message must not take the whole consumer down.
            publisher.warning(
                "Script Curve: ignoring malformed message {0!r}".format(
                    message))
            continue
        _, filename, word, score = fields

        # Reload the paste and refresh the curve file only when the
        # message refers to a different paste than the previous one.
        if filename != prec_filename:
            PST = P.Paste(filename)
            lib_words.create_curve_with_word_file(
                r_serv1, csv_path, wordfile_path,
                int(PST.p_date.year), int(PST.p_date.month))
        prec_filename = filename

        key = word.lower()
        prev_score = r_serv1.hget(key, PST.p_date)
        print(prev_score)
        if prev_score is not None:
            r_serv1.hset(key, PST.p_date, int(prev_score) + int(score))
        else:
            r_serv1.hset(key, PST.p_date, score)


# Start the consumer loop only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()
Initial import of AIL framework - Analysis Information Leak framework AIL is a modular framework to analyse potential information leak from unstructured data source like pastes from Past ebin or similar services. AIL framework is flexible and can be extended to support other functionalities to mine sen sitive information 2014-08-06 11:43:40 +02:00			`#!/usr/bin/env python2`
			`# --coding:UTF-8 -`
			`"""`
			`The ZMQ_Sub_Curve Module`
			`============================`

Changing ZMQ Curve Module comment 2014-08-07 14:46:43 +02:00			`This module is consuming the Redis-list created by the ZMQ_Sub_Curve_Q Module.`
Initial import of AIL framework - Analysis Information Leak framework AIL is a modular framework to analyse potential information leak from unstructured data source like pastes from Pastebin or similar services. AIL framework is flexible and can be extended to support other functionalities to mine sensitive information 2014-08-06 11:43:40 +02:00
Changing ZMQ Curve Module comment 2014-08-07 14:46:43 +02:00			`This modules update a .csv file used to draw curves representing selected words and their occurency per day.`
Initial import of AIL framework - Analysis Information Leak framework AIL is a modular framework to analyse potential information leak from unstructured data source like pastes from Pastebin or similar services. AIL framework is flexible and can be extended to support other functionalities to mine sensitive information 2014-08-06 11:43:40 +02:00
			`..note:: The channel will have the name of the file created.`

			`..note:: Module ZMQ_Something_Q and ZMQ_Something are closely bound, always put`
			`the same Subscriber name in both of them.`

			`Requirements`
			`------------`

			`*Need running Redis instances. (Redis)`
			`*Categories files of words in /files/ need to be created`
			`*Need the ZMQ_PubSub_Tokenize_Q Module running to be able to work properly.`

			`"""`
			`import redis, argparse, zmq, ConfigParser, time`
			`from packages import Paste as P`
			`from packages import ZMQ_PubSub`
			`from pubsublogger import publisher`
			`from packages import lib_words`

			`configfile = './packages/config.cfg'`

			`def main():`
			`"""Main Function"""`

			`# CONFIG #`
			`cfg = ConfigParser.ConfigParser()`
			`cfg.read(configfile)`

			`# SCRIPT PARSER #`
			`parser = argparse.ArgumentParser(`
			`description = '''This script is a part of the Analysis Information`
			`Leak framework.''',`
			`epilog = '''''')`

			`parser.add_argument('-l',`
			`type = str,`
			`default = "../files/list_categ_files",`
			`help = 'Path to the list_categ_files (../files/list_categ_files)',`
			`action = 'store')`

			`args = parser.parse_args()`

			`# REDIS #`
			`r_serv = redis.StrictRedis(`
			`host = cfg.get("Redis_Queues", "host"),`
			`port = cfg.getint("Redis_Queues", "port"),`
			`db = cfg.getint("Redis_Queues", "db"))`

			`r_serv1 = redis.StrictRedis(`
			`host = cfg.get("Redis_Level_DB", "host"),`
			`port = cfg.get("Redis_Level_DB", "port"),`
			`db = 0)`

			`# LOGGING #`
			`publisher.channel = "Script"`

			`# ZMQ #`
			`channel = cfg.get("PubSub_Words", "channel_0")`
			`subscriber_name = "curve"`
			`subscriber_config_section = "PubSub_Words"`

			`Sub = ZMQ_PubSub.ZMQSub(configfile, subscriber_config_section, channel, subscriber_name)`

			`# FUNCTIONS #`
			`publisher.info("Script Curve subscribed to channel {0}".format(cfg.get("PubSub_Words", "channel_0")))`

Hardcoded path from ZMQ_Curve are now referring correctly in config.cfg.sample fix #6 2014-08-11 11:33:18 +02:00			`# FILE CURVE SECTION #`
			`csv_path = cfg.get("Directories", "wordtrending_csv")`
			`wordfile_path = cfg.get("Directories", "wordsfile")`

Initial import of AIL framework - Analysis Information Leak framework AIL is a modular framework to analyse potential information leak from unstructured data source like pastes from Past ebin or similar services. AIL framework is flexible and can be extended to support other functionalities to mine sen sitive information 2014-08-06 11:43:40 +02:00			`paste_words = []`
			`message = Sub.get_msg_from_queue(r_serv)`
			`prec_filename = None`
			`while True:`
			`if message != None:`
			`channel, filename, word, score = message.split()`
			`if prec_filename == None or filename != prec_filename:`
			`PST = P.Paste(filename)`
Hardcoded path from ZMQ_Curve are now referring correctly in config.cfg.sample fix #6 2014-08-11 11:33:18 +02:00			`lib_words.create_curve_with_word_file(r_serv1, csv_path, wordfile_path, int(PST.p_date.year), int(PST.p_date.month))`
Initial import of AIL framework - Analysis Information Leak framework AIL is a modular framework to analyse potential information leak from unstructured data source like pastes from Pastebin or similar services. AIL framework is flexible and can be extended to support other functionalities to mine sensitive information 2014-08-06 11:43:40 +02:00
			`prec_filename = filename`
			`prev_score = r_serv1.hget(word.lower(), PST.p_date)`
			`print prev_score`
			`if prev_score != None:`
			`r_serv1.hset(word.lower(), PST.p_date, int(prev_score) + int(score))`
			`else:`
			`r_serv1.hset(word.lower(), PST.p_date, score)`
			`#r_serv.expire(word,86400) #1day`

			`else:`
			`if r_serv.sismember("SHUTDOWN_FLAGS", "Curve"):`
			`r_serv.srem("SHUTDOWN_FLAGS", "Curve")`
			`print "Shutdown Flag Up: Terminating"`
			`publisher.warning("Shutdown Flag Up: Terminating.")`
			`break`
			`publisher.debug("Script Curve is Idling")`
			`print "sleepin"`
			`time.sleep(1)`

			`message = Sub.get_msg_from_queue(r_serv)`


			`if __name__ == "__main__":`
			`main()`