AIL-framework/bin/ZMQ_Sub_Curve.py

#!/usr/bin/env python2
# -*-coding:UTF-8 -*
"""
The ZMQ_Sub_Curve Module
============================

This module is consuming the Redis-list created by the ZMQ_Sub_Curve_Q Module.

This module updates a .csv file used to draw curves representing selected words and their number of occurrences per day.

.. note:: The channel will have the name of the file created.

.. note:: The ZMQ_Something_Q and ZMQ_Something modules are closely bound; always use
   the same Subscriber name in both of them.

Requirements
------------

* Requires running Redis instances (Redis).
* The category word files in /files/ must be created beforehand.
* Requires the ZMQ_PubSub_Tokenize_Q Module to be running in order to work properly.

"""
import redis, argparse, zmq, ConfigParser, time
from packages import Paste as P
from packages import ZMQ_PubSub
from pubsublogger import publisher
from packages import lib_words

# Path of the framework configuration file. It is a relative path, so it is
# resolved against the directory the script is launched from.
configfile = "./packages/config.cfg"

def main():
    """Run the Curve subscriber loop.

    Reads ``configfile``, parses the command line, opens two Redis
    connections and then consumes messages from the subscriber queue until
    a shutdown flag is raised.

    Connections:
      * ``Redis_Queues``   -- holds the message queue read through
        ``Sub.get_msg_from_queue`` and the ``SHUTDOWN_FLAGS`` set.
      * ``Redis_Level_DB`` -- (db 0) holds one hash per lower-cased word,
        whose fields are paste dates and whose values are summed scores.

    Each message must consist of exactly four whitespace-separated fields:
    ``channel filename word score``. Whenever the filename differs from the
    one of the previous message, a new ``Paste`` is built for it and
    ``lib_words.create_curve_with_word_file`` is called with the year and
    month of that paste's date.

    When the queue is empty the loop checks whether ``"Curve"`` is a member
    of the ``SHUTDOWN_FLAGS`` set; if so the flag is removed and the loop
    ends, otherwise it sleeps one second and polls again.

    Raises:
        ValueError: if a message does not split into exactly four fields,
            or if a score cannot be converted to ``int`` when it has to be
            added to an existing score.
    """

    # CONFIG #
    cfg = ConfigParser.ConfigParser()
    cfg.read(configfile)

    # SCRIPT PARSER #
    parser = argparse.ArgumentParser(
        description='''This script is a part of the Analysis Information
    Leak framework.''',
        epilog='')

    parser.add_argument(
        '-l',
        type=str,
        default="../files/list_categ_files",
        help='Path to the list_categ_files (../files/list_categ_files)',
        action='store')

    # The parsed values are not used below; parsing is kept so that --help
    # works and unknown options are still rejected.
    parser.parse_args()

    # REDIS #
    r_serv = redis.StrictRedis(
        host=cfg.get("Redis_Queues", "host"),
        port=cfg.getint("Redis_Queues", "port"),
        db=cfg.getint("Redis_Queues", "db"))

    # The port is read with getint() so that it is an integer, exactly like
    # the Redis_Queues connection above.
    r_serv1 = redis.StrictRedis(
        host=cfg.get("Redis_Level_DB", "host"),
        port=cfg.getint("Redis_Level_DB", "port"),
        db=0)

    # LOGGING #
    publisher.channel = "Script"

    # ZMQ #
    channel = cfg.get("PubSub_Words", "channel_0")
    subscriber_name = "curve"
    subscriber_config_section = "PubSub_Words"

    Sub = ZMQ_PubSub.ZMQSub(configfile, subscriber_config_section, channel, subscriber_name)

    # FUNCTIONS #
    publisher.info("Script Curve subscribed to channel {0}".format(channel))

    # FILE CURVE SECTION #
    csv_path = cfg.get("Directories", "wordtrending_csv")
    wordfile_path = cfg.get("Directories", "wordsfile")

    paste = None
    prec_filename = None
    while True:
        message = Sub.get_msg_from_queue(r_serv)

        if message is None:
            # Nothing queued: either stop on request or wait before polling again.
            if r_serv.sismember("SHUTDOWN_FLAGS", "Curve"):
                r_serv.srem("SHUTDOWN_FLAGS", "Curve")
                print("Shutdown Flag Up: Terminating")
                publisher.warning("Shutdown Flag Up: Terminating.")
                break
            publisher.debug("Script Curve is Idling")
            print("sleepin")
            time.sleep(1)
            continue

        # The first field (the channel the message came from) is not needed here.
        _, filename, word, score = message.split()

        # Consecutive messages about the same paste reuse the Paste object;
        # prec_filename starts as None, so the first message always builds one.
        if filename != prec_filename:
            paste = P.Paste(filename)
            lib_words.create_curve_with_word_file(
                r_serv1, csv_path, wordfile_path,
                int(paste.p_date.year), int(paste.p_date.month))
            prec_filename = filename

        # Accumulate the score in the hash named after the lower-cased word,
        # under the field given by the paste date.
        key = word.lower()
        day = paste.p_date
        prev_score = r_serv1.hget(key, day)
        print(prev_score)
        if prev_score is not None:
            r_serv1.hset(key, day, int(prev_score) + int(score))
        else:
            r_serv1.hset(key, day, score)


# Start the subscriber only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == '__main__':
    main()