2014-08-06 11:43:40 +02:00
|
|
|
#!/usr/bin/env python2
|
|
|
|
# -*-coding:UTF-8 -*
|
|
|
|
|
|
|
|
"""
|
|
|
|
The ZMQ_PubSub_Lines Module
|
|
|
|
============================
|
|
|
|
|
2014-08-20 15:14:57 +02:00
|
|
|
This module is consuming the Redis-list created by the ZMQ_PubSub_Line_Q
|
|
|
|
Module.
|
2014-08-06 11:43:40 +02:00
|
|
|
|
2014-08-20 15:14:57 +02:00
|
|
|
It sorts pastes by their maximum line length and publishes/forwards them to
|
|
|
|
different channels:
|
2014-08-06 11:43:40 +02:00
|
|
|
|
|
|
|
*channel_0 if max length(line) >= max
|
|
|
|
*channel_1 if max length(line) < max
|
|
|
|
|
|
|
|
The collected information about the processed pastes
|
|
|
|
(number of lines and maximum length line) are stored in Redis.
|
|
|
|
|
|
|
|
.. note:: Module ZMQ_Something_Q and ZMQ_Something are closely bound, always put
|
|
|
|
the same Subscriber name in both of them.
|
|
|
|
|
|
|
|
Requirements
|
|
|
|
------------
|
|
|
|
|
|
|
|
*Need running Redis instances. (LevelDB & Redis)
|
|
|
|
*Need the ZMQ_PubSub_Line_Q Module running to be able to work properly.
|
|
|
|
|
|
|
|
"""
|
2014-08-14 17:55:18 +02:00
|
|
|
import redis
|
|
|
|
import argparse
|
|
|
|
import time
|
|
|
|
from packages import Paste
|
2014-08-06 11:43:40 +02:00
|
|
|
from pubsublogger import publisher
|
|
|
|
|
2014-08-20 15:14:57 +02:00
|
|
|
import Helper
|
2014-08-06 11:43:40 +02:00
|
|
|
|
2014-08-20 15:14:57 +02:00
|
|
|
if __name__ == "__main__":
    # Entry point of the Lines script: take paste messages from the queue
    # helper, store each paste's line statistics in Redis, then forward the
    # paste path on one of two publish channels depending on the length of
    # its longest line.
    publisher.channel = "Script"

    config_section = 'PubSub_Global'
    config_channel = 'channel'
    subscriber_name = 'line'

    h = Helper.Redis_Queues(config_section, config_channel, subscriber_name)

    # Publisher
    pub_config_section = 'PubSub_Longlines'
    h.zmq_pub(pub_config_section, None)

    # Subscriber
    h.zmq_sub(config_section)

    # SCRIPT PARSER #
    parser = argparse.ArgumentParser(
        description='This script is a part of the Analysis Information '
                    'Leak framework.')
    parser.add_argument(
        '-max', type=int, default=500,
        help='The limit between "short lines" and "long lines"',
        action='store')
    args = parser.parse_args()

    # REDIS #
    # FIXME move it in the Paste object
    r_serv = redis.StrictRedis(
        host=h.config.get("Redis_Data_Merging", "host"),
        port=h.config.getint("Redis_Data_Merging", "port"),
        db=h.config.getint("Redis_Data_Merging", "db"))

    # channel_0 receives pastes whose longest line is >= args.max,
    # channel_1 receives all the others.
    channel_0 = h.config.get("PubSub_Longlines", "channel_0")
    channel_1 = h.config.get("PubSub_Longlines", "channel_1")

    # FUNCTIONS #
    tmp_string = ("Lines script Subscribed to channel {} and Start to "
                  "publish on channel {}, {}")
    publisher.info(tmp_string.format(h.sub_channel, channel_0, channel_1))

    while True:
        message = h.redis_rpop()
        if message is None:
            # Nothing queued: stop if a shutdown was requested, otherwise
            # wait before polling again.
            if h.redis_queue_shutdown():
                print("Shutdown Flag Up: Terminating")
                publisher.warning("Shutdown Flag Up: Terminating.")
                break
            # This used to say "Tokeniser", copied from another module.
            publisher.debug("Lines is idling 10s")
            time.sleep(10)
            continue

        # The paste path is the last space-separated field of the message.
        # It is extracted before the try block so the error handler can
        # always name the paste that failed, even when building the Paste
        # object itself raises.
        paste_path = message.split(" ")[-1]

        # Only the paste processing is guarded: an IOError raised by the
        # queue helper above is not a paste CRC problem and must not be
        # reported as one.
        try:
            paste = Paste.Paste(paste_path)
            lines_infos = paste.get_lines_info()

            # lines_infos[0] is stored as the number of lines and
            # lines_infos[1] as the maximum line length.
            paste.save_attribute_redis(r_serv, "p_nb_lines", lines_infos[0])
            paste.save_attribute_redis(r_serv, "p_max_length_line",
                                       lines_infos[1])

            r_serv.sadd("Pastes_Objects", paste.p_path)

            if lines_infos[1] >= args.max:
                h.pub_channel = channel_0
            else:
                h.pub_channel = channel_1
            h.zmq_pub_send(paste.p_path)
        except IOError:
            # Single-argument print keeps the Python 2 output format
            # (including the double space) and also parses on Python 3.
            print("CRC Checksum Error on :  {}".format(paste_path))
|