mirror of https://github.com/D4-project/d4-core
Merge pull request #8 from D4-project/metatypes
Use parent and child classes for 254 types. Use a module (child class) to change the type handler behaviour. visu-type
commit
e24b9f576b
|
@ -0,0 +1,197 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
|
||||||
|
import os
|
||||||
|
import sys
|
||||||
|
import time
|
||||||
|
import json
|
||||||
|
import redis
|
||||||
|
import datetime
|
||||||
|
|
||||||
|
DEFAULT_FILE_EXTENSION = 'txt'
DEFAULT_FILE_SEPARATOR = b'\n'
ROTATION_SAVE_CYCLE = 5 # seconds
TYPE = 254


class MetaTypesDefault:
    """Default handler for type 254 data: appends received bytes to rotating files.

    Files are written below ``../../data/<uuid>/254/<year>/<month>/<day>/<type_name>/``
    (relative to the current working directory) and are named
    ``<uuid>-<year>-<month>-<day>-<HHMMSS>.<extension>``.

    Subclasses can override ``parse_json`` / ``process_data`` to change the
    behaviour for a specific type.
    """

    def __init__(self, uuid, json_file):
        """Build a handler for ``uuid`` from the decoded JSON description.

        Args:
            uuid: identifier used in the save directory and in file names.
            json_file: mapping that must contain a ``'type'`` key.

        Raises:
            KeyError: if ``json_file`` has no ``'type'`` entry.
        """
        self.uuid = uuid
        self.type_name = json_file['type']
        self.save_path = None
        # Nothing has been stamped yet. These used to be created only by
        # save_json_file(), so processing data first raised AttributeError.
        self.last_time_saved = None
        self.last_saved_date = None
        self.parse_json(json_file)

    def test(self):
        """Print the name of the handler class (debug helper)."""
        print('class: MetaTypesDefault')

    ######## JSON PARSER ########
    def parse_json(self, json_file):
        """Set the handler options.

        The default implementation ignores the content of ``json_file`` and
        applies fixed defaults: save on disk, rotation mode enabled, no
        rotation pending, newline separator.
        """
        self.save_file_on_disk = True
        self.file_rotation_mode = True
        self.file_rotation = False
        self.file_separator = DEFAULT_FILE_SEPARATOR
        self.filename = b''.join([self.type_name.encode(), b'.txt'])

    ######## PROCESS FUNCTIONS ########
    def process_data(self, data):
        """Handle one chunk of received bytes (saved on disk when enabled)."""
        # save data on disk
        if self.is_file_saved_on_disk():
            self.save_data_to_file(data)

    ######## CORE FUNCTIONS ########

    def check_json_file(self, json_file):
        """Return True when the json object contains the mandatory type field."""
        return "type" in json_file

    # # TODO: update for non rotate_file mode
    def save_json_file(self, json_file):
        """Write ``json_file`` next to the data files and start a new data file.

        The save time/date are refreshed, the JSON is dumped to a ``.json``
        file named after that date, and the save path is then pointed at the
        data file sharing the same stamp.
        """
        self._stamp_now()
        # update save path
        self.set_save_path( os.path.join(self.get_save_dir(), self.get_filename(file_extention='json')) )
        # save json
        with open(self.get_save_path(), 'w') as f:
            f.write(json.dumps(json_file))
        # update save path for 254 files type
        self.set_save_path( os.path.join(self.get_save_dir(), self.get_filename()) )

    def save_data_to_file(self, data):
        """Persist ``data`` according to the configured mode.

        Only rotation mode is implemented; in any other mode the data is
        currently not written anywhere.
        """
        if self.is_file_rotation_mode():
            self.save_rotate_file(data)

    def save_rotate_file(self, data):
        """Append ``data`` to the current file, rotating to a new file when due.

        A rotation becomes pending when no file exists yet, when the day
        changed, or when more than ``ROTATION_SAVE_CYCLE`` seconds elapsed
        since the last stamp. A pending rotation is only carried out on a
        chunk containing the file separator: everything up to and including
        the last separator closes the old file, the remainder opens the new
        one. Chunks without a separator are appended to the current file
        while the rotation stays pending.
        """
        if not self.get_file_rotation() and self._rotation_is_due():
            self.set_rotate_file(True)

        # no rotation pending: plain append
        if not self.get_file_rotation():
            self._append_to_save_path(data)
            return

        # init save path
        if self.get_save_path() is None:
            self._refresh_save_path()

        separator = self.get_file_separator()
        # wait file separator
        if separator not in data:
            self._append_to_save_path(data)
            return

        end_file, start_new_file = data.rsplit(separator, maxsplit=1)
        # save end of file; rsplit() strips the separator, so put it back to
        # keep the byte stream intact across the two files
        self._append_to_save_path(end_file + separator)
        # set last saved date/time and update save path
        self._refresh_save_path()
        # save start of new file
        if start_new_file != b'':
            self._append_to_save_path(start_new_file)
        # end of rotation
        self.set_rotate_file(False)

    def save_same_directory(self, data):
        """Placeholder: not implemented."""
        pass

    ######## PRIVATE HELPERS ########

    def _stamp_now(self):
        """Record the current time and date as the last save stamp."""
        self.set_last_time_saved(time.time())
        self.set_last_saved_date(datetime.datetime.now().strftime("%Y%m%d%H%M%S"))

    def _refresh_save_path(self):
        """Stamp the current time and point the save path at the matching data file."""
        self._stamp_now()
        self.set_save_path( os.path.join(self.get_save_dir(), self.get_filename()) )

    def _rotation_is_due(self):
        """Return True when a new file should be started."""
        # nothing written or stamped yet: the first file still has to be created
        if self.get_save_path() is None or self.get_last_saved_date() is None:
            return True
        new_date = datetime.datetime.now().strftime("%Y%m%d%H%M%S")
        if new_date[0:8] != self.get_last_saved_date()[0:8]:
            return True
        # # TODO: change ROTATION_SAVE_CYCLE
        return int(time.time()) - self.get_last_time_saved() > ROTATION_SAVE_CYCLE

    def _append_to_save_path(self, data):
        """Append raw bytes to the file at the current save path."""
        with open(self.get_save_path(), 'ab') as f:
            f.write(data)

    ######## GET FUNCTIONS ########

    def get_type_name(self):
        """Return the value of the ``'type'`` field given at construction."""
        return self.type_name

    def get_file_separator(self):
        """Return the byte sequence on which files may be split for rotation."""
        return self.file_separator

    def get_uuid(self):
        """Return the uuid given at construction."""
        return self.uuid

    def get_filename(self, file_extention=None):
        """Return the file name for the last save stamp.

        Args:
            file_extention: extension without dot; defaults to
                ``DEFAULT_FILE_EXTENSION``.

        Returns:
            ``<uuid>-<year>-<month>-<day>-<HHMMSS>.<extension>`` in rotation
            mode, ``None`` otherwise (no naming scheme is implemented for
            the non-rotation mode).
        """
        if file_extention is None:
            file_extention = DEFAULT_FILE_EXTENSION
        # File Rotation, : data/<uuid>/254/<year>/<month>/<day>/
        if self.is_file_rotation_mode():
            return '{}-{}-{}-{}-{}.{}'.format(self.uuid, self.get_last_saved_year(), self.get_last_saved_month(), self.get_last_saved_day(), self.get_last_saved_hour_minute(), file_extention)
        return None

    def get_save_dir(self):
        """Return the directory for the last save stamp.

        Returns:
            ``../../data/<uuid>/254/<year>/<month>/<day>/<type_name>`` in
            rotation mode, ``None`` otherwise.
        """
        # File Rotation, save data in directory: data/<uuid>/254/<year>/<month>/<day>/
        if self.is_file_rotation_mode():
            data_directory_uuid_type = os.path.join('../../data', self.get_uuid(), str(TYPE))
            return os.path.join(data_directory_uuid_type, self.get_last_saved_year(), self.get_last_saved_month(), self.get_last_saved_day() , self.type_name)

        # # TODO: save global type dir ???
        return None

    def get_save_path(self):
        """Return the path of the file currently written to (None before the first save)."""
        return self.save_path

    def is_file_saved_on_disk(self):
        """Return True when received data must be written to disk."""
        return bool(self.save_file_on_disk)

    def is_file_rotation_mode(self):
        """Return True when files are rotated."""
        return bool(self.file_rotation_mode)

    def get_file_rotation(self):
        """Return True while a rotation is pending."""
        return self.file_rotation

    def get_last_time_saved(self):
        """Return the last save time as integer epoch seconds (None if never stamped)."""
        return self.last_time_saved

    def get_last_saved_date(self):
        """Return the last save date as a ``%Y%m%d%H%M%S`` string (None if never stamped)."""
        return self.last_saved_date

    def get_last_saved_year(self):
        """Return the ``YYYY`` part of the last save date."""
        return self.last_saved_date[0:4]

    def get_last_saved_month(self):
        """Return the ``MM`` part of the last save date."""
        return self.last_saved_date[4:6]

    def get_last_saved_day(self):
        """Return the ``DD`` part of the last save date."""
        return self.last_saved_date[6:8]

    def get_last_saved_hour_minute(self):
        """Return the time part of the last save date (``HHMMSS``, seconds included)."""
        return self.last_saved_date[8:14]

    ######## SET FUNCTIONS ########

    def set_rotate_file(self, boolean_value):
        """Mark a rotation as pending (True) or done (False)."""
        self.file_rotation = boolean_value

    def set_last_time_saved(self, value_time):
        """Store the last save time, truncated to whole seconds."""
        self.last_time_saved = int(value_time)

    def set_last_saved_date(self, date):
        """Store the last save date (expected as a ``%Y%m%d%H%M%S`` string)."""
        self.last_saved_date = date

    def set_save_path(self, save_path):
        """Set the current save path, creating its parent directory if needed."""
        dir_path = os.path.dirname(save_path)
        # A bare file name has no directory part and os.makedirs('') raises;
        # exist_ok avoids the race between an existence check and the creation.
        if dir_path:
            os.makedirs(dir_path, exist_ok=True)
        self.save_path = save_path
|
||||||
|
|
||||||
|
##############
|
|
@ -0,0 +1,18 @@
|
||||||
|
#!/usr/bin/env python3
|
||||||
|
|
||||||
|
import os
|
||||||
|
import sys
|
||||||
|
import time
|
||||||
|
import json
|
||||||
|
import redis
|
||||||
|
|
||||||
|
from meta_types_modules.MetaTypesDefault import MetaTypesDefault
|
||||||
|
|
||||||
|
class TypeHandler(MetaTypesDefault):
    """Type-specific handler built on top of MetaTypesDefault.

    Only the constructor trace and the ``test`` label differ from the parent
    class; all processing is inherited.
    NOTE(review): the label printed by ``test`` suggests this module serves
    the ``ja3-jl`` type -- confirm against the module's directory name.
    """

    def __init__(self, uuid, json_file):
        """Run the parent initialisation, then print a trace line."""
        super(TypeHandler, self).__init__(uuid, json_file)
        print('init_spec')

    def test(self):
        """Print the label identifying this specialised handler."""
        print('Class: ja3-jl')
|
|
@ -8,6 +8,8 @@ import redis
|
||||||
|
|
||||||
import datetime
|
import datetime
|
||||||
|
|
||||||
|
from meta_types_modules import MetaTypesDefault
|
||||||
|
|
||||||
host_redis_stream = "localhost"
|
host_redis_stream = "localhost"
|
||||||
port_redis_stream = 6379
|
port_redis_stream = 6379
|
||||||
|
|
||||||
|
@ -30,22 +32,16 @@ max_buffer_length = 100000
|
||||||
rotation_save_cycle = 10 #seconds
|
rotation_save_cycle = 10 #seconds
|
||||||
|
|
||||||
json_file_name = 'meta_json.json'
|
json_file_name = 'meta_json.json'
|
||||||
extended_type_name = None # # TODO: use default or json['file_type']
|
|
||||||
|
|
||||||
save_to_file = True
|
def get_class( package_class ):
    """Resolve a dotted ``package.module.Name`` path to the object it names.

    Everything before the last dot is imported as a module and the last
    component is looked up on that module.

    Args:
        package_class: dotted path such as ``'pkg.mod.ClassName'``.

    Returns:
        The attribute named by the last component of ``package_class``.

    Raises:
        ValueError: if ``package_class`` contains no module part.
        ImportError: if the module cannot be imported.
        AttributeError: if the module has no such attribute.
    """
    # local import keeps this function self-contained
    import importlib

    module_name, _, attribute = package_class.rpartition('.')
    if not module_name:
        # the bare __import__('') call used to fail with "Empty module name"
        raise ValueError('expected a dotted path "module.Class", got {!r}'.format(package_class))
    # import_module returns the leaf module directly, so no getattr walk from
    # the top-level package is needed
    return getattr(importlib.import_module(module_name), attribute)
|
||||||
|
|
||||||
def get_dir_data_uuid(uuid, type):
|
def check_default_json_file(json_file):
|
||||||
return os.path.join('../../data', uuid, str(type))
|
|
||||||
|
|
||||||
def get_save_dir(dir_data_uuid, year, month, day, extended_type=None):
|
|
||||||
dir_path = os.path.join(dir_data_uuid, year, month, day)
|
|
||||||
if extended_type:
|
|
||||||
dir_path = os.path.join(dir_path, extended_type)
|
|
||||||
if not os.path.isdir(dir_path):
|
|
||||||
os.makedirs(dir_path)
|
|
||||||
return dir_path
|
|
||||||
|
|
||||||
def check_json_file(json_file):
|
|
||||||
# the json object must contain a type field
|
# the json object must contain a type field
|
||||||
if "type" in json_file:
|
if "type" in json_file:
|
||||||
return True
|
return True
|
||||||
|
@ -72,6 +68,9 @@ def clean_stream(stream_name, type, session_uuid):
|
||||||
|
|
||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
|
|
||||||
|
|
||||||
|
###################################################3
|
||||||
|
|
||||||
if len(sys.argv) != 2:
|
if len(sys.argv) != 2:
|
||||||
print('usage:', 'Worker.py', 'session_uuid')
|
print('usage:', 'Worker.py', 'session_uuid')
|
||||||
exit(1)
|
exit(1)
|
||||||
|
@ -129,7 +128,8 @@ if __name__ == "__main__":
|
||||||
# complete json received
|
# complete json received
|
||||||
if full_json:
|
if full_json:
|
||||||
print(full_json)
|
print(full_json)
|
||||||
if check_json_file(full_json):
|
if check_default_json_file(full_json):
|
||||||
|
# end type 2 processing
|
||||||
break
|
break
|
||||||
# Incorrect Json
|
# Incorrect Json
|
||||||
else:
|
else:
|
||||||
|
@ -151,24 +151,21 @@ if __name__ == "__main__":
|
||||||
clean_db(session_uuid)
|
clean_db(session_uuid)
|
||||||
sys.exit(1)
|
sys.exit(1)
|
||||||
|
|
||||||
file_separator = b'\n' ## TODO: map all file separator or extract from json
|
|
||||||
extended_type_name = '{}.txt'.format(extended_type) # # TODO: create default or extract from JSON
|
#### Handle Specific MetaTypes ####
|
||||||
|
# Use Specific Handler defined
|
||||||
|
if os.path.isdir(os.path.join('meta_types_modules', extended_type)):
|
||||||
|
class_type_handler = get_class('meta_types_modules.{}.{}.TypeHandler'.format(extended_type, extended_type))
|
||||||
|
type_handler = class_type_handler(uuid, full_json)
|
||||||
|
# Use Standard Handler
|
||||||
|
else:
|
||||||
|
type_handler = MetaTypesDefault.MetaTypesDefault(uuid, full_json)
|
||||||
|
|
||||||
|
#file_separator = type_handler.get_file_separator(self)
|
||||||
|
#extended_type_name = type_handler.get_file_name()
|
||||||
|
|
||||||
# save json on disk
|
# save json on disk
|
||||||
if save_to_file:
|
type_handler.save_json_file(full_json)
|
||||||
rotate_file = False
|
|
||||||
time_file = time.time()
|
|
||||||
date_file = datetime.datetime.now().strftime("%Y%m%d%H%M%S")
|
|
||||||
# get new save_path #use first or last received date ???
|
|
||||||
dir_data_uuid = get_dir_data_uuid(uuid, type_defined)
|
|
||||||
dir_full_path = get_save_dir(dir_data_uuid, date_file[0:4], date_file[4:6], date_file[6:8], extended_type=extended_type)
|
|
||||||
filename = '{}-{}-{}-{}-{}.{}'.format(uuid, date_file[0:4], date_file[4:6], date_file[6:8], date_file[8:14], json_file_name)
|
|
||||||
save_path = os.path.join(dir_full_path, filename)
|
|
||||||
with open(save_path, 'w') as f:
|
|
||||||
f.write(json.dumps(full_json))
|
|
||||||
# get extended_type save_path
|
|
||||||
filename = '{}-{}-{}-{}-{}.{}'.format(uuid, date_file[0:4], date_file[4:6], date_file[6:8], date_file[8:14], extended_type_name)
|
|
||||||
save_path = os.path.join(dir_full_path, filename)
|
|
||||||
|
|
||||||
# change stream_name/type
|
# change stream_name/type
|
||||||
stream_name = stream_defined
|
stream_name = stream_defined
|
||||||
|
@ -176,6 +173,8 @@ if __name__ == "__main__":
|
||||||
id = 0
|
id = 0
|
||||||
buffer = b''
|
buffer = b''
|
||||||
|
|
||||||
|
type_handler.test()
|
||||||
|
|
||||||
# handle 254 type
|
# handle 254 type
|
||||||
while True:
|
while True:
|
||||||
res = redis_server_stream.xread({stream_name: id}, count=1)
|
res = redis_server_stream.xread({stream_name: id}, count=1)
|
||||||
|
@ -186,37 +185,9 @@ if __name__ == "__main__":
|
||||||
data = res[0][1][0][1]
|
data = res[0][1][0][1]
|
||||||
|
|
||||||
if id and data:
|
if id and data:
|
||||||
# save data on disk
|
# process 254 data type
|
||||||
if save_to_file:
|
type_handler.process_data(data[b'message'])
|
||||||
new_date = datetime.datetime.now().strftime("%Y%m%d%H%M%S")
|
# remove data from redis stream
|
||||||
# check if a new rotation is needed
|
|
||||||
if ( new_date[0:8] != date_file[0:8] ) or ( time.time() - time_file > rotation_save_cycle ):
|
|
||||||
date_file = new_date
|
|
||||||
rotate_file = True
|
|
||||||
|
|
||||||
# file rotation
|
|
||||||
if rotate_file and file_separator in data[b'message']:
|
|
||||||
end_file, start_new_file = data[b'message'].rsplit(file_separator, maxsplit=1)
|
|
||||||
# save end of file
|
|
||||||
with open(save_path, 'ab') as f:
|
|
||||||
f.write(end_file)
|
|
||||||
|
|
||||||
# get new save_path
|
|
||||||
dir_full_path = get_save_dir(dir_data_uuid, date_file[0:4], date_file[4:6], date_file[6:8], extended_type=extended_type)
|
|
||||||
filename = '{}-{}-{}-{}-{}.{}'.format(uuid, date_file[0:4], date_file[4:6], date_file[6:8], date_file[8:14], extended_type_name)
|
|
||||||
save_path = os.path.join(dir_full_path, filename)
|
|
||||||
|
|
||||||
# save start of new file
|
|
||||||
if start_new_file != b'':
|
|
||||||
with open(save_path, 'ab') as f:
|
|
||||||
f.write(start_new_file)
|
|
||||||
# end of rotation
|
|
||||||
rotate_file = False
|
|
||||||
time_file = time.time()
|
|
||||||
else:
|
|
||||||
with open(save_path, 'ab') as f:
|
|
||||||
f.write(data[b'message'])
|
|
||||||
|
|
||||||
redis_server_stream.xdel(stream_name, id)
|
redis_server_stream.xdel(stream_name, id)
|
||||||
|
|
||||||
else:
|
else:
|
||||||
|
|
Loading…
Reference in New Issue