chg: Updated csvimport to support files from csv export + import MISP objects

2018-07-27 23:13:47 +02:00 · 2018-07-27 23:13:47 +02:00 · 63ba7580d3
parent a8170ded17
commit 63ba7580d3
1 changed files with 88 additions and 17 deletions
--- a/misp_modules/modules/import_mod/csvimport.py
+++ b/misp_modules/modules/import_mod/csvimport.py
@ -1,6 +1,7 @@
 # -*- coding: utf-8 -*-
 import json, os, base64
-import pymisp
+from pymisp import __path__ as pymisp_path
 from collections import defaultdict
 misperrors = {'error': 'Error'}
 moduleinfo = {'version': '0.1', 'author': 'Christian Studer',
@ -13,20 +14,49 @@ userConfig = {'header': {
                'message': 'Define the header of the csv file, with types (included in MISP attribute types or attribute fields) separated by commas.\nFor fields that do not match these types, please use space or simply nothing between commas.\nFor instance: ip-src,domain, ,timestamp'},
              'has_header':{
                'type': 'Boolean',
-                'message': 'Tick this box ONLY if there is a header line, NOT COMMENTED, in the file (which will be skipped atm).'
+                'message': 'Tick this box ONLY if there is a header line, NOT COMMENTED, in the file.'
              }}
 duplicatedFields = {'mispType': {'mispComment': 'comment'},
                    'attrField': {'attrComment': 'comment'}}
 attributesFields = ['type', 'value', 'category', 'to_ids', 'comment', 'distribution']
 misp_standard_csv_header = ['uuid','event_id','category','type','value','comment','to_ids','date',
                            'object_relation','object_uuid','object_name','object_meta_category']
 delimiters = [',', ';', '|', '/', '\t', '    ']
 class CsvParser():
-    def __init__(self, header, has_header):
+    def __init__(self, header, has_header, data):
-        self.header = header
+        if data[0].split(',') == misp_standard_csv_header:
-        self.fields_number = len(header)
+            self.header = misp_standard_csv_header
-        self.has_header = has_header
+            self.from_misp = True
-        self.attributes = []
+            self.data = data[1:]
        else:
            self.from_misp = False
            self.has_header = has_header
            if header:
                self.header = header
                self.fields_number = len(header)
                self.parse_data(data)
            else:
                self.has_delimiter = True
                self.fields_number, self.delimiter, self.header = self.get_delimiter_from_header(data[0])
                self.data = data
            self.result = []
    def get_delimiter_from_header(self, data):
        delimiters_count = {}
        for d in delimiters:
            length = data.count(d)
            if length > 0:
                delimiters_count[d] = data.count(d)
        if len(delimiters_count) == 0:
            length = 0
            delimiter = None
            header = [data]
        else:
            length, delimiter = max((n, v) for v, n in delimiters_count.items())
            header = data.split(delimiter)
        return length + 1, delimiter, header
    def parse_data(self, data):
        return_data = []
@ -45,6 +75,7 @@ class CsvParser():
                    return_data.append(l)
            # find which delimiter is used
            self.delimiter = self.find_delimiter()
            if self.fields_number == 0: self.header = return_data[0].split(self.delimiter)
        self.data = return_data[1:] if self.has_header else return_data
    def parse_delimiter(self, line):
@ -56,6 +87,43 @@ class CsvParser():
        _, delimiter = max((n, v) for v, n in self.delimiter_count.items())
        return delimiter
    def parse_csv(self):
        if self.from_misp:
            self.build_misp_event()
        else:
            self.buildAttributes()
    def build_misp_event(self):
        l_attributes = []
        l_objects = []
        objects = defaultdict(list)
        attribute_fields = self.header[:1] + self.header[2:8]
        relation_type = self.header[8]
        object_fields = self.header[9:]
        for line in self.data:
            attribute = {}
            try:
                a_uuid,_,category,a_type,value,comment,to_ids,date,relation,o_uuid,o_name,o_meta_category = line.split(',')
            except ValueError:
                continue
            for t, v in zip(attribute_fields, [a_uuid,category,a_type,value,comment,to_ids,date]):
                attribute[t] = v.replace('"', '')
            attribute['to_ids'] = True if to_ids == '1' else False
            relation = relation.replace('"', '')
            if relation:
                attribute[relation_type] = relation
                object_index = tuple(o.replace('"', '') for o in (o_uuid,o_name,o_meta_category))
                objects[object_index].append(attribute)
            else:
                l_attributes.append(attribute)
        for keys, attributes in objects.items():
            misp_object = {}
            for t, v in zip(['uuid','name','meta-category'], keys):
                misp_object[t] = v
            misp_object['Attribute'] = attributes
            l_objects.append(misp_object)
        self.result = {"Attribute": l_attributes, "Object": l_objects}
    def buildAttributes(self):
        # if there is only 1 field of data
        if self.delimiter is None:
@ -63,7 +131,7 @@ class CsvParser():
            for data in self.data:
                d = data.strip()
                if d:
-                    self.attributes.append({'types': mispType, 'values': d})
+                    self.result.append({'types': mispType, 'values': d})
        else:
            # split fields that should be recognized as misp attribute types from the others
            list2pop, misp, head = self.findMispTypes()
@ -83,10 +151,10 @@ class CsvParser():
                    for h, ds in zip(head, datasplit):
                        if h:
                            attribute[h] = ds.strip()
-                    self.attributes.append(attribute)
+                    self.result.append(attribute)
    def findMispTypes(self):
-        descFilename = os.path.join(pymisp.__path__[0], 'data/describeTypes.json')
+        descFilename = os.path.join(pymisp_path[0], 'data/describeTypes.json')
        with open(descFilename, 'r') as f:
            MispTypes = json.loads(f.read())['result'].get('types')
        list2pop = []
@ -124,18 +192,21 @@ def handler(q=False):
    else:
        misperrors['error'] = "Unsupported attributes type"
        return misperrors
    if not request.get('config') and not request['config'].get('header'):
        misperrors['error'] = "Configuration error"
        return misperrors
    header = request['config'].get('header').split(',')
    header = [c.strip() for c in header]
    has_header = request['config'].get('has_header')
    has_header = True if has_header == '1' else False
    if not request.get('config') and not request['config'].get('header'):
        if has_header:
            header = []
        else:
            misperrors['error'] = "Configuration error"
            return misperrors
    else:
        header = request['config'].get('header').split(',')
        header = [c.strip() for c in header]
    csv_parser = CsvParser(header, has_header)
    csv_parser.parse_data(data.split('\n'))
    # build the attributes
    csv_parser.buildAttributes()
-    r = {'results': csv_parser.attributes}
+    r = {'results': csv_parser.result}
    return r
 def introspection():