2018-03-18 23:21:29 +01:00
|
|
|
#!/usr/bin/env python
|
|
|
|
# -*- coding: utf-8 -*-
|
|
|
|
|
|
|
|
from ..exceptions import InvalidMISPObject
|
|
|
|
from .abstractgenerator import AbstractMISPObjectGenerator
|
|
|
|
from io import BytesIO
|
|
|
|
import logging
|
2018-05-03 20:51:04 +02:00
|
|
|
from email import message_from_bytes, policy
|
2020-01-23 10:27:40 +01:00
|
|
|
from pathlib import Path
|
|
|
|
from typing import Union
|
2018-03-18 23:21:29 +01:00
|
|
|
|
|
|
|
# Module-level logger, obtained under the 'pymisp' logger name.
logger = logging.getLogger('pymisp')
|
|
|
|
|
|
|
|
|
|
|
|
class EMailObject(AbstractMISPObjectGenerator):
    """Build an ``email`` object from a raw e-mail message.

    The message is read either from a file path or from an in-memory
    ``BytesIO`` buffer, parsed with the standard library ``email`` package
    (``policy.default``), and its body and a selection of headers are added
    as attributes through ``add_attribute`` / ``add_attributes``.
    """

    def __init__(self, filepath: Union[Path, str, None] = None,
                 pseudofile: Union[BytesIO, None] = None,
                 attach_original_email: bool = True,
                 standalone: bool = True, **kwargs):
        """Parse the message and generate the attributes.

        :param filepath: Path of the e-mail file to read. Takes precedence
            over ``pseudofile`` when both are given.
        :param pseudofile: ``BytesIO`` buffer holding the raw message; only
            used when ``filepath`` is empty.
        :param attach_original_email: When true, the raw message is added as
            an ``eml`` attribute named ``Full email.eml``.
        :param standalone: Forwarded to the parent constructor.
        :param kwargs: Forwarded to the parent constructor.
        :raises InvalidMISPObject: If neither a path nor a ``BytesIO`` buffer
            is supplied.
        """
        super().__init__('email', standalone=standalone, **kwargs)
        if filepath:
            with open(filepath, 'rb') as f:
                self.__pseudofile = BytesIO(f.read())
        elif isinstance(pseudofile, BytesIO):
            self.__pseudofile = pseudofile
        else:
            raise InvalidMISPObject('File buffer (BytesIO) or a path is required.')
        self.__email = message_from_bytes(self.__pseudofile.getvalue(), policy=policy.default)
        if attach_original_email:
            self.add_attribute('eml', value='Full email.eml', data=self.__pseudofile)
        self.generate_attributes()

    @property
    def email(self):
        """The parsed message object returned by ``message_from_bytes``."""
        return self.__email

    @property
    def attachments(self):
        """List of ``(filename, BytesIO)`` tuples, one per attachment.

        Text attachments are encoded back to bytes; attachments whose
        content is itself a message object (e.g. ``message/rfc822``) are
        serialised with ``as_bytes()`` so that they fit in a ``BytesIO``.
        """
        to_return = []
        for attachment in self.__email.iter_attachments():
            content = attachment.get_content()
            if isinstance(content, str):
                content = content.encode()
            elif hasattr(content, 'as_bytes'):
                # get_content() hands back a message object for embedded
                # messages; BytesIO() only accepts bytes-like data.
                content = content.as_bytes()
            to_return.append((attachment.get_filename(), BytesIO(content)))
        return to_return

    @staticmethod
    def __decode_body(part):
        """Return the text of a body part, or None if it has no payload.

        The charset declared on the part is tried first (strictly); if it
        is unknown or does not match the bytes, fall back to UTF-8 with
        ``surrogateescape``, which never fails.
        """
        payload = part.get_payload(decode=True)
        if payload is None:
            return None
        charset = part.get_content_charset('utf8')
        try:
            return payload.decode(charset)
        except (LookupError, ValueError):
            return payload.decode('utf8', 'surrogateescape')

    @staticmethod
    def __split_addresses(header):
        """Split an address header value into one string per mailbox.

        With ``policy.default`` address headers expose the parsed
        ``addresses``; those are used when the header parsed without
        defects, so a comma inside a quoted display name does not split the
        entry. Otherwise the raw value is split on commas.
        """
        # TODO: split name and email address
        if not getattr(header, 'defects', ()):
            parsed = [str(address) for address in getattr(header, 'addresses', ())]
            # '<>' is how an entirely empty address is rendered.
            parsed = [entry for entry in parsed if entry and entry != '<>']
            if parsed:
                return parsed
        return [chunk.strip() for chunk in header.split(',') if chunk.strip()]

    def __add_header(self, header_name, relation):
        """Add the value of ``header_name`` as ``relation`` if present."""
        if header_name in self.__email:
            self.add_attribute(relation, value=self.__email[header_name])

    def __add_address_header(self, header_name, relation):
        """Add one ``relation`` attribute per address in ``header_name``."""
        if header_name in self.__email:
            to_add = self.__split_addresses(self.__email[header_name])
            if to_add:
                self.add_attributes(relation, *to_add)

    def generate_attributes(self):
        """Add the body and the supported headers as attributes.

        The HTML body is preferred over the plain-text one. Headers that
        are absent from the message are skipped.
        """
        # A message object's truthiness is its header count, so test
        # against None explicitly to keep bodies that carry no headers.
        body = self.__email.get_body(preferencelist=('html', 'plain'))
        if body is not None:
            body_text = self.__decode_body(body)
            if body_text is not None:
                self.add_attribute('email-body', value=body_text)

        self.__add_header('Reply-To', 'reply-to')
        self.__add_header('Message-ID', 'message-id')
        self.__add_address_header('To', 'to')
        self.__add_address_header('Cc', 'cc')
        self.__add_header('Subject', 'subject')
        self.__add_address_header('From', 'from')
        # TODO: split name and email address
        self.__add_header('Return-Path', 'return-path')
        self.__add_header('User-Agent', 'user-agent')

        boundary = self.__email.get_boundary()
        if boundary:
            self.add_attribute('mime-boundary', value=boundary)

        self.__add_header('X-Mailer', 'x-mailer')
        self.__add_header('Thread-Index', 'thread-index')
        # TODO: email-header: all headers in one bloc
        # TODO: BCC?
        # TODO: received headers sometimes have TO email addresses
|