2017-07-21 18:47:10 +02:00
|
|
|
#!/usr/bin/env python3
|
2024-01-17 13:13:14 +01:00
|
|
|
|
|
|
|
from __future__ import annotations
|
2017-07-21 18:47:10 +02:00
|
|
|
|
2017-11-08 03:10:04 +01:00
|
|
|
import logging
|
2024-01-31 12:15:08 +01:00
|
|
|
|
2021-01-19 15:44:58 +01:00
|
|
|
from base64 import b64encode
|
2024-01-31 12:15:08 +01:00
|
|
|
from datetime import datetime
|
|
|
|
from hashlib import md5, sha1, sha256, sha512
|
|
|
|
from io import BytesIO
|
|
|
|
from pathlib import Path
|
|
|
|
from typing import Any
|
2017-07-21 18:47:10 +02:00
|
|
|
|
2020-02-07 11:51:44 +01:00
|
|
|
from . import FileObject
|
2024-01-31 12:15:08 +01:00
|
|
|
from .abstractgenerator import AbstractMISPObjectGenerator
|
|
|
|
from ..exceptions import InvalidMISPObject
|
2017-07-21 18:47:10 +02:00
|
|
|
|
2023-04-19 10:47:41 +02:00
|
|
|
import lief
|
2024-02-01 17:24:24 +01:00
|
|
|
import lief.PE
|
2017-07-21 18:47:10 +02:00
|
|
|
|
|
|
|
# pydeep is an optional dependency: record whether it could be imported so
# the rest of the module can skip ssdeep hashing when it is unavailable.
try:
    import pydeep  # type: ignore
except ImportError:
    HAS_PYDEEP = False
else:
    HAS_PYDEEP = True

# Module logger, registered under the 'pymisp' name.
logger = logging.getLogger('pymisp')
|
|
|
|
|
|
|
|
|
2024-01-31 12:15:08 +01:00
|
|
|
def make_pe_objects(lief_parsed: lief.PE.Binary,
                    misp_file: FileObject,
                    standalone: bool = True,
                    default_attributes_parameters: dict[str, Any] | None = None) -> tuple[FileObject, PEObject, list[PESectionObject]]:
    """Build the PE object (and its section objects) for an already parsed binary.

    A ``PEObject`` is created from ``lief_parsed`` and ``misp_file`` gets an
    'includes' reference pointing at it.

    :param lief_parsed: Binary already parsed by lief.
    :param misp_file: File object the PE object gets attached to.
    :param standalone: Forwarded unchanged to ``PEObject``.
    :param default_attributes_parameters: Forwarded to ``PEObject``. ``None``
        (the default) means an empty dict; a fresh one is created on every
        call so that no dict is shared between calls.
    :return: ``(misp_file, pe_object, pe_sections)`` where ``pe_sections`` is
        a new list holding the entries of ``pe_object.sections``.
    """
    if default_attributes_parameters is None:
        default_attributes_parameters = {}
    pe_object = PEObject(parsed=lief_parsed, standalone=standalone,
                         default_attributes_parameters=default_attributes_parameters)
    misp_file.add_reference(pe_object.uuid, 'includes', 'PE indicators')
    # Return a copy so callers can modify the list without touching pe_object.sections.
    pe_sections = list(pe_object.sections)
    return misp_file, pe_object, pe_sections
|
|
|
|
|
2017-07-21 18:47:10 +02:00
|
|
|
|
2017-08-28 19:01:53 +02:00
|
|
|
class PEObject(AbstractMISPObjectGenerator):
    """MISP 'pe' object generated from a PE binary parsed with lief.

    After construction, ``sections`` holds the ``PESectionObject`` instances,
    ``certificates`` the ``PECertificate`` instances and ``signers`` the
    ``PESigners`` instances created while generating the attributes.
    """

    __pe: lief.PE.Binary

    def __init__(self, parsed: lief.PE.Binary | None = None,  # type: ignore[no-untyped-def]
                 filepath: Path | str | None = None,
                 pseudofile: BytesIO | bytes | list[int] | None = None,
                 **kwargs) -> None:
        """Creates an PE object, with lief

        The inputs are tried in this order and the first truthy one is used:
        ``pseudofile``, ``filepath``, ``parsed``.

        :param parsed: An already parsed ``lief.PE.Binary``.
        :param filepath: Path of the file to parse with lief.
        :param pseudofile: In-memory content: a ``BytesIO``, ``bytes`` or a list of integers.
        :param kwargs: Forwarded to the parent class constructor.
        :raises InvalidMISPObject: If no input is given, if the input has an
            unsupported type, or if lief is unable to parse it.
        """
        super().__init__('pe', **kwargs)
        if not HAS_PYDEEP:
            logger.warning("pydeep is missing, please install pymisp this way: pip install pymisp[fileobjects]")
        if pseudofile:
            if isinstance(pseudofile, BytesIO):
                p = lief.PE.parse(obj=pseudofile)
            elif isinstance(pseudofile, bytes):
                p = lief.PE.parse(raw=list(pseudofile))
            elif isinstance(pseudofile, list):
                p = lief.PE.parse(raw=pseudofile)
            else:
                raise InvalidMISPObject(f'Pseudo file can be BytesIO, bytes or list got {type(pseudofile)}')
            if not p:
                raise InvalidMISPObject('Unable to parse pseudofile')
            self.__pe = p
        elif filepath:
            if p := lief.PE.parse(filepath):
                self.__pe = p
            else:
                raise InvalidMISPObject(f'Unable to parse {filepath}')
        elif parsed:
            # Got an already parsed blob
            if isinstance(parsed, lief.PE.Binary):
                self.__pe = parsed
            else:
                raise InvalidMISPObject(f'Not a lief.PE.Binary: {type(parsed)}')
        else:
            # Without this branch generate_attributes() would fail with an
            # AttributeError on the unset binary.
            raise InvalidMISPObject('A pseudofile, a filepath or a parsed lief.PE.Binary is required')
        self.generate_attributes()

    def _is_exe(self) -> bool:
        """Return True if the binary is neither a DLL nor a driver and has the EXECUTABLE_IMAGE characteristic."""
        if self._is_dll() or self._is_driver():
            return False
        return self.__pe.header.has_characteristic(lief.PE.Header.CHARACTERISTICS.EXECUTABLE_IMAGE)

    def _is_dll(self) -> bool:
        """Return True if the PE header has the DLL characteristic."""
        return self.__pe.header.has_characteristic(lief.PE.Header.CHARACTERISTICS.DLL)

    def _is_driver(self) -> bool:
        """Return True if the binary imports one of the libraries listed below (case-insensitive)."""
        # List from pefile
        system_dlls = {'ntoskrnl.exe', 'hal.dll', 'ndis.sys', 'bootvid.dll', 'kdcom.dll'}
        return any(imp.lower() in system_dlls for imp in self.__pe.libraries)

    def _get_pe_type(self) -> str:
        """Return 'dll', 'driver', 'exe' or 'unknown'; the checks run in that order."""
        if self._is_dll():
            return 'dll'
        if self._is_driver():
            return 'driver'
        if self._is_exe():
            return 'exe'
        return 'unknown'

    def generate_attributes(self) -> None:
        """Fill in the attributes of the object from the parsed binary.

        Also creates one ``PESectionObject`` per kept section, and one
        ``PECertificate`` / ``PESigners`` per certificate / signer of every
        signature; each of them is referenced from this object.
        """
        # Function-scope import: only the timestamp conversion below needs it.
        from datetime import timezone

        pe = self.__pe
        self.add_attribute('type', value=self._get_pe_type())

        # General information
        self.add_attribute('entrypoint-address', value=pe.entrypoint)
        # datetime.utcfromtimestamp() is deprecated since Python 3.12. Dropping
        # tzinfo keeps the naive UTC ISO string (no '+00:00' suffix) it produced.
        compiled_at = datetime.fromtimestamp(pe.header.time_date_stamps, tz=timezone.utc).replace(tzinfo=None)
        self.add_attribute('compilation-timestamp', value=compiled_at.isoformat())
        self.add_attribute('imphash', value=lief.PE.get_imphash(pe, lief.PE.IMPHASH_MODE.PEFILE))
        self.add_attribute('authentihash', value=pe.authentihash_sha256.hex())

        # Version information, taken from the first language/codepage entry
        r_manager = pe.resources_manager
        if isinstance(r_manager, lief.PE.ResourcesManager):
            version = r_manager.version
            if isinstance(version, lief.PE.ResourceVersion) and version.string_file_info is not None:
                langcode_items = version.string_file_info.langcode_items
                # Skip the block instead of failing on [0] when there is no entry
                # (assumes an empty collection is falsy -- TODO confirm for the lief type).
                if langcode_items:
                    first_item = langcode_items[0]
                    fileinfo = dict(first_item.items.items())
                    for relation, key in (('original-filename', 'OriginalFilename'),
                                          ('internal-filename', 'InternalName'),
                                          ('file-description', 'FileDescription'),
                                          ('file-version', 'FileVersion'),
                                          ('product-name', 'ProductName'),
                                          ('product-version', 'ProductVersion'),
                                          ('company-name', 'CompanyName'),
                                          ('legal-copyright', 'LegalCopyright')):
                        self.add_attribute(relation, value=fileinfo.get(key))
                    self.add_attribute('lang-id', value=first_item.key)

        # Sections
        self.sections = []
        if pe.sections:
            entrypoint = pe.entrypoint
            for section in pe.sections:
                if not section.name and not section.size:
                    # Skip section if name is none AND size is 0.
                    continue
                # Position among the kept sections: skipped ones are not counted.
                pos = len(self.sections)
                s = PESectionObject(section, standalone=self._standalone, default_attributes_parameters=self._default_attributes_parameters)
                self.add_reference(s.uuid, 'includes', f'Section {pos} of PE')
                if section.virtual_address <= entrypoint < (section.virtual_address + section.virtual_size):
                    # The entry point is located in this section.
                    if isinstance(section.name, bytes):
                        section_name = section.name.decode()
                    else:
                        section_name = section.name
                    self.add_attribute('entrypoint-section-at-position', value=f'{section_name}|{pos}')
                self.sections.append(s)
        self.add_attribute('number-sections', value=len(self.sections))

        # Signatures
        self.certificates = []
        self.signers = []
        for sign in pe.signatures:
            for c in sign.certificates:
                cert_obj = PECertificate(c)
                self.add_reference(cert_obj.uuid, 'signed-by')
                self.certificates.append(cert_obj)
            for s_info in sign.signers:
                signer_obj = PESigners(s_info)
                self.add_reference(signer_obj.uuid, 'signed-by')
                self.signers.append(signer_obj)
|
|
|
|
|
|
|
|
|
|
|
|
class PECertificate(AbstractMISPObjectGenerator):
    """MISP 'x509' object generated from a certificate of a PE signature."""

    def __init__(self, certificate: lief.PE.x509, **kwargs) -> None:  # type: ignore[no-untyped-def]
        """Creates an x509 object from a certificate parsed by lief.

        :param certificate: The certificate to describe.
        :param kwargs: Forwarded to the parent class constructor, the same way
            ``PEObject`` does, instead of being silently dropped.
        """
        super().__init__('x509', **kwargs)
        self.__certificate = certificate
        self.generate_attributes()

    def generate_attributes(self) -> None:
        """Fill in the attributes of the object from the certificate.

        The validity dates are only added when ``valid_from`` / ``valid_to``
        hold exactly six values, which are used as year, month, day, hour,
        minute and second.
        """
        cert = self.__certificate
        self.add_attribute('issuer', value=cert.issuer)
        self.add_attribute('serial-number', value=cert.serial_number)
        valid_from = cert.valid_from
        if len(valid_from) == 6:
            # Positional order of datetime(): year, month, day, hour, minute, second
            self.add_attribute('validity-not-before', value=datetime(*valid_from))
        valid_to = cert.valid_to
        if len(valid_to) == 6:
            self.add_attribute('validity-not-after', value=datetime(*valid_to))
        self.add_attribute('version', value=cert.version)
        self.add_attribute('subject', value=cert.subject)
        self.add_attribute('signature_algorithm', value=cert.signature_algorithm)
        self.add_attribute('raw-base64', value=b64encode(cert.raw))
|
|
|
|
|
|
|
|
|
|
|
|
class PESigners(AbstractMISPObjectGenerator):
    """MISP 'authenticode-signerinfo' object generated from a signer of a PE signature."""

    def __init__(self, signer: lief.PE.SignerInfo, **kwargs) -> None:  # type: ignore[no-untyped-def]
        """Creates an authenticode-signerinfo object from a signer parsed by lief.

        :param signer: The signer information to describe.
        :param kwargs: Forwarded to the parent class constructor, the same way
            ``PEObject`` does, instead of being silently dropped.
        """
        super().__init__('authenticode-signerinfo', **kwargs)
        self.__signer = signer
        self.generate_attributes()

    def generate_attributes(self) -> None:
        """Fill in the attributes of the object from the signer information.

        'program-name' and 'url' are only added when the signer has a
        SPC_SP_OPUS_INFO attribute.
        """
        signer = self.__signer
        self.add_attribute('issuer', value=signer.issuer)
        self.add_attribute('serial-number', value=signer.serial_number)
        self.add_attribute('version', value=signer.version)
        self.add_attribute('digest_algorithm', value=str(signer.digest_algorithm))
        self.add_attribute('encryption_algorithm', value=str(signer.encryption_algorithm))
        self.add_attribute('digest-base64', value=b64encode(signer.encrypted_digest))
        info: lief.PE.SpcSpOpusInfo = signer.get_attribute(lief.PE.Attribute.TYPE.SPC_SP_OPUS_INFO)  # type: ignore[assignment]
        if info:
            self.add_attribute('program-name', value=info.program_name)
            self.add_attribute('url', value=info.more_info)
|
2017-07-21 18:47:10 +02:00
|
|
|
|
|
|
|
|
2017-08-28 19:01:53 +02:00
|
|
|
class PESectionObject(AbstractMISPObjectGenerator):
    """MISP 'pe-section' object generated from one section of a PE binary."""

    def __init__(self, section: lief.PE.Section, **kwargs) -> None:  # type: ignore[no-untyped-def]
        """Creates an PE Section object. Object generated by PEObject.

        :param section: The section to describe; its content is copied into a
            ``bytes`` object used for hashing.
        :param kwargs: Forwarded to the parent class constructor. ``PEObject``
            passes ``standalone`` and ``default_attributes_parameters`` here;
            they were previously discarded.
        """
        super().__init__('pe-section', **kwargs)
        self.__section = section
        self.__data = bytes(self.__section.content)
        self.generate_attributes()

    def generate_attributes(self) -> None:
        """Fill in the attributes of the object from the section.

        Entropy and hashes are only added for sections with a size above 0.
        The ssdeep hash additionally requires pydeep and an entropy above 0.
        """
        section = self.__section
        self.add_attribute('name', value=section.name)
        self.add_attribute('size-in-bytes', value=section.size)
        if int(section.size) <= 0:
            return

        # zero-filled sections can create too many correlations
        has_entropy = float(section.entropy) > 0
        to_ids = has_entropy
        disable_correlation = not has_entropy
        self.add_attribute('entropy', value=section.entropy)
        for relation, hasher in (('md5', md5), ('sha1', sha1), ('sha256', sha256), ('sha512', sha512)):
            self.add_attribute(relation, value=hasher(self.__data).hexdigest(),
                               disable_correlation=disable_correlation, to_ids=to_ids)
        if HAS_PYDEEP and has_entropy:
            if section.name == '.rsrc':
                # ssdeep of .rsrc creates too many correlations
                disable_correlation = True
                to_ids = False
            self.add_attribute('ssdeep', value=pydeep.hash_buf(self.__data).decode(),
                               disable_correlation=disable_correlation, to_ids=to_ids)
|