2017-02-10 22:35:02 +01:00
|
|
|
"""Utility functions and classes for the stix2 library."""
|
|
|
|
|
|
|
|
import datetime as dt
|
2017-05-05 16:53:28 +02:00
|
|
|
import json
|
|
|
|
|
2017-05-09 21:10:53 +02:00
|
|
|
from dateutil import parser
|
2017-05-10 00:03:46 +02:00
|
|
|
import pytz
|
2017-04-25 00:29:56 +02:00
|
|
|
|
2017-05-19 19:51:59 +02:00
|
|
|
# Sentinel value for properties that should be set to the current time.
|
2017-02-10 22:35:02 +01:00
|
|
|
# We can't use the standard 'default' approach, since if there are multiple
|
|
|
|
# timestamps in a single object, the timestamps will vary by a few microseconds.
|
|
|
|
NOW = object()
|
|
|
|
|
|
|
|
|
2017-06-23 00:47:35 +02:00
|
|
|
class STIXdatetime(dt.datetime):
|
|
|
|
def __new__(cls, *args, **kwargs):
|
|
|
|
precision = kwargs.pop('precision', None)
|
|
|
|
if isinstance(args[0], dt.datetime): # Allow passing in a datetime object
|
|
|
|
dttm = args[0]
|
2017-06-28 21:55:23 +02:00
|
|
|
args = (dttm.year, dttm.month, dttm.day, dttm.hour, dttm.minute,
|
|
|
|
dttm.second, dttm.microsecond, dttm.tzinfo)
|
|
|
|
# self will be an instance of STIXdatetime, not dt.datetime
|
2017-06-23 00:47:35 +02:00
|
|
|
self = dt.datetime.__new__(cls, *args, **kwargs)
|
|
|
|
self.precision = precision
|
|
|
|
return self
|
|
|
|
|
2017-08-11 21:04:58 +02:00
|
|
|
def __repr__(self):
|
|
|
|
return "'%s'" % format_datetime(self)
|
|
|
|
|
2017-06-23 00:47:35 +02:00
|
|
|
|
2017-02-10 22:35:02 +01:00
|
|
|
def get_timestamp():
|
2017-06-23 00:47:35 +02:00
|
|
|
return STIXdatetime.now(tz=pytz.UTC)
|
2017-02-10 22:35:02 +01:00
|
|
|
|
|
|
|
|
|
|
|
def format_datetime(dttm):
|
2017-04-17 16:48:13 +02:00
|
|
|
# 1. Convert to timezone-aware
|
|
|
|
# 2. Convert to UTC
|
|
|
|
# 3. Format in ISO format
|
2017-06-23 00:47:35 +02:00
|
|
|
# 4. Ensure correct precision
|
|
|
|
# 4a. Add subsecond value if non-zero and precision not defined
|
2017-04-17 16:48:13 +02:00
|
|
|
# 5. Add "Z"
|
|
|
|
|
2017-05-22 17:11:42 +02:00
|
|
|
if dttm.tzinfo is None or dttm.tzinfo.utcoffset(dttm) is None:
|
2017-04-17 19:16:14 +02:00
|
|
|
# dttm is timezone-naive; assume UTC
|
2017-05-22 17:11:42 +02:00
|
|
|
zoned = pytz.utc.localize(dttm)
|
|
|
|
else:
|
|
|
|
zoned = dttm.astimezone(pytz.utc)
|
2017-04-17 16:48:13 +02:00
|
|
|
ts = zoned.strftime("%Y-%m-%dT%H:%M:%S")
|
2017-06-23 00:47:35 +02:00
|
|
|
ms = zoned.strftime("%f")
|
|
|
|
precision = getattr(dttm, "precision", None)
|
2017-06-28 21:55:23 +02:00
|
|
|
if precision == 'second':
|
|
|
|
pass # Alredy precise to the second
|
|
|
|
elif precision == "millisecond":
|
|
|
|
ts = ts + '.' + ms[:3]
|
2017-06-23 00:47:35 +02:00
|
|
|
elif zoned.microsecond > 0:
|
2017-04-17 16:48:13 +02:00
|
|
|
ts = ts + '.' + ms.rstrip("0")
|
|
|
|
return ts + "Z"
|
2017-04-19 20:32:56 +02:00
|
|
|
|
|
|
|
|
2017-06-23 00:47:35 +02:00
|
|
|
def parse_into_datetime(value, precision=None):
|
2017-05-04 22:34:08 +02:00
|
|
|
if isinstance(value, dt.date):
|
|
|
|
if hasattr(value, 'hour'):
|
2017-06-23 00:47:35 +02:00
|
|
|
ts = value
|
2017-05-04 22:34:08 +02:00
|
|
|
else:
|
|
|
|
# Add a time component
|
2017-06-23 00:47:35 +02:00
|
|
|
ts = dt.datetime.combine(value, dt.time(0, 0, tzinfo=pytz.utc))
|
2017-05-04 22:34:08 +02:00
|
|
|
else:
|
2017-06-23 00:47:35 +02:00
|
|
|
# value isn't a date or datetime object so assume it's a string
|
|
|
|
try:
|
|
|
|
parsed = parser.parse(value)
|
|
|
|
except (TypeError, ValueError):
|
|
|
|
# Unknown format
|
|
|
|
raise ValueError("must be a datetime object, date object, or "
|
|
|
|
"timestamp string in a recognizable format.")
|
|
|
|
if parsed.tzinfo:
|
|
|
|
ts = parsed.astimezone(pytz.utc)
|
|
|
|
else:
|
|
|
|
# Doesn't have timezone info in the string; assume UTC
|
|
|
|
ts = pytz.utc.localize(parsed)
|
|
|
|
|
|
|
|
# Ensure correct precision
|
|
|
|
if not precision:
|
2017-08-11 21:04:58 +02:00
|
|
|
return STIXdatetime(ts, precision=precision)
|
2017-06-23 00:47:35 +02:00
|
|
|
ms = ts.microsecond
|
2017-06-28 21:55:23 +02:00
|
|
|
if precision == 'second':
|
|
|
|
ts = ts.replace(microsecond=0)
|
|
|
|
elif precision == 'millisecond':
|
2017-06-23 00:47:35 +02:00
|
|
|
ms_len = len(str(ms))
|
|
|
|
if ms_len > 3:
|
|
|
|
# Truncate to millisecond precision
|
2017-06-28 21:55:23 +02:00
|
|
|
factor = 10 ** (ms_len - 3)
|
|
|
|
ts = ts.replace(microsecond=(ts.microsecond // factor) * factor)
|
|
|
|
else:
|
|
|
|
ts = ts.replace(microsecond=0)
|
2017-06-23 00:47:35 +02:00
|
|
|
return STIXdatetime(ts, precision=precision)
|
2017-05-04 22:34:08 +02:00
|
|
|
|
|
|
|
|
2017-04-19 20:32:56 +02:00
|
|
|
def get_dict(data):
|
|
|
|
"""Return data as a dictionary.
|
|
|
|
Input can be a dictionary, string, or file-like object.
|
|
|
|
"""
|
|
|
|
|
|
|
|
if type(data) is dict:
|
2017-05-16 15:25:08 +02:00
|
|
|
return data
|
2017-04-19 20:32:56 +02:00
|
|
|
else:
|
|
|
|
try:
|
2017-05-16 15:25:08 +02:00
|
|
|
return json.loads(data)
|
2017-04-19 20:32:56 +02:00
|
|
|
except TypeError:
|
2017-05-16 15:25:08 +02:00
|
|
|
pass
|
|
|
|
try:
|
|
|
|
return json.load(data)
|
|
|
|
except AttributeError:
|
|
|
|
pass
|
|
|
|
try:
|
|
|
|
return dict(data)
|
|
|
|
except (ValueError, TypeError):
|
|
|
|
raise ValueError("Cannot convert '%s' to dictionary." % str(data))
|