436 lines
		
	
	
		
			14 KiB
		
	
	
	
		
			Python
		
	
	
			
		
		
	
	
			436 lines
		
	
	
		
			14 KiB
		
	
	
	
		
			Python
		
	
	
# Copyright 2014-2016 OpenMarket Ltd
 | 
						|
#
 | 
						|
# Licensed under the Apache License, Version 2.0 (the "License");
 | 
						|
# you may not use this file except in compliance with the License.
 | 
						|
# You may obtain a copy of the License at
 | 
						|
#
 | 
						|
#     http://www.apache.org/licenses/LICENSE-2.0
 | 
						|
#
 | 
						|
# Unless required by applicable law or agreed to in writing, software
 | 
						|
# distributed under the License is distributed on an "AS IS" BASIS,
 | 
						|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | 
						|
# See the License for the specific language governing permissions and
 | 
						|
# limitations under the License.
 | 
						|
 | 
						|
""" Thread-local-alike tracking of log contexts within synapse
 | 
						|
 | 
						|
This module provides objects and utilities for tracking contexts through
 | 
						|
synapse code, so that log lines can include a request identifier, and so that
 | 
						|
CPU and database activity can be accounted for against the request that caused
 | 
						|
them.
 | 
						|
 | 
						|
See doc/log_contexts.rst for details on how this works.
 | 
						|
"""
 | 
						|
 | 
						|
from twisted.internet import defer
 | 
						|
 | 
						|
import threading
 | 
						|
import logging
 | 
						|
 | 
						|
logger = logging.getLogger(__name__)
 | 
						|
 | 
						|
try:
 | 
						|
    import resource
 | 
						|
 | 
						|
    # Python doesn't ship with a definition of RUSAGE_THREAD but it's defined
 | 
						|
    # to be 1 on linux so we hard code it.
 | 
						|
    RUSAGE_THREAD = 1
 | 
						|
 | 
						|
    # If the system doesn't support RUSAGE_THREAD then this should throw an
 | 
						|
    # exception.
 | 
						|
    resource.getrusage(RUSAGE_THREAD)
 | 
						|
 | 
						|
    def get_thread_resource_usage():
 | 
						|
        return resource.getrusage(RUSAGE_THREAD)
 | 
						|
except:
 | 
						|
    # If the system doesn't support resource.getrusage(RUSAGE_THREAD) then we
 | 
						|
    # won't track resource usage by returning None.
 | 
						|
    def get_thread_resource_usage():
 | 
						|
        return None
 | 
						|
 | 
						|
 | 
						|
class LoggingContext(object):
 | 
						|
    """Additional context for log formatting. Contexts are scoped within a
 | 
						|
    "with" block.
 | 
						|
    Args:
 | 
						|
        name (str): Name for the context for debugging.
 | 
						|
    """
 | 
						|
 | 
						|
    __slots__ = [
 | 
						|
        "previous_context", "name", "usage_start", "usage_end", "main_thread",
 | 
						|
        "__dict__", "tag", "alive",
 | 
						|
    ]
 | 
						|
 | 
						|
    thread_local = threading.local()
 | 
						|
 | 
						|
    class Sentinel(object):
 | 
						|
        """Sentinel to represent the root context"""
 | 
						|
 | 
						|
        __slots__ = []
 | 
						|
 | 
						|
        def __str__(self):
 | 
						|
            return "sentinel"
 | 
						|
 | 
						|
        def copy_to(self, record):
 | 
						|
            pass
 | 
						|
 | 
						|
        def start(self):
 | 
						|
            pass
 | 
						|
 | 
						|
        def stop(self):
 | 
						|
            pass
 | 
						|
 | 
						|
        def add_database_transaction(self, duration_ms):
 | 
						|
            pass
 | 
						|
 | 
						|
        def __nonzero__(self):
 | 
						|
            return False
 | 
						|
 | 
						|
    sentinel = Sentinel()
 | 
						|
 | 
						|
    def __init__(self, name=None):
 | 
						|
        self.previous_context = LoggingContext.current_context()
 | 
						|
        self.name = name
 | 
						|
        self.ru_stime = 0.
 | 
						|
        self.ru_utime = 0.
 | 
						|
        self.db_txn_count = 0
 | 
						|
        self.db_txn_duration = 0.
 | 
						|
        self.usage_start = None
 | 
						|
        self.main_thread = threading.current_thread()
 | 
						|
        self.tag = ""
 | 
						|
        self.alive = True
 | 
						|
 | 
						|
    def __str__(self):
 | 
						|
        return "%s@%x" % (self.name, id(self))
 | 
						|
 | 
						|
    @classmethod
 | 
						|
    def current_context(cls):
 | 
						|
        """Get the current logging context from thread local storage"""
 | 
						|
        return getattr(cls.thread_local, "current_context", cls.sentinel)
 | 
						|
 | 
						|
    @classmethod
 | 
						|
    def set_current_context(cls, context):
 | 
						|
        """Set the current logging context in thread local storage
 | 
						|
        Args:
 | 
						|
            context(LoggingContext): The context to activate.
 | 
						|
        Returns:
 | 
						|
            The context that was previously active
 | 
						|
        """
 | 
						|
        current = cls.current_context()
 | 
						|
 | 
						|
        if current is not context:
 | 
						|
            current.stop()
 | 
						|
            cls.thread_local.current_context = context
 | 
						|
            context.start()
 | 
						|
        return current
 | 
						|
 | 
						|
    def __enter__(self):
 | 
						|
        """Enters this logging context into thread local storage"""
 | 
						|
        old_context = self.set_current_context(self)
 | 
						|
        if self.previous_context != old_context:
 | 
						|
            logger.warn(
 | 
						|
                "Expected previous context %r, found %r",
 | 
						|
                self.previous_context, old_context
 | 
						|
            )
 | 
						|
        self.alive = True
 | 
						|
        return self
 | 
						|
 | 
						|
    def __exit__(self, type, value, traceback):
 | 
						|
        """Restore the logging context in thread local storage to the state it
 | 
						|
        was before this context was entered.
 | 
						|
        Returns:
 | 
						|
            None to avoid suppressing any exeptions that were thrown.
 | 
						|
        """
 | 
						|
        current = self.set_current_context(self.previous_context)
 | 
						|
        if current is not self:
 | 
						|
            if current is self.sentinel:
 | 
						|
                logger.debug("Expected logging context %s has been lost", self)
 | 
						|
            else:
 | 
						|
                logger.warn(
 | 
						|
                    "Current logging context %s is not expected context %s",
 | 
						|
                    current,
 | 
						|
                    self
 | 
						|
                )
 | 
						|
        self.previous_context = None
 | 
						|
        self.alive = False
 | 
						|
 | 
						|
    def copy_to(self, record):
 | 
						|
        """Copy fields from this context to the record"""
 | 
						|
        for key, value in self.__dict__.items():
 | 
						|
            setattr(record, key, value)
 | 
						|
 | 
						|
        record.ru_utime, record.ru_stime = self.get_resource_usage()
 | 
						|
 | 
						|
    def start(self):
 | 
						|
        if threading.current_thread() is not self.main_thread:
 | 
						|
            return
 | 
						|
 | 
						|
        if self.usage_start and self.usage_end:
 | 
						|
            self.ru_utime += self.usage_end.ru_utime - self.usage_start.ru_utime
 | 
						|
            self.ru_stime += self.usage_end.ru_stime - self.usage_start.ru_stime
 | 
						|
            self.usage_start = None
 | 
						|
            self.usage_end = None
 | 
						|
 | 
						|
        if not self.usage_start:
 | 
						|
            self.usage_start = get_thread_resource_usage()
 | 
						|
 | 
						|
    def stop(self):
 | 
						|
        if threading.current_thread() is not self.main_thread:
 | 
						|
            return
 | 
						|
 | 
						|
        if self.usage_start:
 | 
						|
            self.usage_end = get_thread_resource_usage()
 | 
						|
 | 
						|
    def get_resource_usage(self):
 | 
						|
        ru_utime = self.ru_utime
 | 
						|
        ru_stime = self.ru_stime
 | 
						|
 | 
						|
        if self.usage_start and threading.current_thread() is self.main_thread:
 | 
						|
            current = get_thread_resource_usage()
 | 
						|
            ru_utime += current.ru_utime - self.usage_start.ru_utime
 | 
						|
            ru_stime += current.ru_stime - self.usage_start.ru_stime
 | 
						|
 | 
						|
        return ru_utime, ru_stime
 | 
						|
 | 
						|
    def add_database_transaction(self, duration_ms):
 | 
						|
        self.db_txn_count += 1
 | 
						|
        self.db_txn_duration += duration_ms / 1000.
 | 
						|
 | 
						|
 | 
						|
class LoggingContextFilter(logging.Filter):
 | 
						|
    """Logging filter that adds values from the current logging context to each
 | 
						|
    record.
 | 
						|
    Args:
 | 
						|
        **defaults: Default values to avoid formatters complaining about
 | 
						|
            missing fields
 | 
						|
    """
 | 
						|
    def __init__(self, **defaults):
 | 
						|
        self.defaults = defaults
 | 
						|
 | 
						|
    def filter(self, record):
 | 
						|
        """Add each fields from the logging contexts to the record.
 | 
						|
        Returns:
 | 
						|
            True to include the record in the log output.
 | 
						|
        """
 | 
						|
        context = LoggingContext.current_context()
 | 
						|
        for key, value in self.defaults.items():
 | 
						|
            setattr(record, key, value)
 | 
						|
        context.copy_to(record)
 | 
						|
        return True
 | 
						|
 | 
						|
 | 
						|
class PreserveLoggingContext(object):
 | 
						|
    """Captures the current logging context and restores it when the scope is
 | 
						|
    exited. Used to restore the context after a function using
 | 
						|
    @defer.inlineCallbacks is resumed by a callback from the reactor."""
 | 
						|
 | 
						|
    __slots__ = ["current_context", "new_context", "has_parent"]
 | 
						|
 | 
						|
    def __init__(self, new_context=LoggingContext.sentinel):
 | 
						|
        self.new_context = new_context
 | 
						|
 | 
						|
    def __enter__(self):
 | 
						|
        """Captures the current logging context"""
 | 
						|
        self.current_context = LoggingContext.set_current_context(
 | 
						|
            self.new_context
 | 
						|
        )
 | 
						|
 | 
						|
        if self.current_context:
 | 
						|
            self.has_parent = self.current_context.previous_context is not None
 | 
						|
            if not self.current_context.alive:
 | 
						|
                logger.debug(
 | 
						|
                    "Entering dead context: %s",
 | 
						|
                    self.current_context,
 | 
						|
                )
 | 
						|
 | 
						|
    def __exit__(self, type, value, traceback):
 | 
						|
        """Restores the current logging context"""
 | 
						|
        context = LoggingContext.set_current_context(self.current_context)
 | 
						|
 | 
						|
        if context != self.new_context:
 | 
						|
            logger.debug(
 | 
						|
                "Unexpected logging context: %s is not %s",
 | 
						|
                context, self.new_context,
 | 
						|
            )
 | 
						|
 | 
						|
        if self.current_context is not LoggingContext.sentinel:
 | 
						|
            if not self.current_context.alive:
 | 
						|
                logger.debug(
 | 
						|
                    "Restoring dead context: %s",
 | 
						|
                    self.current_context,
 | 
						|
                )
 | 
						|
 | 
						|
 | 
						|
class _PreservingContextDeferred(defer.Deferred):
 | 
						|
    """A deferred that ensures that all callbacks and errbacks are called with
 | 
						|
    the given logging context.
 | 
						|
    """
 | 
						|
    def __init__(self, context):
 | 
						|
        self._log_context = context
 | 
						|
        defer.Deferred.__init__(self)
 | 
						|
 | 
						|
    def addCallbacks(self, callback, errback=None,
 | 
						|
                     callbackArgs=None, callbackKeywords=None,
 | 
						|
                     errbackArgs=None, errbackKeywords=None):
 | 
						|
        callback = self._wrap_callback(callback)
 | 
						|
        errback = self._wrap_callback(errback)
 | 
						|
        return defer.Deferred.addCallbacks(
 | 
						|
            self, callback,
 | 
						|
            errback=errback,
 | 
						|
            callbackArgs=callbackArgs,
 | 
						|
            callbackKeywords=callbackKeywords,
 | 
						|
            errbackArgs=errbackArgs,
 | 
						|
            errbackKeywords=errbackKeywords,
 | 
						|
        )
 | 
						|
 | 
						|
    def _wrap_callback(self, f):
 | 
						|
        def g(res, *args, **kwargs):
 | 
						|
            with PreserveLoggingContext(self._log_context):
 | 
						|
                res = f(res, *args, **kwargs)
 | 
						|
            return res
 | 
						|
        return g
 | 
						|
 | 
						|
 | 
						|
def preserve_context_over_fn(fn, *args, **kwargs):
 | 
						|
    """Takes a function and invokes it with the given arguments, but removes
 | 
						|
    and restores the current logging context while doing so.
 | 
						|
 | 
						|
    If the result is a deferred, call preserve_context_over_deferred before
 | 
						|
    returning it.
 | 
						|
    """
 | 
						|
    with PreserveLoggingContext():
 | 
						|
        res = fn(*args, **kwargs)
 | 
						|
 | 
						|
    if isinstance(res, defer.Deferred):
 | 
						|
        return preserve_context_over_deferred(res)
 | 
						|
    else:
 | 
						|
        return res
 | 
						|
 | 
						|
 | 
						|
def preserve_context_over_deferred(deferred, context=None):
 | 
						|
    """Given a deferred wrap it such that any callbacks added later to it will
 | 
						|
    be invoked with the current context.
 | 
						|
 | 
						|
    Deprecated: this almost certainly doesn't do want you want, ie make
 | 
						|
    the deferred follow the synapse logcontext rules: try
 | 
						|
    ``make_deferred_yieldable`` instead.
 | 
						|
    """
 | 
						|
    if context is None:
 | 
						|
        context = LoggingContext.current_context()
 | 
						|
    d = _PreservingContextDeferred(context)
 | 
						|
    deferred.chainDeferred(d)
 | 
						|
    return d
 | 
						|
 | 
						|
 | 
						|
def preserve_fn(f):
 | 
						|
    """Wraps a function, to ensure that the current context is restored after
 | 
						|
    return from the function, and that the sentinel context is set once the
 | 
						|
    deferred returned by the funtion completes.
 | 
						|
 | 
						|
    Useful for wrapping functions that return a deferred which you don't yield
 | 
						|
    on.
 | 
						|
    """
 | 
						|
    def reset_context(result):
 | 
						|
        LoggingContext.set_current_context(LoggingContext.sentinel)
 | 
						|
        return result
 | 
						|
 | 
						|
    def g(*args, **kwargs):
 | 
						|
        current = LoggingContext.current_context()
 | 
						|
        res = f(*args, **kwargs)
 | 
						|
        if isinstance(res, defer.Deferred) and not res.called:
 | 
						|
            # The function will have reset the context before returning, so
 | 
						|
            # we need to restore it now.
 | 
						|
            LoggingContext.set_current_context(current)
 | 
						|
 | 
						|
            # The original context will be restored when the deferred
 | 
						|
            # completes, but there is nothing waiting for it, so it will
 | 
						|
            # get leaked into the reactor or some other function which
 | 
						|
            # wasn't expecting it. We therefore need to reset the context
 | 
						|
            # here.
 | 
						|
            #
 | 
						|
            # (If this feels asymmetric, consider it this way: we are
 | 
						|
            # effectively forking a new thread of execution. We are
 | 
						|
            # probably currently within a ``with LoggingContext()`` block,
 | 
						|
            # which is supposed to have a single entry and exit point. But
 | 
						|
            # by spawning off another deferred, we are effectively
 | 
						|
            # adding a new exit point.)
 | 
						|
            res.addBoth(reset_context)
 | 
						|
        return res
 | 
						|
    return g
 | 
						|
 | 
						|
 | 
						|
@defer.inlineCallbacks
 | 
						|
def make_deferred_yieldable(deferred):
 | 
						|
    """Given a deferred, make it follow the Synapse logcontext rules:
 | 
						|
 | 
						|
    If the deferred has completed (or is not actually a Deferred), essentially
 | 
						|
    does nothing (just returns another completed deferred with the
 | 
						|
    result/failure).
 | 
						|
 | 
						|
    If the deferred has not yet completed, resets the logcontext before
 | 
						|
    returning a deferred. Then, when the deferred completes, restores the
 | 
						|
    current logcontext before running callbacks/errbacks.
 | 
						|
 | 
						|
    (This is more-or-less the opposite operation to preserve_fn.)
 | 
						|
    """
 | 
						|
    with PreserveLoggingContext():
 | 
						|
        r = yield deferred
 | 
						|
    defer.returnValue(r)
 | 
						|
 | 
						|
 | 
						|
# modules to ignore in `logcontext_tracer`
 | 
						|
_to_ignore = [
 | 
						|
    "synapse.util.logcontext",
 | 
						|
    "synapse.http.server",
 | 
						|
    "synapse.storage._base",
 | 
						|
    "synapse.util.async",
 | 
						|
]
 | 
						|
 | 
						|
 | 
						|
def logcontext_tracer(frame, event, arg):
 | 
						|
    """A tracer that logs whenever a logcontext "unexpectedly" changes within
 | 
						|
    a function. Probably inaccurate.
 | 
						|
 | 
						|
    Use by calling `sys.settrace(logcontext_tracer)` in the main thread.
 | 
						|
    """
 | 
						|
    if event == 'call':
 | 
						|
        name = frame.f_globals["__name__"]
 | 
						|
        if name.startswith("synapse"):
 | 
						|
            if name == "synapse.util.logcontext":
 | 
						|
                if frame.f_code.co_name in ["__enter__", "__exit__"]:
 | 
						|
                    tracer = frame.f_back.f_trace
 | 
						|
                    if tracer:
 | 
						|
                        tracer.just_changed = True
 | 
						|
 | 
						|
            tracer = frame.f_trace
 | 
						|
            if tracer:
 | 
						|
                return tracer
 | 
						|
 | 
						|
            if not any(name.startswith(ig) for ig in _to_ignore):
 | 
						|
                return LineTracer()
 | 
						|
 | 
						|
 | 
						|
class LineTracer(object):
 | 
						|
    __slots__ = ["context", "just_changed"]
 | 
						|
 | 
						|
    def __init__(self):
 | 
						|
        self.context = LoggingContext.current_context()
 | 
						|
        self.just_changed = False
 | 
						|
 | 
						|
    def __call__(self, frame, event, arg):
 | 
						|
        if event in 'line':
 | 
						|
            if self.just_changed:
 | 
						|
                self.context = LoggingContext.current_context()
 | 
						|
                self.just_changed = False
 | 
						|
            else:
 | 
						|
                c = LoggingContext.current_context()
 | 
						|
                if c != self.context:
 | 
						|
                    logger.info(
 | 
						|
                        "Context changed! %s -> %s, %s, %s",
 | 
						|
                        self.context, c,
 | 
						|
                        frame.f_code.co_filename, frame.f_lineno
 | 
						|
                    )
 | 
						|
                    self.context = c
 | 
						|
 | 
						|
        return self
 |