Source code for plaso.parsers.bencode_plugins.interface

# -*- coding: utf-8 -*-
"""bencode_interface contains basic interface for bencode plugins within Plaso.

Bencoded files are only one example of a type of object that the Plaso tool is
expected to encounter and process.  There can be and are many other parsers
which are designed to process specific data types.

BencodePlugin defines the attributes necessary for registration, discovery
and operation of plugins for bencoded files which will be used by
BencodeParser.
"""
from __future__ import unicode_literals

import abc

from plaso.lib import errors
from plaso.parsers import logger
from plaso.parsers import plugins


[docs]class BencodePlugin(plugins.BasePlugin): """This is an abstract class from which plugins should be based.""" # BENCODE_KEYS is a list of keys required by a plugin. # This is expected to be overridden by the processing plugin. # Ex. frozenset(['activity-date', 'done-date']) BENCODE_KEYS = frozenset(['any']) # This is expected to be overridden by the processing plugin. # URLS should contain a list of URLs with additional information about # this key or value. # Ex. ['https://wiki.theory.org/BitTorrentSpecification#Bencoding'] URLS = [] NAME = 'bencode' def _GetKeys(self, data, keys, depth=1): """Helper function to return keys nested in a bencode dict. By default this function will return the values for the named keys requested by a plugin in match{}. The default setting is to look a single layer down from the root (same as the check for plugin applicability). This level is suitable for most cases. For cases where there is variability in the name at the first level (e.g. it is the MAC addresses of a device, or a UUID) it is possible to override the depth limit and use _GetKeys to fetch from a deeper level. Args: data (dict[str, object]): bencode data values. keys (list[str]): keys that should be returned. depth (int): how many levels deep to check for a match. Returns: dict[str, object]: a dictionary with just the keys requested. """ keys = set(keys) match = {} if depth == 1: for key in keys: match[key] = data[key] else: for _, parsed_key, parsed_value in self._RecurseKey( data, depth=depth): if parsed_key in keys: match[parsed_key] = parsed_value if set(match.keys()) == keys: return match return match def _RecurseKey(self, recur_item, root='', depth=15): """Flattens nested dictionaries and lists by yielding their values. The hierarchy of a bencode file is a series of nested dictionaries and lists. This is a helper function helps plugins navigate the structure without having to reimplement their own recursive methods. This method implements an overridable depth limit to prevent processing extremely deeply nested dictionaries. If the limit is reached a debug message is logged indicating which key processing stopped on. Args: recur_item (object): object to be checked for additional nested items. root (str): the pathname of the current working key. depth (int): a counter to ensure we stop at the maximum recursion depth. Yields: tuple: containing: str: root str: key str: value """ if depth < 1: logger.debug('Recursion limit hit for key: {0:s}'.format(root)) return if isinstance(recur_item, (list, tuple)): for recur in recur_item: for key in self._RecurseKey(recur, root, depth): yield key return if not hasattr(recur_item, 'iteritems'): return for key, value in iter(recur_item.items()): yield root, key, value if isinstance(value, dict): value = [value] if isinstance(value, list): for item in value: if isinstance(item, dict): for keyval in self._RecurseKey( item, root=root + '/' + key, depth=depth - 1): yield keyval # pylint 1.9.3 wants a docstring for kwargs, but this is not useful to add. # pylint: disable=missing-param-doc
[docs] @abc.abstractmethod def GetEntries(self, parser_mediator, data=None, **kwargs): """Extracts event object from the values of entries within a bencoded file. This is the main method that a bencode plugin needs to implement. The contents of the bencode keys defined in BENCODE_KEYS can be made available to the plugin as both a matched{'KEY': 'value'} and as the entire bencoded data dictionary. The plugin should implement logic to parse the most relevant data set into a useful event for incorporation into the Plaso timeline. The attributes for a BencodeEvent should include the following: root = Root key this event was extracted from. key = Key the value resided in. time = Date this artifact was created in micro seconds (usec) from January 1, 1970 00:00:00 UTC. desc = Short description. Args: parser_mediator (ParserMediator): mediates interactions between parsers and other components, such as storage and dfvfs. data (Optional[dict[str, object]]): bencode data values.
""" # pylint 1.9.3 wants a docstring for kwargs, but this is not useful to add. # pylint: disable=missing-param-doc,arguments-differ
[docs] def Process(self, parser_mediator, data, **kwargs): """Determine if this is the correct plugin; if so proceed with processing. Process() checks if the current bencode file being processed is a match for a plugin by comparing the PATH and KEY requirements defined by a plugin. If both match processing continues; else raise WrongBencodePlugin. This function also extracts the required keys as defined in self.BENCODE_KEYS from the file and stores the result in match[key] and calls self.GetEntries() which holds the processing logic implemented by the plugin. Args: parser_mediator (ParserMediator): mediates interactions between parsers and other components, such as storage and dfvfs. data (dict[str, object]): bencode data values. Raises: WrongBencodePlugin: If this plugin is not able to process the given file. ValueError: If top level is not set. """ if data is None: raise ValueError('Data is not set.') if not set(data.keys()).issuperset(self.BENCODE_KEYS): raise errors.WrongBencodePlugin(self.NAME) # This will raise if unhandled keyword arguments are passed. super(BencodePlugin, self).Process(parser_mediator) logger.debug('Bencode Plugin Used: {0:s}'.format(self.NAME))
self.GetEntries(parser_mediator, data=data)