Source code for plaso.parsers.plist

"""Parser for binary and text Property List (plist) files."""

import binascii
import plistlib

from xml.parsers import expat

from plaso.lib import errors
from plaso.lib import specification
from plaso.parsers import interface
from plaso.parsers import logger
from plaso.parsers import manager



[docs]
class PlistParser(interface.FileObjectParser):
    """Parser for binary and text Property List (plist) files.

    The plist data is loaded with plistlib and the resulting top level object
    is passed to the plist plugins for processing.
    """

    # Name and human readable description of the data format of the parser.
    NAME = "plist"
    DATA_FORMAT = "Property list (plist) file"

    # 50 MB is 10x larger than any plist file seen to date.
    # NOTE(review): this value is not referenced by the methods of this class;
    # presumably it is enforced by the parser framework - confirm.
    _MAXIMUM_FILE_SIZE = 50000000

    # Byte-order-marks used to detect the encoding of text (XML) plist data.
    _UTF16BE_BYTE_ORDER_MARK = b"\xfe\xff"
    _UTF16LE_BYTE_ORDER_MARK = b"\xff\xfe"
    _UTF32BE_BYTE_ORDER_MARK = b"\x00\x00\xfe\xff"
    _UTF32LE_BYTE_ORDER_MARK = b"\xff\xfe\x00\x00"
    _UTF8_BYTE_ORDER_MARK = b"\xef\xbb\xbf"

    # Plugin classes of this parser.
    # NOTE(review): presumably filled by plugin registration elsewhere - confirm.
    _plugin_classes = {}

    def _CheckByteOrderMark(self, plist_data):
        """Determines if the plist data starts with a byte-order-mark.

        Args:
          plist_data (bytes): plist data.

        Returns:
          tuple: containing:

            int: size of the byte-order-mark or 0 if no byte-order-mark was
                detected.
            str: encoding or ascii if no byte-order-mark was detected.
        """
        if plist_data.startswith(self._UTF32BE_BYTE_ORDER_MARK):
            return 4, "utf-32-be"

        if plist_data.startswith(self._UTF32LE_BYTE_ORDER_MARK):
            return 4, "utf-32-le"

        if plist_data.startswith(self._UTF16BE_BYTE_ORDER_MARK):
            return 2, "utf-16-be"

        if plist_data.startswith(self._UTF16LE_BYTE_ORDER_MARK):
            return 2, "utf-16-le"

        if plist_data.startswith(self._UTF8_BYTE_ORDER_MARK):
            return 3, "utf-8"

        return 0, "ascii"


[docs]
    @classmethod
    def GetFormatSpecification(cls):
        """Builds the format specification of the parser.

        Returns:
          FormatSpecification: format specification named after the parser that
              contains the binary plist signature "bplist" at offset 0.
        """
        binary_plist_specification = specification.FormatSpecification(cls.NAME)
        binary_plist_specification.AddNewSignature(b"bplist", offset=0)
        return binary_plist_specification



[docs]
    def ParseFileObject(self, parser_mediator, file_object):
        """Parses a plist file-like object.

        The complete file content is read and loaded with plistlib. XML plists
        are first checked for a closing plist root element. The resulting top
        level object is offered to every plugin; a plugin processes it when its
        path filters match the filename and its required format check passes.
        The default plugin, if set, is used when no plugin successfully
        processed the plist.

        Args:
          parser_mediator (ParserMediator): mediates interactions between parsers
              and other components, such as storage and dfVFS.
          file_object (dfvfs.FileIO): a file-like object.

        Raises:
          WrongParser: when the file cannot be parsed.
        """
        filename = parser_mediator.GetFilename()

        # The whole file is read into memory.
        # NOTE(review): this relies on _MAXIMUM_FILE_SIZE being enforced before
        # this method is called; that check is not visible here - confirm.
        plist_data = file_object.read()

        has_leading_whitespace = False

        is_binary_plist = plist_data.startswith(b"bplist0")
        if not is_binary_plist:
            byte_order_mark_size, encoding = self._CheckByteOrderMark(plist_data)

            # NOTE(review): lstrip() and rstrip() below operate on bytes and only
            # remove ASCII whitespace bytes; for UTF-16 and UTF-32 encoded data
            # whitespace characters span multiple bytes, so stripping likely
            # does not behave as intended for those encodings - confirm.
            xml_signature = "<?xml ".encode(encoding)
            is_xml = plist_data[byte_order_mark_size:].startswith(xml_signature)
            if not is_xml:
                # Preserve the byte-order-mark for plistlib.
                plist_data = b"".join(
                    [
                        plist_data[:byte_order_mark_size],
                        plist_data[byte_order_mark_size:].lstrip(),
                    ]
                )
                is_xml = plist_data[byte_order_mark_size:].startswith(xml_signature)
                has_leading_whitespace = is_xml

            if is_xml:
                plist_footer = "</plist>".encode(encoding)
                plist_data = plist_data.rstrip()

                if not plist_data.endswith(plist_footer):
                    raise errors.WrongParser(
                        "Unable to parse XML plist with error: missing plist XML root "
                        "element."
                    )

        try:
            top_level_object = plistlib.loads(plist_data)

        except (
            AttributeError,
            binascii.Error,
            expat.ExpatError,
            plistlib.InvalidFileException,
        ) as exception:
            raise errors.WrongParser(
                f"Unable to parse plist with error: {exception!s}"
            ) from exception

        except (LookupError, ValueError) as exception:
            # LookupError will be raised in cases where the plist is an XML file
            # that contains an unsupported encoding.
            # ValueError will be raised in cases where the plist is an XML file
            # that contains an unsupported date and time value.
            parser_mediator.ProduceExtractionWarning(
                f"unable to parse XML plist with error: {exception!s}"
            )
            return

        if not top_level_object:
            # Do not produce an extraction warning for a binary plist without a top
            # level object or an XML plist with an empty top level object.
            if top_level_object is None and not is_binary_plist:
                parser_mediator.ProduceExtractionWarning(
                    (
                        "unable to parse XML plist file with error: missing top level "
                        "object"
                    )
                )
            return

        if has_leading_whitespace:
            parser_mediator.ProduceExtractionWarning(
                "XML plist file with leading whitespace"
            )

        display_name = parser_mediator.GetDisplayName()
        filename_lower_case = filename.lower()

        found_matching_plugin = False
        for plugin_name, plugin in self._plugins_per_name.items():
            if parser_mediator.abort:
                break

            profiling_name = "/".join([self.NAME, plugin.NAME])

            parser_mediator.SampleFormatCheckStartTiming(profiling_name)

            try:
                # A plugin without path filters matches every filename.
                path_filters = plugin.PLIST_PATH_FILTERS
                path_filter_match = not path_filters or any(
                    path_filter.Match(filename_lower_case)
                    for path_filter in path_filters
                )

                try:
                    required_format = plugin.CheckRequiredFormat(top_level_object)
                except Exception as exception:  # pylint: disable=broad-except
                    # A failing format check means the plugin does not apply.
                    # Without this assignment required_format would be unbound
                    # for the first plugin or carry over the result of the
                    # previous plugin.
                    required_format = False
                    parser_mediator.ProduceExtractionWarning(
                        f"plugin: {plugin_name:s} unable to parse plist file with "
                        f"error: {exception!s}"
                    )

            finally:
                parser_mediator.SampleFormatCheckStopTiming(profiling_name)

            if not path_filter_match or not required_format:
                logger.debug(
                    f"Skipped parsing file: {display_name:s} "
                    f"with plugin: {plugin_name:s}"
                )
                continue

            logger.debug(f"Parsing file: {display_name:s} with plugin: {plugin_name:s}")

            parser_mediator.SampleStartTiming(profiling_name)

            try:
                plugin.UpdateChainAndProcess(
                    parser_mediator, top_level=top_level_object
                )
                # Only a plugin that completed without error counts as a match.
                found_matching_plugin = True

            except Exception as exception:  # pylint: disable=broad-except
                parser_mediator.ProduceExtractionWarning(
                    f"plugin: {plugin_name:s} unable to parse plist file with error: "
                    f"{exception!s}"
                )

            finally:
                parser_mediator.SampleStopTiming(profiling_name)

        # Fall back to the default plugin when no other plugin processed the
        # plist.
        if not found_matching_plugin and self._default_plugin:
            profiling_name = "/".join([self.NAME, self._default_plugin.NAME])

            parser_mediator.SampleStartTiming(profiling_name)

            try:
                self._default_plugin.UpdateChainAndProcess(
                    parser_mediator, top_level=top_level_object
                )
            finally:
                parser_mediator.SampleStopTiming(profiling_name)




# Register the plist parser with the parsers manager when this module is
# imported.
manager.ParsersManager.RegisterParser(PlistParser)