Source code for plaso.parsers.recycler

"""Parser for Windows Recycle files, INFO2 and $I/$R pairs."""

import os

from dfdatetime import filetime as dfdatetime_filetime

from plaso.containers import events
from plaso.lib import dtfabric_helper
from plaso.lib import errors
from plaso.parsers import interface
from plaso.parsers import manager


class WinRecycleBinEventData(events.EventData):
    """Event data describing an item found in the Windows Recycle Bin.

    Attributes:
      deletion_time (dfdatetime.DateTimeValues): date and time the file entry
          was deleted.
      drive_number (int): drive number.
      file_size (int): file size.
      offset (int): offset of the Recycle Bin record, relative to the start of
          the file, from which the event data was extracted.
      original_filename (str): filename.
      record_index (int): index of the record from which the event data was
          extracted.
      short_filename (str): short filename.
    """

    DATA_TYPE = "windows:metadata:deleted_item"

    def __init__(self):
        """Creates the event data with every attribute unset (None)."""
        super(WinRecycleBinEventData, self).__init__(data_type=self.DATA_TYPE)

        # Values are filled in by the parsers; None means "not available".
        self.deletion_time = None
        self.drive_number = None
        self.file_size = None
        self.offset = None
        self.original_filename = None
        self.record_index = None
        self.short_filename = None
class WinRecycleBinParser(interface.FileObjectParser, dtfabric_helper.DtFabricHelper):
    """Parses the Windows $Recycle.Bin $I files."""

    NAME = "recycle_bin"
    DATA_FORMAT = "Windows $Recycle.Bin $I file"

    _DEFINITION_FILE = os.path.join(os.path.dirname(__file__), "recycler.yaml")

    _SUPPORTED_FORMAT_VERSIONS = (1, 2)

    def _ParseOriginalFilename(self, file_object, format_version):
        """Parses the original filename.

        The filename is read from the current position of the file-like object.

        Args:
          file_object (FileIO): file-like object.
          format_version (int): format version.

        Returns:
          str: original filename with trailing NUL characters removed.

        Raises:
          ParseError: if the original filename cannot be read.
        """
        file_offset = file_object.tell()

        # Format version 1 maps to a bare string, any other version to a
        # structure whose "string" member holds the filename.
        if format_version == 1:
            data_type_map = self._GetDataTypeMap("recycle_bin_metadata_utf16le_string")
        else:
            data_type_map = self._GetDataTypeMap(
                "recycle_bin_metadata_utf16le_string_with_size"
            )

        try:
            original_filename, _ = self._ReadStructureFromFileObject(
                file_object, file_offset, data_type_map
            )
        except (ValueError, errors.ParseError) as exception:
            # Chain the cause so the underlying read/map failure stays visible.
            raise errors.ParseError(
                f"Unable to parse original filename with error: {exception!s}"
            ) from exception

        if format_version == 1:
            return original_filename.rstrip("\x00")

        return original_filename.string.rstrip("\x00")

    def ParseFileObject(self, parser_mediator, file_object):
        """Parses a Windows Recycle.Bin metadata ($I) file-like object.

        Event data is produced even when the original filename cannot be
        parsed; in that case an extraction warning is produced and the
        original filename is left unset.

        Args:
          parser_mediator (ParserMediator): mediates interactions between
              parsers and other components, such as storage and dfVFS.
          file_object (dfvfs.FileIO): file-like object.

        Raises:
          WrongParser: when the file cannot be parsed.
        """
        # We may have to rely on filenames since this header is very generic.
        # TODO: Rethink this and potentially make a better test.
        filename = parser_mediator.GetFilename()

        # NOTE(review): presumably GetFilename() can return None when there is
        # no active file entry - treat that as "not a $I file" instead of
        # failing with an AttributeError.
        if not filename or not filename.startswith("$I"):
            raise errors.WrongParser("Filename must start with $I.")

        file_header_map = self._GetDataTypeMap("recycle_bin_metadata_file_header")

        try:
            file_header, _ = self._ReadStructureFromFileObject(
                file_object, 0, file_header_map
            )
        except (ValueError, errors.ParseError) as exception:
            raise errors.WrongParser(
                "Unable to parse Windows Recycle.Bin metadata file header with "
                f"error: {exception!s}"
            ) from exception

        if file_header.format_version not in self._SUPPORTED_FORMAT_VERSIONS:
            raise errors.WrongParser(
                f"Unsupported format version: {file_header.format_version:d}."
            )

        event_data = WinRecycleBinEventData()
        event_data.file_size = file_header.original_file_size

        try:
            event_data.original_filename = self._ParseOriginalFilename(
                file_object, file_header.format_version
            )
        except (ValueError, errors.ParseError) as exception:
            parser_mediator.ProduceExtractionWarning(
                f"unable to parse original filename with error: {exception!s}."
            )

        # A deletion time of 0 is treated as "not set".
        if file_header.deletion_time:
            event_data.deletion_time = dfdatetime_filetime.Filetime(
                timestamp=file_header.deletion_time
            )

        parser_mediator.ProduceEventData(event_data)
class WinRecyclerInfo2Parser(
    interface.FileObjectParser, dtfabric_helper.DtFabricHelper
):
    """Parses the Windows Recycler INFO2 file."""

    NAME = "recycle_bin_info2"
    DATA_FORMAT = "Windows Recycler INFO2 file"

    _DEFINITION_FILE = os.path.join(os.path.dirname(__file__), "recycler.yaml")

    _RECORD_INDEX_OFFSET = 0x104

    # Offset, relative to the start of a record, of the UTF-16 little-endian
    # filename that follows the first 280 (0x118) bytes of larger records.
    _UNICODE_FILENAME_OFFSET = 0x118

    def _ParseInfo2Record(
        self, parser_mediator, file_object, record_offset, record_size
    ):
        """Parses an INFO-2 record.

        Args:
          parser_mediator (ParserMediator): mediates interactions between
              parsers and other components, such as storage and dfVFS.
          file_object (dfvfs.FileIO): file-like object.
          record_offset (int): record offset.
          record_size (int): record size.

        Raises:
          ParseError: if the record cannot be read.
        """
        record_data = self._ReadData(file_object, record_offset, record_size)

        record_map = self._GetDataTypeMap("recycler_info2_file_entry")

        try:
            record = self._ReadStructureFromByteStream(
                record_data, record_offset, record_map
            )
        except (ValueError, errors.ParseError) as exception:
            raise errors.ParseError(
                f"Unable to map record data at offset: 0x{record_offset:08x} "
                f"with error: {exception!s}"
            ) from exception

        code_page = parser_mediator.GetCodePage()

        # The original filename can contain remnant data after the
        # end-of-string character.
        ascii_filename = record.original_filename.split(b"\x00")[0]

        try:
            ascii_filename = ascii_filename.decode(code_page)
        except UnicodeDecodeError:
            # Keep a best-effort filename but tell the user it is lossy.
            ascii_filename = ascii_filename.decode(code_page, errors="replace")

            parser_mediator.ProduceExtractionWarning(
                "unable to decode original filename."
            )

        unicode_filename = None
        if record_size > self._UNICODE_FILENAME_OFFSET:
            # Use a separate variable so that record_offset keeps pointing at
            # the start of the record, which is what the event data reports.
            unicode_filename_offset = record_offset + self._UNICODE_FILENAME_OFFSET

            utf16_string_map = self._GetDataTypeMap(
                "recycler_info2_file_entry_utf16le_string"
            )

            try:
                unicode_filename = self._ReadStructureFromByteStream(
                    record_data[self._UNICODE_FILENAME_OFFSET :],
                    unicode_filename_offset,
                    utf16_string_map,
                )
            except (ValueError, errors.ParseError) as exception:
                raise errors.ParseError(
                    "Unable to map record data at offset: "
                    f"0x{unicode_filename_offset:08x} "
                    f"with error: {exception!s}"
                ) from exception

        event_data = WinRecycleBinEventData()
        event_data.drive_number = record.drive_number
        event_data.original_filename = unicode_filename or ascii_filename
        event_data.file_size = record.original_file_size
        event_data.offset = record_offset
        event_data.record_index = record.index

        if ascii_filename != unicode_filename:
            event_data.short_filename = ascii_filename

        # A deletion time of 0 is treated as "not set".
        if record.deletion_time:
            event_data.deletion_time = dfdatetime_filetime.Filetime(
                timestamp=record.deletion_time
            )

        parser_mediator.ProduceEventData(event_data)

    def ParseFileObject(self, parser_mediator, file_object):
        """Parses a Windows Recycler INFO2 file-like object.

        Files whose name does not start with "INFO2" are skipped silently.
        An unsupported signature or file entry size, or a record that cannot
        be parsed, is reported as an extraction warning and ends parsing.

        Args:
          parser_mediator (ParserMediator): mediates interactions between
              parsers and other components, such as storage and dfVFS.
          file_object (dfvfs.FileIO): file-like object.

        Raises:
          WrongParser: when the file cannot be parsed.
        """
        # Since this header value is really generic it is hard not to use
        # filename as an indicator too.
        # TODO: Rethink this and potentially make a better test.
        filename = parser_mediator.GetFilename()

        # NOTE(review): presumably GetFilename() can return None when there is
        # no active file entry - skip such input instead of failing with an
        # AttributeError.
        if not filename or not filename.startswith("INFO2"):
            return

        file_header_map = self._GetDataTypeMap("recycler_info2_file_header")

        try:
            file_header, _ = self._ReadStructureFromFileObject(
                file_object, 0, file_header_map
            )
        except (ValueError, errors.ParseError) as exception:
            raise errors.WrongParser(
                "Unable to parse Windows Recycler INFO2 file header with "
                f"error: {exception!s}"
            ) from exception

        if file_header.unknown1 != 5:
            parser_mediator.ProduceExtractionWarning("unsupported format signature.")
            return

        file_entry_size = file_header.file_entry_size
        if file_entry_size not in (280, 800):
            parser_mediator.ProduceExtractionWarning(
                f"unsupported file entry size: {file_entry_size:d}"
            )
            return

        # Records start right after the header, at the current offset.
        file_offset = file_object.get_offset()
        file_size = file_object.get_size()

        while file_offset < file_size:
            try:
                self._ParseInfo2Record(
                    parser_mediator, file_object, file_offset, file_entry_size
                )
            except errors.ParseError as exception:
                # Report the unreadable record instead of letting an
                # undocumented ParseError escape, then stop.
                parser_mediator.ProduceExtractionWarning(
                    f"unable to parse record at offset: 0x{file_offset:08x} "
                    f"with error: {exception!s}"
                )
                break

            file_offset += file_entry_size
# Register both Recycle Bin parsers with the parsers manager.
manager.ParsersManager.RegisterParsers(
    [
        WinRecycleBinParser,
        WinRecyclerInfo2Parser,
    ]
)