Source code for plaso.parsers.text_plugins.android_logcat

"""Text parser plugin for Android logcat files.

Android logcat can have a number of output formats. This parser supports:
* 'threadtime' format
* 'time' format

The log file format is:
date time PID-TID/package priority/tag: message

For example:
12-10 13:02:50.071 1901-4229/com.google.android.gms V/AuthZen: Handling
delegate intent.

Where priority is one of the characters accepted by the parser:
V: Verbose (lowest priority)
D: Debug
I: Info
W: Warning
E: Error
F: Fatal
S: Silent (highest priority)

In addition, the following format modifiers are supported:
* date with a year
* user identifier (uid)
* microseconds fraction of second precision (usec)
* time zone offset

Also see:
  https://developer.android.com/studio/debug/logcat
"""

import pyparsing

from dfdatetime import time_elements as dfdatetime_time_elements

from plaso.containers import events
from plaso.lib import dateless_helper
from plaso.lib import errors
from plaso.parsers import text_parser
from plaso.parsers.text_plugins import interface


class AndroidLogcatEventData(events.EventData):
    """Event data describing a single Android logcat entry.

    Attributes:
      component_tag (str): tag naming the system component the logcat line
          originates from.
      file_offset (int): offset in the file at which the log message was
          parsed.
      message (str): text of the log message.
      pid (int): identifier of the process (PID) that produced the logcat
          line.
      priority (str): one character from the set {V, D, I, W, E, F, S},
          listed from lowest to highest priority.
      recorded_time (dfdatetime.DateTimeValues): date and time at which the
          log entry was recorded.
      thread_identifier (int): identifier of the thread (TID) that produced
          the logcat line.
      user_identifier (int): user identifier (UID) or Android ID of the
          logged process.
    """

    DATA_TYPE = "android:logcat"

    def __init__(self):
        """Initializes event data with every attribute unset."""
        super().__init__(data_type=self.DATA_TYPE)

        # All values start as None and are filled in by the parser plugin.
        self.component_tag = None
        self.file_offset = None
        self.message = None
        self.pid = None
        self.priority = None
        self.recorded_time = None
        self.thread_identifier = None
        self.user_identifier = None
class AndroidLogcatTextPlugin(
    interface.TextPlugin, dateless_helper.DateLessLogFormatHelper
):
    """Text parser plugin for Android logcat files.

    Two kinds of lines are recognized: "--------- beginning of <buffer>"
    marker lines, which produce no event data, and log lines in either the
    'threadtime' or the 'time' layout, which produce one
    AndroidLogcatEventData each.
    """

    NAME = "android_logcat"
    DATA_FORMAT = "Android logcat file"

    ENCODING = "utf-8"

    # Numeric tokens are converted to int at parse time.
    _INTEGER = pyparsing.Word(pyparsing.nums).set_parse_action(
        lambda tokens: int(tokens[0], 10)
    )

    _TWO_DIGITS = pyparsing.Word(pyparsing.nums, exact=2).set_parse_action(
        lambda tokens: int(tokens[0], 10)
    )

    _FOUR_DIGITS = pyparsing.Word(pyparsing.nums, exact=4).set_parse_action(
        lambda tokens: int(tokens[0], 10)
    )

    _MONTH_DAY = _TWO_DIGITS + pyparsing.Suppress("-") + _TWO_DIGITS

    _YEAR_MONTH_DAY = (
        _FOUR_DIGITS
        + pyparsing.Suppress("-")
        + _TWO_DIGITS
        + pyparsing.Suppress("-")
        + _TWO_DIGITS
    )

    # The fraction is kept as a string (no parse action) because its length,
    # 3 or 6 digits, is what selects millisecond versus microsecond precision
    # in _ParseTimeElements.
    _FRACTION_OF_SECOND = pyparsing.Word(pyparsing.nums, exact=3) ^ pyparsing.Word(
        pyparsing.nums, exact=6
    )

    # Date and time values are formatted as:
    # 01-02 01:02:04.156 (year-less)
    # 2022-01-02 01:20:03.171
    # 2022-01-02 11:44:23.183801
    _DATE_TIME = (
        pyparsing.Or([_YEAR_MONTH_DAY, _MONTH_DAY])
        + _TWO_DIGITS
        + pyparsing.Suppress(":")
        + _TWO_DIGITS
        + pyparsing.Suppress(":")
        + _TWO_DIGITS
        + pyparsing.Suppress(".")
        + _FRACTION_OF_SECOND
    )

    # Sign character followed by two-digit hours and two-digit minutes.
    _TIME_ZONE_OFFSET = pyparsing.Word("+-", exact=1) + _TWO_DIGITS + _TWO_DIGITS

    _PID_AND_THREAD_IDENTIFIER = _INTEGER.set_results_name(
        "pid"
    ) + _INTEGER.set_results_name("thread_identifier")

    _USER_PID_AND_THREAD_IDENTIFIER = (
        _INTEGER.set_results_name("user_identifier") + _PID_AND_THREAD_IDENTIFIER
    )

    _END_OF_LINE = pyparsing.Suppress(pyparsing.LineEnd())

    _BEGINNING_LINE = (
        pyparsing.Suppress("--------- beginning of ")
        + pyparsing.one_of(["events", "kernel", "main", "radio", "system"])
        + _END_OF_LINE
    )

    # Body of a 'threadtime' line: [uid] pid tid priority [tag]
    _THREADTIME_LINE_BODY = (
        pyparsing.Or([_USER_PID_AND_THREAD_IDENTIFIER, _PID_AND_THREAD_IDENTIFIER])
        + pyparsing.Word("VDIWEFS", exact=1).set_results_name("priority")
        + pyparsing.Optional(
            pyparsing.Word(
                pyparsing.printables + " ", excludeChars=":"
            ).set_results_name("tag")
        )
    )

    # Body of a 'time' line: priority/tag(pid) or priority/tag(uid:pid)
    _TIME_LINE_BODY = (
        pyparsing.Word("VDIWEFS", exact=1).set_results_name("priority")
        + pyparsing.Suppress("/")
        + pyparsing.Word(pyparsing.printables + " ", excludeChars="(").set_results_name(
            "tag"
        )
        + pyparsing.Suppress("(")
        + pyparsing.Or(
            [
                _INTEGER.set_results_name("pid"),
                (
                    _INTEGER.set_results_name("user_identifier")
                    + pyparsing.Suppress(":")
                    + _INTEGER.set_results_name("pid")
                ),
            ]
        )
        + pyparsing.Suppress(")")
    )

    _LOG_LINE = (
        _DATE_TIME.set_results_name("date_time")
        + pyparsing.Optional(_TIME_ZONE_OFFSET).set_results_name("time_zone_offset")
        + (_THREADTIME_LINE_BODY ^ _TIME_LINE_BODY)
        + pyparsing.Suppress(": ")
        + pyparsing.restOfLine().set_results_name("message")
        + _END_OF_LINE
    )

    _LINE_STRUCTURES = [("beginning_line", _BEGINNING_LINE), ("log_line", _LOG_LINE)]

    VERIFICATION_GRAMMAR = _BEGINNING_LINE ^ _LOG_LINE

    def _ParseRecord(self, parser_mediator, key, structure):
        """Parses a pyparsing structure.

        Args:
          parser_mediator (ParserMediator): mediates interactions between
              parsers and other components, such as storage and dfVFS.
          key (str): name of the parsed structure.
          structure (pyparsing.ParseResults): tokens from a parsed log line.

        Raises:
          ParseError: if the structure cannot be parsed.
        """
        # "beginning of <buffer>" marker lines carry no event information.
        if key == "beginning_line":
            return

        event_data = AndroidLogcatEventData()
        event_data.component_tag = self._GetStringValueFromStructure(
            structure, "tag"
        )
        event_data.file_offset = self._current_offset
        event_data.message = self._GetValueFromStructure(structure, "message")
        event_data.pid = self._GetValueFromStructure(structure, "pid")
        event_data.priority = self._GetValueFromStructure(structure, "priority")
        event_data.recorded_time = self._ParseTimeElements(structure)
        event_data.thread_identifier = self._GetValueFromStructure(
            structure, "thread_identifier"
        )
        event_data.user_identifier = self._GetValueFromStructure(
            structure, "user_identifier"
        )

        parser_mediator.ProduceEventData(event_data)

    def _ParseTimeElements(self, structure):
        """Parses date and time elements of a log line.

        Args:
          structure (pyparsing.ParseResults): tokens from a parsed log line.
              This must be the full line structure, since both the "date_time"
              and the "time_zone_offset" named results are read from it.

        Returns:
          dfdatetime.TimeElements: date and time value.

        Raises:
          ParseError: if a valid date and time value cannot be derived from
              the time elements.
        """
        try:
            time_elements_structure = self._GetValueFromStructure(
                structure, "date_time"
            )

            # With a year there are 7 tokens, without a year there are 6.
            has_year = len(time_elements_structure) == 7

            if has_year:
                (
                    year,
                    month,
                    day_of_month,
                    hours,
                    minutes,
                    seconds,
                    fraction_of_second_string,
                ) = time_elements_structure

            else:
                (
                    month,
                    day_of_month,
                    hours,
                    minutes,
                    seconds,
                    fraction_of_second_string,
                ) = time_elements_structure

                # The year is not in the log line; obtain it from the
                # date-less log format helper.
                self._UpdateYear(month)

                year = self._GetRelativeYear()

            time_zone_offset = self._GetValueFromStructure(
                structure, "time_zone_offset"
            )

            if time_zone_offset:
                # Convert the (sign, hours, minutes) tokens to signed minutes.
                time_zone_sign, time_zone_hours, time_zone_minutes = time_zone_offset

                time_zone_offset = (time_zone_hours * 60) + time_zone_minutes
                if time_zone_sign == "-":
                    time_zone_offset *= -1

            fraction_of_second = int(fraction_of_second_string, 10)

            time_elements_tuple = (
                year,
                month,
                day_of_month,
                hours,
                minutes,
                seconds,
                fraction_of_second,
            )

            # A 3-digit fraction is milliseconds, otherwise (6 digits)
            # microseconds. is_delta is set when the year did not come from
            # the log line itself.
            if len(fraction_of_second_string) == 3:
                date_time = dfdatetime_time_elements.TimeElementsInMilliseconds(
                    is_delta=(not has_year),
                    time_elements_tuple=time_elements_tuple,
                    time_zone_offset=time_zone_offset,
                )
            else:
                date_time = dfdatetime_time_elements.TimeElementsInMicroseconds(
                    is_delta=(not has_year),
                    time_elements_tuple=time_elements_tuple,
                    time_zone_offset=time_zone_offset,
                )

            # Without an explicit offset the value is flagged as local time.
            if time_zone_offset is None:
                date_time.is_local_time = True

            return date_time

        except (IndexError, TypeError, ValueError) as exception:
            raise errors.ParseError(
                f"Unable to parse time elements with error: {exception!s}"
            ) from exception

    def CheckRequiredFormat(self, parser_mediator, text_reader):
        """Check if the log record has the minimal structure required by the plugin.

        Args:
          parser_mediator (ParserMediator): mediates interactions between
              parsers and other components, such as storage and dfVFS.
          text_reader (EncodedTextReader): text reader.

        Returns:
          bool: True if this is the correct plugin, False otherwise.
        """
        try:
            structure = self._VerifyString(text_reader.lines)
        except errors.ParseError:
            return False

        self._SetEstimatedYear(parser_mediator)

        time_elements_structure = self._GetValueFromStructure(structure, "date_time")

        # A "beginning of" marker line has no date and time to validate.
        if time_elements_structure:
            try:
                # _ParseTimeElements looks up "date_time" and
                # "time_zone_offset" itself, so it must be given the full
                # line structure and not the date_time sub-structure.
                self._ParseTimeElements(structure)
            except errors.ParseError:
                return False

        return True
# Register the plugin class with the text log parser at import time.
text_parser.TextLogParser.RegisterPlugin(AndroidLogcatTextPlugin)