By moving the dynamic argument construction to keyword-arguments, we can remove all of the specialized handling, and streamline it. If a tracing method wants to access these, they can define the kwargs, or ignore it be placing `**kwargs` at the end of the function's arguments list. Added deprecation warning to Analyzer class to make users aware of the Analyzer2 class. No removal date is planned. Signed-off-by: Mads Ynddal <m.ynddal@samsung.com> Message-id: 20230926103436.25700-13-mads@ynddal.dk Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com>
		
			
				
	
	
		
			360 lines
		
	
	
		
			13 KiB
		
	
	
	
		
			Python
		
	
	
		
			Executable File
		
	
	
	
	
			
		
		
	
	
			360 lines
		
	
	
		
			13 KiB
		
	
	
	
		
			Python
		
	
	
		
			Executable File
		
	
	
	
	
| #!/usr/bin/env python3
 | |
| #
 | |
| # Pretty-printer for simple trace backend binary trace files
 | |
| #
 | |
| # Copyright IBM, Corp. 2010
 | |
| #
 | |
| # This work is licensed under the terms of the GNU GPL, version 2.  See
 | |
| # the COPYING file in the top-level directory.
 | |
| #
 | |
| # For help see docs/devel/tracing.rst
 | |
| 
 | |
| import sys
 | |
| import struct
 | |
| import inspect
 | |
| import warnings
 | |
| from tracetool import read_events, Event
 | |
| from tracetool.backend.simple import is_string
 | |
| 
 | |
| __all__ = ['Analyzer', 'Analyzer2', 'process', 'run']
 | |
| 
 | |
| # This is the binary format that the QEMU "simple" trace backend
 | |
| # emits. There is no specification documentation because the format is
 | |
| # not guaranteed to be stable. Trace files must be parsed with the
 | |
| # same trace-events-all file and the same simpletrace.py file that
 | |
| # QEMU was built with.
 | |
| header_event_id = 0xffffffffffffffff
 | |
| header_magic    = 0xf2b177cb0aa429b4
 | |
| dropped_event_id = 0xfffffffffffffffe
 | |
| 
 | |
| record_type_mapping = 0
 | |
| record_type_event = 1
 | |
| 
 | |
| log_header_fmt = '=QQQ'
 | |
| rec_header_fmt = '=QQII'
 | |
| rec_header_fmt_len = struct.calcsize(rec_header_fmt)
 | |
| 
 | |
| class SimpleException(Exception):
 | |
|     pass
 | |
| 
 | |
| def read_header(fobj, hfmt):
 | |
|     '''Read a trace record header'''
 | |
|     hlen = struct.calcsize(hfmt)
 | |
|     hdr = fobj.read(hlen)
 | |
|     if len(hdr) != hlen:
 | |
|         raise SimpleException('Error reading header. Wrong filetype provided?')
 | |
|     return struct.unpack(hfmt, hdr)
 | |
| 
 | |
| def get_mapping(fobj):
 | |
|     (event_id, ) = struct.unpack('=Q', fobj.read(8))
 | |
|     (len, ) = struct.unpack('=L', fobj.read(4))
 | |
|     name = fobj.read(len).decode()
 | |
| 
 | |
|     return (event_id, name)
 | |
| 
 | |
| def read_record(fobj):
 | |
|     """Deserialize a trace record from a file into a tuple (event_num, timestamp, pid, args)."""
 | |
|     event_id, timestamp_ns, record_length, record_pid = read_header(fobj, rec_header_fmt)
 | |
|     args_payload = fobj.read(record_length - rec_header_fmt_len)
 | |
|     return (event_id, timestamp_ns, record_pid, args_payload)
 | |
| 
 | |
| def read_trace_header(fobj):
 | |
|     """Read and verify trace file header"""
 | |
|     _header_event_id, _header_magic, log_version = read_header(fobj, log_header_fmt)
 | |
|     if _header_event_id != header_event_id:
 | |
|         raise ValueError(f'Not a valid trace file, header id {_header_event_id} != {header_event_id}')
 | |
|     if _header_magic != header_magic:
 | |
|         raise ValueError(f'Not a valid trace file, header magic {_header_magic} != {header_magic}')
 | |
| 
 | |
|     if log_version not in [0, 2, 3, 4]:
 | |
|         raise ValueError(f'Unknown version {log_version} of tracelog format!')
 | |
|     if log_version != 4:
 | |
|         raise ValueError(f'Log format {log_version} not supported with this QEMU release!')
 | |
| 
 | |
| def read_trace_records(events, fobj, read_header):
 | |
|     """Deserialize trace records from a file, yielding record tuples (event, event_num, timestamp, pid, arg1, ..., arg6).
 | |
| 
 | |
|     Args:
 | |
|         event_mapping (str -> Event): events dict, indexed by name
 | |
|         fobj (file): input file
 | |
|         read_header (bool): whether headers were read from fobj
 | |
| 
 | |
|     """
 | |
|     frameinfo = inspect.getframeinfo(inspect.currentframe())
 | |
|     dropped_event = Event.build("Dropped_Event(uint64_t num_events_dropped)",
 | |
|                                 frameinfo.lineno + 1, frameinfo.filename)
 | |
| 
 | |
|     event_mapping = {e.name: e for e in events}
 | |
|     event_mapping["dropped"] = dropped_event
 | |
|     event_id_to_name = {dropped_event_id: "dropped"}
 | |
| 
 | |
|     # If there is no header assume event ID mapping matches events list
 | |
|     if not read_header:
 | |
|         for event_id, event in enumerate(events):
 | |
|             event_id_to_name[event_id] = event.name
 | |
| 
 | |
|     while True:
 | |
|         t = fobj.read(8)
 | |
|         if len(t) == 0:
 | |
|             break
 | |
| 
 | |
|         (rectype, ) = struct.unpack('=Q', t)
 | |
|         if rectype == record_type_mapping:
 | |
|             event_id, event_name = get_mapping(fobj)
 | |
|             event_id_to_name[event_id] = event_name
 | |
|         else:
 | |
|             event_id, timestamp_ns, pid, args_payload = read_record(fobj)
 | |
|             event_name = event_id_to_name[event_id]
 | |
| 
 | |
|             try:
 | |
|                 event = event_mapping[event_name]
 | |
|             except KeyError as e:
 | |
|                 raise SimpleException(
 | |
|                     f'{e} event is logged but is not declared in the trace events'
 | |
|                     'file, try using trace-events-all instead.'
 | |
|                 )
 | |
| 
 | |
|             offset = 0
 | |
|             args = []
 | |
|             for type, _ in event.args:
 | |
|                 if is_string(type):
 | |
|                     (length,) = struct.unpack_from('=L', args_payload, offset=offset)
 | |
|                     offset += 4
 | |
|                     s = args_payload[offset:offset+length]
 | |
|                     offset += length
 | |
|                     args.append(s)
 | |
|                 else:
 | |
|                     (value,) = struct.unpack_from('=Q', args_payload, offset=offset)
 | |
|                     offset += 8
 | |
|                     args.append(value)
 | |
| 
 | |
|             yield (event_mapping[event_name], event_name, timestamp_ns, pid) + tuple(args)
 | |
| 
 | |
| class Analyzer:
 | |
|     """[Deprecated. Refer to Analyzer2 instead.]
 | |
| 
 | |
|     A trace file analyzer which processes trace records.
 | |
| 
 | |
|     An analyzer can be passed to run() or process().  The begin() method is
 | |
|     invoked, then each trace record is processed, and finally the end() method
 | |
|     is invoked. When Analyzer is used as a context-manager (using the `with`
 | |
|     statement), begin() and end() are called automatically.
 | |
| 
 | |
|     If a method matching a trace event name exists, it is invoked to process
 | |
|     that trace record.  Otherwise the catchall() method is invoked.
 | |
| 
 | |
|     Example:
 | |
|     The following method handles the runstate_set(int new_state) trace event::
 | |
| 
 | |
|       def runstate_set(self, new_state):
 | |
|           ...
 | |
| 
 | |
|     The method can also take a timestamp argument before the trace event
 | |
|     arguments::
 | |
| 
 | |
|       def runstate_set(self, timestamp, new_state):
 | |
|           ...
 | |
| 
 | |
|     Timestamps have the uint64_t type and are in nanoseconds.
 | |
| 
 | |
|     The pid can be included in addition to the timestamp and is useful when
 | |
|     dealing with traces from multiple processes::
 | |
| 
 | |
|       def runstate_set(self, timestamp, pid, new_state):
 | |
|           ...
 | |
|     """
 | |
| 
 | |
|     def begin(self):
 | |
|         """Called at the start of the trace."""
 | |
|         pass
 | |
| 
 | |
|     def catchall(self, event, rec):
 | |
|         """Called if no specific method for processing a trace event has been found."""
 | |
|         pass
 | |
| 
 | |
|     def _build_fn(self, event):
 | |
|         fn = getattr(self, event.name, None)
 | |
|         if fn is None:
 | |
|             # Return early to avoid costly call to inspect.getfullargspec
 | |
|             return self.catchall
 | |
| 
 | |
|         event_argcount = len(event.args)
 | |
|         fn_argcount = len(inspect.getfullargspec(fn)[0]) - 1
 | |
|         if fn_argcount == event_argcount + 1:
 | |
|             # Include timestamp as first argument
 | |
|             return lambda _, rec: fn(*(rec[1:2] + rec[3:3 + event_argcount]))
 | |
|         elif fn_argcount == event_argcount + 2:
 | |
|             # Include timestamp and pid
 | |
|             return lambda _, rec: fn(*rec[1:3 + event_argcount])
 | |
|         else:
 | |
|             # Just arguments, no timestamp or pid
 | |
|             return lambda _, rec: fn(*rec[3:3 + event_argcount])
 | |
| 
 | |
|     def _process_event(self, rec_args, *, event, event_id, timestamp_ns, pid, **kwargs):
 | |
|         warnings.warn(
 | |
|             "Use of deprecated Analyzer class. Refer to Analyzer2 instead.",
 | |
|             DeprecationWarning,
 | |
|         )
 | |
| 
 | |
|         if not hasattr(self, '_fn_cache'):
 | |
|             # NOTE: Cannot depend on downstream subclasses to have
 | |
|             # super().__init__() because of legacy.
 | |
|             self._fn_cache = {}
 | |
| 
 | |
|         rec = (event_id, timestamp_ns, pid, *rec_args)
 | |
|         if event_id not in self._fn_cache:
 | |
|             self._fn_cache[event_id] = self._build_fn(event)
 | |
|         self._fn_cache[event_id](event, rec)
 | |
| 
 | |
|     def end(self):
 | |
|         """Called at the end of the trace."""
 | |
|         pass
 | |
| 
 | |
|     def __enter__(self):
 | |
|         self.begin()
 | |
|         return self
 | |
| 
 | |
|     def __exit__(self, exc_type, exc_val, exc_tb):
 | |
|         if exc_type is None:
 | |
|             self.end()
 | |
|         return False
 | |
| 
 | |
| class Analyzer2(Analyzer):
 | |
|     """A trace file analyzer which processes trace records.
 | |
| 
 | |
|     An analyzer can be passed to run() or process().  The begin() method is
 | |
|     invoked, then each trace record is processed, and finally the end() method
 | |
|     is invoked. When Analyzer is used as a context-manager (using the `with`
 | |
|     statement), begin() and end() are called automatically.
 | |
| 
 | |
|     If a method matching a trace event name exists, it is invoked to process
 | |
|     that trace record.  Otherwise the catchall() method is invoked.
 | |
| 
 | |
|     The methods are called with a set of keyword-arguments. These can be ignored
 | |
|     using `**kwargs` or defined like any keyword-argument.
 | |
| 
 | |
|     The following keyword-arguments are available, but make sure to have an
 | |
|     **kwargs to allow for unmatched arguments in the future:
 | |
|         event: Event object of current trace
 | |
|         event_id: The id of the event in the current trace file
 | |
|         timestamp_ns: The timestamp in nanoseconds of the trace
 | |
|         pid: The process id recorded for the given trace
 | |
| 
 | |
|     Example:
 | |
|     The following method handles the runstate_set(int new_state) trace event::
 | |
| 
 | |
|       def runstate_set(self, new_state, **kwargs):
 | |
|           ...
 | |
| 
 | |
|     The method can also explicitly take a timestamp keyword-argument with the
 | |
|     trace event arguments::
 | |
| 
 | |
|       def runstate_set(self, new_state, *, timestamp_ns, **kwargs):
 | |
|           ...
 | |
| 
 | |
|     Timestamps have the uint64_t type and are in nanoseconds.
 | |
| 
 | |
|     The pid can be included in addition to the timestamp and is useful when
 | |
|     dealing with traces from multiple processes:
 | |
| 
 | |
|       def runstate_set(self, new_state, *, timestamp_ns, pid, **kwargs):
 | |
|           ...
 | |
|     """
 | |
| 
 | |
|     def catchall(self, *rec_args, event, timestamp_ns, pid, event_id, **kwargs):
 | |
|         """Called if no specific method for processing a trace event has been found."""
 | |
|         pass
 | |
| 
 | |
|     def _process_event(self, rec_args, *, event, **kwargs):
 | |
|         fn = getattr(self, event.name, self.catchall)
 | |
|         fn(*rec_args, event=event, **kwargs)
 | |
| 
 | |
| def process(events, log, analyzer, read_header=True):
 | |
|     """Invoke an analyzer on each event in a log.
 | |
|     Args:
 | |
|         events (file-object or list or str): events list or file-like object or file path as str to read event data from
 | |
|         log (file-object or str): file-like object or file path as str to read log data from
 | |
|         analyzer (Analyzer): Instance of Analyzer to interpret the event data
 | |
|         read_header (bool, optional): Whether to read header data from the log data. Defaults to True.
 | |
|     """
 | |
| 
 | |
|     if isinstance(events, str):
 | |
|         with open(events, 'r') as f:
 | |
|             events_list = read_events(f, events)
 | |
|     elif isinstance(events, list):
 | |
|         # Treat as a list of events already produced by tracetool.read_events
 | |
|         events_list = events
 | |
|     else:
 | |
|         # Treat as an already opened file-object
 | |
|         events_list = read_events(events, events.name)
 | |
| 
 | |
|     if isinstance(log, str):
 | |
|         with open(log, 'rb') as log_fobj:
 | |
|             _process(events_list, log_fobj, analyzer, read_header)
 | |
|     else:
 | |
|         # Treat `log` as an already opened file-object. We will not close it,
 | |
|         # as we do not own it.
 | |
|         _process(events_list, log, analyzer, read_header)
 | |
| 
 | |
| def _process(events, log_fobj, analyzer, read_header=True):
 | |
|     """Internal function for processing
 | |
| 
 | |
|     Args:
 | |
|         events (list): list of events already produced by tracetool.read_events
 | |
|         log_fobj (file): file-object to read log data from
 | |
|         analyzer (Analyzer): the Analyzer to interpret the event data
 | |
|         read_header (bool, optional): Whether to read header data from the log data. Defaults to True.
 | |
|     """
 | |
| 
 | |
|     if read_header:
 | |
|         read_trace_header(log_fobj)
 | |
| 
 | |
|     with analyzer:
 | |
|         for event, event_id, timestamp_ns, record_pid, *rec_args in read_trace_records(events, log_fobj, read_header):
 | |
|             analyzer._process_event(
 | |
|                 rec_args,
 | |
|                 event=event,
 | |
|                 event_id=event_id,
 | |
|                 timestamp_ns=timestamp_ns,
 | |
|                 pid=record_pid,
 | |
|             )
 | |
| 
 | |
| def run(analyzer):
 | |
|     """Execute an analyzer on a trace file given on the command-line.
 | |
| 
 | |
|     This function is useful as a driver for simple analysis scripts.  More
 | |
|     advanced scripts will want to call process() instead."""
 | |
| 
 | |
|     try:
 | |
|         # NOTE: See built-in `argparse` module for a more robust cli interface
 | |
|         *no_header, trace_event_path, trace_file_path = sys.argv[1:]
 | |
|         assert no_header == [] or no_header == ['--no-header'], 'Invalid no-header argument'
 | |
|     except (AssertionError, ValueError):
 | |
|         raise SimpleException(f'usage: {sys.argv[0]} [--no-header] <trace-events> <trace-file>\n')
 | |
| 
 | |
|     with open(trace_event_path, 'r') as events_fobj, open(trace_file_path, 'rb') as log_fobj:
 | |
|         process(events_fobj, log_fobj, analyzer, read_header=not no_header)
 | |
| 
 | |
| if __name__ == '__main__':
 | |
|     class Formatter2(Analyzer2):
 | |
|         def __init__(self):
 | |
|             self.last_timestamp_ns = None
 | |
| 
 | |
|         def catchall(self, *rec_args, event, timestamp_ns, pid, event_id):
 | |
|             if self.last_timestamp_ns is None:
 | |
|                 self.last_timestamp_ns = timestamp_ns
 | |
|             delta_ns = timestamp_ns - self.last_timestamp_ns
 | |
|             self.last_timestamp_ns = timestamp_ns
 | |
| 
 | |
|             fields = [
 | |
|                 f'{name}={r}' if is_string(type) else f'{name}=0x{r:x}'
 | |
|                 for r, (type, name) in zip(rec_args, event.args)
 | |
|             ]
 | |
|             print(f'{event.name} {delta_ns / 1000:0.3f} {pid=} ' + ' '.join(fields))
 | |
| 
 | |
|     try:
 | |
|         run(Formatter2())
 | |
|     except SimpleException as e:
 | |
|         sys.stderr.write(str(e) + "\n")
 | |
|         sys.exit(1)
 |