123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307 |
- #!/usr/bin/env python3
- #
- # Pretty-printer for simple trace backend binary trace files
- #
- # Copyright IBM, Corp. 2010
- #
- # This work is licensed under the terms of the GNU GPL, version 2. See
- # the COPYING file in the top-level directory.
- #
- # For help see docs/devel/tracing.rst
- import sys
- import struct
- import inspect
- from tracetool import read_events, Event
- from tracetool.backend.simple import is_string
- __all__ = ['Analyzer', 'process', 'run']
- # This is the binary format that the QEMU "simple" trace backend
- # emits. There is no specification documentation because the format is
- # not guaranteed to be stable. Trace files must be parsed with the
- # same trace-events-all file and the same simpletrace.py file that
- # QEMU was built with.
- header_event_id = 0xffffffffffffffff
- header_magic = 0xf2b177cb0aa429b4
- dropped_event_id = 0xfffffffffffffffe
- record_type_mapping = 0
- record_type_event = 1
- log_header_fmt = '=QQQ'
- rec_header_fmt = '=QQII'
- rec_header_fmt_len = struct.calcsize(rec_header_fmt)
- class SimpleException(Exception):
- pass
- def read_header(fobj, hfmt):
- '''Read a trace record header'''
- hlen = struct.calcsize(hfmt)
- hdr = fobj.read(hlen)
- if len(hdr) != hlen:
- raise SimpleException('Error reading header. Wrong filetype provided?')
- return struct.unpack(hfmt, hdr)
- def get_mapping(fobj):
- (event_id, ) = struct.unpack('=Q', fobj.read(8))
- (len, ) = struct.unpack('=L', fobj.read(4))
- name = fobj.read(len).decode()
- return (event_id, name)
- def read_record(fobj):
- """Deserialize a trace record from a file into a tuple (event_num, timestamp, pid, args)."""
- event_id, timestamp_ns, record_length, record_pid = read_header(fobj, rec_header_fmt)
- args_payload = fobj.read(record_length - rec_header_fmt_len)
- return (event_id, timestamp_ns, record_pid, args_payload)
- def read_trace_header(fobj):
- """Read and verify trace file header"""
- _header_event_id, _header_magic, log_version = read_header(fobj, log_header_fmt)
- if _header_event_id != header_event_id:
- raise ValueError(f'Not a valid trace file, header id {_header_event_id} != {header_event_id}')
- if _header_magic != header_magic:
- raise ValueError(f'Not a valid trace file, header magic {_header_magic} != {header_magic}')
- if log_version not in [0, 2, 3, 4]:
- raise ValueError(f'Unknown version {log_version} of tracelog format!')
- if log_version != 4:
- raise ValueError(f'Log format {log_version} not supported with this QEMU release!')
- def read_trace_records(events, fobj, read_header):
- """Deserialize trace records from a file, yielding record tuples (event, event_num, timestamp, pid, arg1, ..., arg6).
- Args:
- event_mapping (str -> Event): events dict, indexed by name
- fobj (file): input file
- read_header (bool): whether headers were read from fobj
- """
- frameinfo = inspect.getframeinfo(inspect.currentframe())
- dropped_event = Event.build("Dropped_Event(uint64_t num_events_dropped)",
- frameinfo.lineno + 1, frameinfo.filename)
- event_mapping = {e.name: e for e in events}
- event_mapping["dropped"] = dropped_event
- event_id_to_name = {dropped_event_id: "dropped"}
- # If there is no header assume event ID mapping matches events list
- if not read_header:
- for event_id, event in enumerate(events):
- event_id_to_name[event_id] = event.name
- while True:
- t = fobj.read(8)
- if len(t) == 0:
- break
- (rectype, ) = struct.unpack('=Q', t)
- if rectype == record_type_mapping:
- event_id, event_name = get_mapping(fobj)
- event_id_to_name[event_id] = event_name
- else:
- event_id, timestamp_ns, pid, args_payload = read_record(fobj)
- event_name = event_id_to_name[event_id]
- try:
- event = event_mapping[event_name]
- except KeyError as e:
- raise SimpleException(
- f'{e} event is logged but is not declared in the trace events'
- 'file, try using trace-events-all instead.'
- )
- offset = 0
- args = []
- for type, _ in event.args:
- if is_string(type):
- (length,) = struct.unpack_from('=L', args_payload, offset=offset)
- offset += 4
- s = args_payload[offset:offset+length]
- offset += length
- args.append(s)
- else:
- (value,) = struct.unpack_from('=Q', args_payload, offset=offset)
- offset += 8
- args.append(value)
- yield (event_mapping[event_name], event_name, timestamp_ns, pid) + tuple(args)
- class Analyzer:
- """A trace file analyzer which processes trace records.
- An analyzer can be passed to run() or process(). The begin() method is
- invoked, then each trace record is processed, and finally the end() method
- is invoked. When Analyzer is used as a context-manager (using the `with`
- statement), begin() and end() are called automatically.
- If a method matching a trace event name exists, it is invoked to process
- that trace record. Otherwise the catchall() method is invoked.
- Example:
- The following method handles the runstate_set(int new_state) trace event::
- def runstate_set(self, new_state):
- ...
- The method can also take a timestamp argument before the trace event
- arguments::
- def runstate_set(self, timestamp, new_state):
- ...
- Timestamps have the uint64_t type and are in nanoseconds.
- The pid can be included in addition to the timestamp and is useful when
- dealing with traces from multiple processes::
- def runstate_set(self, timestamp, pid, new_state):
- ...
- """
- def begin(self):
- """Called at the start of the trace."""
- pass
- def catchall(self, event, rec):
- """Called if no specific method for processing a trace event has been found."""
- pass
- def _build_fn(self, event):
- fn = getattr(self, event.name, None)
- if fn is None:
- # Return early to avoid costly call to inspect.getfullargspec
- return self.catchall
- event_argcount = len(event.args)
- fn_argcount = len(inspect.getfullargspec(fn)[0]) - 1
- if fn_argcount == event_argcount + 1:
- # Include timestamp as first argument
- return lambda _, rec: fn(*(rec[1:2] + rec[3:3 + event_argcount]))
- elif fn_argcount == event_argcount + 2:
- # Include timestamp and pid
- return lambda _, rec: fn(*rec[1:3 + event_argcount])
- else:
- # Just arguments, no timestamp or pid
- return lambda _, rec: fn(*rec[3:3 + event_argcount])
- def _process_event(self, rec_args, *, event, event_id, timestamp_ns, pid, **kwargs):
- if not hasattr(self, '_fn_cache'):
- # NOTE: Cannot depend on downstream subclasses to have
- # super().__init__() because of legacy.
- self._fn_cache = {}
- rec = (event_id, timestamp_ns, pid, *rec_args)
- if event_id not in self._fn_cache:
- self._fn_cache[event_id] = self._build_fn(event)
- self._fn_cache[event_id](event, rec)
- def end(self):
- """Called at the end of the trace."""
- pass
- def __enter__(self):
- self.begin()
- return self
- def __exit__(self, exc_type, exc_val, exc_tb):
- if exc_type is None:
- self.end()
- return False
- def process(events, log, analyzer, read_header=True):
- """Invoke an analyzer on each event in a log.
- Args:
- events (file-object or list or str): events list or file-like object or file path as str to read event data from
- log (file-object or str): file-like object or file path as str to read log data from
- analyzer (Analyzer): Instance of Analyzer to interpret the event data
- read_header (bool, optional): Whether to read header data from the log data. Defaults to True.
- """
- if isinstance(events, str):
- with open(events, 'r') as f:
- events_list = read_events(f, events)
- elif isinstance(events, list):
- # Treat as a list of events already produced by tracetool.read_events
- events_list = events
- else:
- # Treat as an already opened file-object
- events_list = read_events(events, events.name)
- if isinstance(log, str):
- with open(log, 'rb') as log_fobj:
- _process(events_list, log_fobj, analyzer, read_header)
- else:
- # Treat `log` as an already opened file-object. We will not close it,
- # as we do not own it.
- _process(events_list, log, analyzer, read_header)
- def _process(events, log_fobj, analyzer, read_header=True):
- """Internal function for processing
- Args:
- events (list): list of events already produced by tracetool.read_events
- log_fobj (file): file-object to read log data from
- analyzer (Analyzer): the Analyzer to interpret the event data
- read_header (bool, optional): Whether to read header data from the log data. Defaults to True.
- """
- if read_header:
- read_trace_header(log_fobj)
- with analyzer:
- for event, event_id, timestamp_ns, record_pid, *rec_args in read_trace_records(events, log_fobj, read_header):
- analyzer._process_event(
- rec_args,
- event=event,
- event_id=event_id,
- timestamp_ns=timestamp_ns,
- pid=record_pid,
- )
- def run(analyzer):
- """Execute an analyzer on a trace file given on the command-line.
- This function is useful as a driver for simple analysis scripts. More
- advanced scripts will want to call process() instead."""
- try:
- # NOTE: See built-in `argparse` module for a more robust cli interface
- *no_header, trace_event_path, trace_file_path = sys.argv[1:]
- assert no_header == [] or no_header == ['--no-header'], 'Invalid no-header argument'
- except (AssertionError, ValueError):
- raise SimpleException(f'usage: {sys.argv[0]} [--no-header] <trace-events> <trace-file>\n')
- with open(trace_event_path, 'r') as events_fobj, open(trace_file_path, 'rb') as log_fobj:
- process(events_fobj, log_fobj, analyzer, read_header=not no_header)
- if __name__ == '__main__':
- class Formatter(Analyzer):
- def __init__(self):
- self.last_timestamp = None
- def catchall(self, event, rec):
- timestamp = rec[1]
- if self.last_timestamp is None:
- self.last_timestamp = timestamp
- delta_ns = timestamp - self.last_timestamp
- self.last_timestamp = timestamp
- fields = [event.name, '%0.3f' % (delta_ns / 1000.0),
- 'pid=%d' % rec[2]]
- i = 3
- for type, name in event.args:
- if is_string(type):
- fields.append('%s=%s' % (name, rec[i]))
- else:
- fields.append('%s=0x%x' % (name, rec[i]))
- i += 1
- print(' '.join(fields))
- try:
- run(Formatter())
- except SimpleException as e:
- sys.stderr.write(str(e) + "\n")
- sys.exit(1)
|