simpletrace.py 9.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288
  1. #!/usr/bin/env python3
  2. #
  3. # Pretty-printer for simple trace backend binary trace files
  4. #
  5. # Copyright IBM, Corp. 2010
  6. #
  7. # This work is licensed under the terms of the GNU GPL, version 2. See
  8. # the COPYING file in the top-level directory.
  9. #
  10. # For help see docs/devel/tracing.rst
  11. import sys
  12. import struct
  13. import inspect
  14. from tracetool import read_events, Event
  15. from tracetool.backend.simple import is_string
  16. __all__ = ['Analyzer', 'process', 'run']
  17. # This is the binary format that the QEMU "simple" trace backend
  18. # emits. There is no specification documentation because the format is
  19. # not guaranteed to be stable. Trace files must be parsed with the
  20. # same trace-events-all file and the same simpletrace.py file that
  21. # QEMU was built with.
  22. header_event_id = 0xffffffffffffffff
  23. header_magic = 0xf2b177cb0aa429b4
  24. dropped_event_id = 0xfffffffffffffffe
  25. record_type_mapping = 0
  26. record_type_event = 1
  27. log_header_fmt = '=QQQ'
  28. rec_header_fmt = '=QQII'
  29. def read_header(fobj, hfmt):
  30. '''Read a trace record header'''
  31. hlen = struct.calcsize(hfmt)
  32. hdr = fobj.read(hlen)
  33. if len(hdr) != hlen:
  34. return None
  35. return struct.unpack(hfmt, hdr)
  36. def get_record(event_mapping, event_id_to_name, rechdr, fobj):
  37. """Deserialize a trace record from a file into a tuple
  38. (name, timestamp, pid, arg1, ..., arg6)."""
  39. if rechdr is None:
  40. return None
  41. if rechdr[0] != dropped_event_id:
  42. event_id = rechdr[0]
  43. name = event_id_to_name[event_id]
  44. rec = (name, rechdr[1], rechdr[3])
  45. try:
  46. event = event_mapping[name]
  47. except KeyError as e:
  48. sys.stderr.write('%s event is logged but is not declared ' \
  49. 'in the trace events file, try using ' \
  50. 'trace-events-all instead.\n' % str(e))
  51. sys.exit(1)
  52. for type, name in event.args:
  53. if is_string(type):
  54. l = fobj.read(4)
  55. (len,) = struct.unpack('=L', l)
  56. s = fobj.read(len)
  57. rec = rec + (s,)
  58. else:
  59. (value,) = struct.unpack('=Q', fobj.read(8))
  60. rec = rec + (value,)
  61. else:
  62. rec = ("dropped", rechdr[1], rechdr[3])
  63. (value,) = struct.unpack('=Q', fobj.read(8))
  64. rec = rec + (value,)
  65. return rec
  66. def get_mapping(fobj):
  67. (event_id, ) = struct.unpack('=Q', fobj.read(8))
  68. (len, ) = struct.unpack('=L', fobj.read(4))
  69. name = fobj.read(len).decode()
  70. return (event_id, name)
  71. def read_record(event_mapping, event_id_to_name, fobj):
  72. """Deserialize a trace record from a file into a tuple (event_num, timestamp, pid, arg1, ..., arg6)."""
  73. rechdr = read_header(fobj, rec_header_fmt)
  74. return get_record(event_mapping, event_id_to_name, rechdr, fobj)
  75. def read_trace_header(fobj):
  76. """Read and verify trace file header"""
  77. header = read_header(fobj, log_header_fmt)
  78. if header is None:
  79. raise ValueError('Not a valid trace file!')
  80. if header[0] != header_event_id:
  81. raise ValueError('Not a valid trace file, header id %d != %d' %
  82. (header[0], header_event_id))
  83. if header[1] != header_magic:
  84. raise ValueError('Not a valid trace file, header magic %d != %d' %
  85. (header[1], header_magic))
  86. log_version = header[2]
  87. if log_version not in [0, 2, 3, 4]:
  88. raise ValueError('Unknown version of tracelog format!')
  89. if log_version != 4:
  90. raise ValueError('Log format %d not supported with this QEMU release!'
  91. % log_version)
  92. def read_trace_records(event_mapping, event_id_to_name, fobj):
  93. """Deserialize trace records from a file, yielding record tuples (event_num, timestamp, pid, arg1, ..., arg6).
  94. Note that `event_id_to_name` is modified if the file contains mapping records.
  95. Args:
  96. event_mapping (str -> Event): events dict, indexed by name
  97. event_id_to_name (int -> str): event names dict, indexed by event ID
  98. fobj (file): input file
  99. """
  100. while True:
  101. t = fobj.read(8)
  102. if len(t) == 0:
  103. break
  104. (rectype, ) = struct.unpack('=Q', t)
  105. if rectype == record_type_mapping:
  106. event_id, name = get_mapping(fobj)
  107. event_id_to_name[event_id] = name
  108. else:
  109. rec = read_record(event_mapping, event_id_to_name, fobj)
  110. yield rec
  111. class Analyzer(object):
  112. """A trace file analyzer which processes trace records.
  113. An analyzer can be passed to run() or process(). The begin() method is
  114. invoked, then each trace record is processed, and finally the end() method
  115. is invoked.
  116. If a method matching a trace event name exists, it is invoked to process
  117. that trace record. Otherwise the catchall() method is invoked.
  118. Example:
  119. The following method handles the runstate_set(int new_state) trace event::
  120. def runstate_set(self, new_state):
  121. ...
  122. The method can also take a timestamp argument before the trace event
  123. arguments::
  124. def runstate_set(self, timestamp, new_state):
  125. ...
  126. Timestamps have the uint64_t type and are in nanoseconds.
  127. The pid can be included in addition to the timestamp and is useful when
  128. dealing with traces from multiple processes::
  129. def runstate_set(self, timestamp, pid, new_state):
  130. ...
  131. """
  132. def begin(self):
  133. """Called at the start of the trace."""
  134. pass
  135. def catchall(self, event, rec):
  136. """Called if no specific method for processing a trace event has been found."""
  137. pass
  138. def end(self):
  139. """Called at the end of the trace."""
  140. pass
  141. def process(events, log, analyzer, read_header=True):
  142. """Invoke an analyzer on each event in a log.
  143. Args:
  144. events (file-object or list or str): events list or file-like object or file path as str to read event data from
  145. log (file-object or str): file-like object or file path as str to read log data from
  146. analyzer (Analyzer): Instance of Analyzer to interpret the event data
  147. read_header (bool, optional): Whether to read header data from the log data. Defaults to True.
  148. """
  149. if isinstance(events, str):
  150. with open(events, 'r') as f:
  151. events_list = read_events(f, events)
  152. elif isinstance(events, list):
  153. # Treat as a list of events already produced by tracetool.read_events
  154. events_list = events
  155. else:
  156. # Treat as an already opened file-object
  157. events_list = read_events(events, events.name)
  158. close_log = False
  159. if isinstance(log, str):
  160. log = open(log, 'rb')
  161. close_log = True
  162. if read_header:
  163. read_trace_header(log)
  164. frameinfo = inspect.getframeinfo(inspect.currentframe())
  165. dropped_event = Event.build("Dropped_Event(uint64_t num_events_dropped)",
  166. frameinfo.lineno + 1, frameinfo.filename)
  167. event_mapping = {"dropped": dropped_event}
  168. event_id_to_name = {dropped_event_id: "dropped"}
  169. for event in events_list:
  170. event_mapping[event.name] = event
  171. # If there is no header assume event ID mapping matches events list
  172. if not read_header:
  173. for event_id, event in enumerate(events_list):
  174. event_id_to_name[event_id] = event.name
  175. def build_fn(analyzer, event):
  176. if isinstance(event, str):
  177. return analyzer.catchall
  178. fn = getattr(analyzer, event.name, None)
  179. if fn is None:
  180. return analyzer.catchall
  181. event_argcount = len(event.args)
  182. fn_argcount = len(inspect.getfullargspec(fn)[0]) - 1
  183. if fn_argcount == event_argcount + 1:
  184. # Include timestamp as first argument
  185. return lambda _, rec: fn(*(rec[1:2] + rec[3:3 + event_argcount]))
  186. elif fn_argcount == event_argcount + 2:
  187. # Include timestamp and pid
  188. return lambda _, rec: fn(*rec[1:3 + event_argcount])
  189. else:
  190. # Just arguments, no timestamp or pid
  191. return lambda _, rec: fn(*rec[3:3 + event_argcount])
  192. analyzer.begin()
  193. fn_cache = {}
  194. for rec in read_trace_records(event_mapping, event_id_to_name, log):
  195. event_num = rec[0]
  196. event = event_mapping[event_num]
  197. if event_num not in fn_cache:
  198. fn_cache[event_num] = build_fn(analyzer, event)
  199. fn_cache[event_num](event, rec)
  200. analyzer.end()
  201. if close_log:
  202. log.close()
  203. def run(analyzer):
  204. """Execute an analyzer on a trace file given on the command-line.
  205. This function is useful as a driver for simple analysis scripts. More
  206. advanced scripts will want to call process() instead."""
  207. try:
  208. # NOTE: See built-in `argparse` module for a more robust cli interface
  209. *no_header, trace_event_path, trace_file_path = sys.argv[1:]
  210. assert no_header == [] or no_header == ['--no-header'], 'Invalid no-header argument'
  211. except (AssertionError, ValueError):
  212. sys.stderr.write(f'usage: {sys.argv[0]} [--no-header] <trace-events> <trace-file>\n')
  213. sys.exit(1)
  214. with open(trace_event_path, 'r') as events_fobj, open(trace_file_path, 'rb') as log_fobj:
  215. process(events_fobj, log_fobj, analyzer, read_header=not no_header)
  216. if __name__ == '__main__':
  217. class Formatter(Analyzer):
  218. def __init__(self):
  219. self.last_timestamp = None
  220. def catchall(self, event, rec):
  221. timestamp = rec[1]
  222. if self.last_timestamp is None:
  223. self.last_timestamp = timestamp
  224. delta_ns = timestamp - self.last_timestamp
  225. self.last_timestamp = timestamp
  226. fields = [event.name, '%0.3f' % (delta_ns / 1000.0),
  227. 'pid=%d' % rec[2]]
  228. i = 3
  229. for type, name in event.args:
  230. if is_string(type):
  231. fields.append('%s=%s' % (name, rec[i]))
  232. else:
  233. fields.append('%s=0x%x' % (name, rec[i]))
  234. i += 1
  235. print(' '.join(fields))
  236. run(Formatter())