Stefan Hajnoczi | 26f7227 | 2010-05-22 19:24:51 +0100 | [diff] [blame] | 1 | #!/usr/bin/env python |
| 2 | # |
| 3 | # Pretty-printer for simple trace backend binary trace files |
| 4 | # |
| 5 | # Copyright IBM, Corp. 2010 |
| 6 | # |
| 7 | # This work is licensed under the terms of the GNU GPL, version 2. See |
| 8 | # the COPYING file in the top-level directory. |
| 9 | # |
Philippe Mathieu-Daudé | 87e0331 | 2017-07-28 19:46:05 -0300 | [diff] [blame] | 10 | # For help see docs/devel/tracing.txt |
Stefan Hajnoczi | 26f7227 | 2010-05-22 19:24:51 +0100 | [diff] [blame] | 11 | |
Stefan Hajnoczi | 26f7227 | 2010-05-22 19:24:51 +0100 | [diff] [blame] | 12 | import struct |
| 13 | import re |
Stefan Hajnoczi | 59da668 | 2011-02-22 13:59:41 +0000 | [diff] [blame] | 14 | import inspect |
Daniel P. Berrange | d1b97bc | 2016-10-04 14:35:56 +0100 | [diff] [blame] | 15 | from tracetool import read_events, Event |
Harsh Prateek Bora | 90a147a | 2012-07-18 15:16:00 +0530 | [diff] [blame] | 16 | from tracetool.backend.simple import is_string |
Stefan Hajnoczi | 26f7227 | 2010-05-22 19:24:51 +0100 | [diff] [blame] | 17 | |
# Expected value of the first field of the trace file header
# (checked in read_trace_header()).
header_event_id = 0xffffffffffffffff
# Expected value of the second field of the trace file header
# (checked in read_trace_header()).
header_magic = 0xf2b177cb0aa429b4
# Event ID in a record header that marks a "dropped events" record
# (see get_record()); such a record carries a single 64-bit value.
dropped_event_id = 0xfffffffffffffffe

# Record type tags read by read_trace_records().  A mapping record assigns
# a name to an event ID; every other type value is parsed as an event
# record (record_type_event itself is not referenced in this file's
# visible code).
record_type_mapping = 0
record_type_event = 1

# struct formats ('=' selects native byte order with standard sizes and no
# padding).
# Trace file header: three 64-bit fields (header event ID, magic, version).
log_header_fmt = '=QQQ'
# Record header: two 64-bit fields followed by two 32-bit fields.
# get_record() uses field 0 as the event ID, field 1 as the timestamp and
# field 3 as the pid; field 2 is not used here (presumably the record
# length -- TODO confirm against the trace writer).
rec_header_fmt = '=QQII'
Stefan Hajnoczi | 26f7227 | 2010-05-22 19:24:51 +0100 | [diff] [blame] | 27 | |
def read_header(fobj, hfmt):
    """Read one fixed-size header from a file and unpack it.

    Args:
        fobj (file): binary input file positioned at the header
        hfmt (str): struct format string describing the header layout

    Returns:
        The tuple produced by struct.unpack(), or None if fewer bytes than
        the format requires could be read.
    """
    expected = struct.calcsize(hfmt)
    raw = fobj.read(expected)
    if len(raw) == expected:
        return struct.unpack(hfmt, raw)
    # Short read: the header is incomplete.
    return None
Stefan Hajnoczi | 26f7227 | 2010-05-22 19:24:51 +0100 | [diff] [blame] | 35 | |
def get_record(edict, idtoname, rechdr, fobj):
    """Deserialize the body of a trace record into a tuple.

    Args:
        edict (str -> Event): events dict, indexed by name
        idtoname (int -> str): event names dict, indexed by event ID
        rechdr (tuple): unpacked record header, or None if no complete
            header could be read
        fobj (file): binary input file positioned just after the header

    Returns:
        None if rechdr is None.  Otherwise a tuple
        (name, timestamp, pid, arg1, ..., argN) where string arguments are
        returned as read from the file and all other arguments as unsigned
        64-bit integers.  For a dropped-events record the tuple is
        ("dropped", timestamp, pid, value).

    Exits the process with status 1 if the event name is not in edict.
    """
    if rechdr is None:
        return None

    event_id = rechdr[0]

    if event_id == dropped_event_id:
        # A dropped-events record carries exactly one 64-bit value.
        rec = ("dropped", rechdr[1], rechdr[3])
        (value,) = struct.unpack('=Q', fobj.read(8))
        return rec + (value,)

    name = idtoname[event_id]
    rec = (name, rechdr[1], rechdr[3])
    try:
        event = edict[name]
    except KeyError as e:
        import sys
        sys.stderr.write('%s event is logged but is not declared '
                         'in the trace events file, try using '
                         'trace-events-all instead.\n' % str(e))
        sys.exit(1)

    for arg_type, _arg_name in event.args:
        if is_string(arg_type):
            # Strings are stored as a 32-bit length followed by the bytes.
            (length,) = struct.unpack('=L', fobj.read(4))
            rec = rec + (fobj.read(length),)
        else:
            # Every non-string argument is stored as a 64-bit value.
            (value,) = struct.unpack('=Q', fobj.read(8))
            rec = rec + (value,)
    return rec
| 68 | |
def get_mapping(fobj):
    """Read an event ID to name mapping record body from a file.

    The body is a 64-bit event ID, a 32-bit name length and then the name
    itself.

    Args:
        fobj (file): binary input file positioned at the mapping body

    Returns:
        An (event_id, name) tuple where name is a native str.
    """
    (event_id,) = struct.unpack('=Q', fobj.read(8))
    (name_len,) = struct.unpack('=L', fobj.read(4))
    name = fobj.read(name_len)
    # On Python 3 a binary file yields bytes, which would never match the
    # str event names used as dictionary keys elsewhere.  On Python 2 the
    # value is already a str and is left untouched.
    if not isinstance(name, str):
        name = name.decode()

    return (event_id, name)
| 75 | |
def read_record(edict, idtoname, fobj):
    """Read one record header and deserialize the record that follows it.

    Returns whatever get_record() produces for that header: a tuple
    (name, timestamp, pid, arg1, ..., arg6), or None when a complete
    record header could not be read.
    """
    return get_record(edict, idtoname,
                      read_header(fobj, rec_header_fmt), fobj)
Harsh Prateek Bora | 90a147a | 2012-07-18 15:16:00 +0530 | [diff] [blame] | 80 | |
def read_trace_header(fobj):
    """Consume the trace file header and check that it is acceptable.

    Args:
        fobj (file): binary input file positioned at the start of the trace

    Raises:
        ValueError: if the header is incomplete, its ID or magic number is
            wrong, or the log format version is unknown or not version 4.
    """
    header = read_header(fobj, log_header_fmt)
    if header is None:
        raise ValueError('Not a valid trace file!')

    event_id, magic, log_version = header
    if event_id != header_event_id:
        raise ValueError('Not a valid trace file, header id %d != %d' %
                         (event_id, header_event_id))
    if magic != header_magic:
        raise ValueError('Not a valid trace file, header magic %d != %d' %
                         (magic, header_magic))

    # Distinguish versions that never existed from versions that did exist
    # but are not handled by this script.
    if log_version not in (0, 2, 3, 4):
        raise ValueError('Unknown version of tracelog format!')
    if log_version != 4:
        raise ValueError('Log format %d not supported with this QEMU release!'
                         % log_version)
Stefan Hajnoczi | 26f7227 | 2010-05-22 19:24:51 +0100 | [diff] [blame] | 99 | |
def read_trace_records(edict, idtoname, fobj):
    """Deserialize trace records from a file, yielding record tuples
    (name, timestamp, pid, arg1, ..., arg6).

    Note that `idtoname` is modified if the file contains mapping records.

    Iteration stops at end of file.  A trace that ends in the middle of a
    record type tag or a record header is treated as ending there, so
    consumers never receive None in place of a record.

    Args:
        edict (str -> Event): events dict, indexed by name
        idtoname (int -> str): event names dict, indexed by event ID
        fobj (file): input file

    """
    rectype_fmt = '=Q'
    rectype_len = struct.calcsize(rectype_fmt)

    while True:
        raw_type = fobj.read(rectype_len)
        if len(raw_type) != rectype_len:
            # Clean end of file, or a truncated tag at the tail.
            break

        (rectype,) = struct.unpack(rectype_fmt, raw_type)
        if rectype == record_type_mapping:
            event_id, name = get_mapping(fobj)
            idtoname[event_id] = name
            continue

        rec = read_record(edict, idtoname, fobj)
        if rec is None:
            # The record header was cut short: nothing more to read.
            break
        yield rec
Stefan Hajnoczi | 26f7227 | 2010-05-22 19:24:51 +0100 | [diff] [blame] | 124 | |
class Analyzer(object):
    """Base class for objects that consume trace records.

    Pass an instance to run() or process().  begin() is called first, then
    every trace record is handled, and end() is called last.

    A record is handled by the method whose name equals the trace event
    name, if there is one; all other records go to catchall().

    Example:
        This method handles the runstate_set(int new_state) trace event::

            def runstate_set(self, new_state):
                ...

        A timestamp argument may be placed before the trace event
        arguments::

            def runstate_set(self, timestamp, new_state):
                ...

        Timestamps have the uint64_t type and are in nanoseconds.

        The pid may be requested in addition to the timestamp, which helps
        when a trace contains records from several processes::

            def runstate_set(self, timestamp, pid, new_state):
                ...
    """

    def begin(self):
        """Hook invoked once before the first trace record."""

    def catchall(self, event, rec):
        """Hook invoked for records that have no dedicated method."""

    def end(self):
        """Hook invoked once after the last trace record."""
| 167 | |
def process(events, log, analyzer, read_header=True):
    """Invoke an analyzer on each event in a log.

    Args:
        events: either the path of a trace-events file (str) or an
            iterable of Event objects that can be iterated more than once
        log: either the path of a binary trace file (str) or an already
            open binary file object
        analyzer (Analyzer): receives begin(), one call per record, end()
        read_header (bool): when true, the trace file header is read and
            verified first.  When false, event IDs are assumed to be the
            positions of the events in `events`.

    Files opened here from path arguments are closed before returning;
    file objects supplied by the caller are left open.
    """
    if isinstance(events, str):
        with open(events, 'r') as events_fobj:
            # Materialize inside the 'with' so the file can be closed.
            events = list(read_events(events_fobj))

    opened_log = isinstance(log, str)
    if opened_log:
        log = open(log, 'rb')

    try:
        if read_header:
            read_trace_header(log)

        dropped_event = Event.build(
            "Dropped_Event(uint64_t num_events_dropped)")
        edict = {"dropped": dropped_event}
        idtoname = {dropped_event_id: "dropped"}

        for event in events:
            edict[event.name] = event

        # If there is no header assume event ID mapping matches events list
        if not read_header:
            for event_id, event in enumerate(events):
                idtoname[event_id] = event.name

        # inspect.getargspec() no longer exists on recent Python 3
        # releases; prefer getfullargspec() whenever it is available.
        getargspec = (getattr(inspect, 'getfullargspec', None) or
                      inspect.getargspec)

        def build_fn(analyzer, event):
            """Return a callable (event, rec) that dispatches one record."""
            if isinstance(event, str):
                return analyzer.catchall

            fn = getattr(analyzer, event.name, None)
            if fn is None:
                return analyzer.catchall

            event_argcount = len(event.args)
            # Subtract one for the bound method's 'self' parameter.
            fn_argcount = len(getargspec(fn)[0]) - 1
            if fn_argcount == event_argcount + 1:
                # Include timestamp as first argument.  rec[1:2] is already
                # a 1-tuple, so it is concatenated directly; wrapping it in
                # another tuple would hand the handler (timestamp,) rather
                # than the timestamp itself.
                return lambda _, rec: fn(*(rec[1:2] +
                                           rec[3:3 + event_argcount]))
            elif fn_argcount == event_argcount + 2:
                # Include timestamp and pid
                return lambda _, rec: fn(*rec[1:3 + event_argcount])
            else:
                # Just arguments, no timestamp or pid
                return lambda _, rec: fn(*rec[3:3 + event_argcount])

        analyzer.begin()
        fn_cache = {}
        for rec in read_trace_records(edict, idtoname, log):
            # Element 0 of a record is the event name.
            event_name = rec[0]
            event = edict[event_name]
            if event_name not in fn_cache:
                fn_cache[event_name] = build_fn(analyzer, event)
            fn_cache[event_name](event, rec)
        analyzer.end()
    finally:
        if opened_log:
            log.close()
| 219 | |
def run(analyzer):
    """Execute an analyzer on a trace file given on the command-line.

    This function is useful as a driver for simple analysis scripts.  More
    advanced scripts will want to call process() instead.

    The command line is `[--no-header] <trace-events> <trace-file>`.  Any
    other argument count prints a usage message to stderr and exits with
    status 1.  When `--no-header` is given it is removed from sys.argv.

    Args:
        analyzer (Analyzer): the analyzer to feed with trace records
    """
    import sys

    read_header = True
    if len(sys.argv) == 4 and sys.argv[1] == '--no-header':
        read_header = False
        del sys.argv[1]
    elif len(sys.argv) != 3:
        sys.stderr.write('usage: %s [--no-header] <trace-events> '
                         '<trace-file>\n' % sys.argv[0])
        sys.exit(1)

    # Close the trace-events file as soon as it has been parsed; the result
    # is materialized first because process() iterates it more than once.
    with open(sys.argv[1], 'r') as events_fobj:
        events = list(read_events(events_fobj))
    process(events, sys.argv[2], analyzer, read_header=read_header)
Stefan Hajnoczi | 59da668 | 2011-02-22 13:59:41 +0000 | [diff] [blame] | 238 | |
if __name__ == '__main__':
    class Formatter(Analyzer):
        """Analyzer that prints every trace record as one line of text."""

        def __init__(self):
            # Timestamp of the previously printed record, None before the
            # first record has been seen.
            self.last_timestamp = None

        def catchall(self, event, rec):
            """Print the event name, time delta, pid and arguments."""
            timestamp = rec[1]
            if self.last_timestamp is None:
                self.last_timestamp = timestamp
            delta_ns = timestamp - self.last_timestamp
            self.last_timestamp = timestamp

            # The delta since the previous record is shown in microseconds.
            fields = [event.name, '%0.3f' % (delta_ns / 1000.0),
                      'pid=%d' % rec[2]]
            # Event arguments start at index 3 of the record tuple.
            for i, (arg_type, arg_name) in enumerate(event.args, 3):
                if is_string(arg_type):
                    fields.append('%s=%s' % (arg_name, rec[i]))
                else:
                    fields.append('%s=0x%x' % (arg_name, rec[i]))
            # Parenthesized single argument works as both the Python 2
            # print statement and the Python 3 print function.
            print(' '.join(fields))

    run(Formatter())