blob: a65d0a364d40d47f1f869515712bb177f775e2b6 [file] [log] [blame]
#!/usr/bin/python
#
# top-like utility for displaying kvm statistics
#
# Copyright 2006-2008 Qumranet Technologies
# Copyright 2008-2011 Red Hat, Inc.
#
# Authors:
#  Avi Kivity <avi@redhat.com>
#
# This work is licensed under the terms of the GNU GPL, version 2.  See
# the COPYING file in the top-level directory.
13
14import curses
15import sys, os, time, optparse
16
class DebugfsProvider(object):
    """Statistics provider that reads one integer per file from a directory.

    Every directory entry is treated as a field; the content of the file
    with that name is parsed with int().
    """

    def __init__(self, base='/sys/kernel/debug/kvm'):
        """List the directory and start with every entry selected.

        base -- directory holding one file per counter.  The default is the
                path that used to be hard-coded here.
        """
        self.base = base
        self._fields = os.listdir(self.base)

    def fields(self):
        """Return the currently selected field names."""
        return self._fields

    def select(self, fields):
        """Make *fields* the set returned by fields() and read()."""
        self._fields = fields

    def read(self):
        """Return a dict mapping every selected field to its integer value."""
        def val(key):
            # open() exists on Python 2 and 3 (file() does not), and the
            # with-block closes the handle instead of leaving it to the GC.
            with open(self.base + '/' + key) as counter:
                return int(counter.read())
        return dict((key, val(key)) for key in self._fields)
29
# Exit-reason number -> name table selected when the 'vmx' CPU flag is found
# (see x86_exit_reasons).  The numbering is sparse.
vmx_exit_reasons = dict([
    (0, 'EXCEPTION_NMI'),
    (1, 'EXTERNAL_INTERRUPT'),
    (2, 'TRIPLE_FAULT'),
    (7, 'PENDING_INTERRUPT'),
    (8, 'NMI_WINDOW'),
    (9, 'TASK_SWITCH'),
    (10, 'CPUID'),
    (12, 'HLT'),
    (14, 'INVLPG'),
    (15, 'RDPMC'),
    (16, 'RDTSC'),
    (18, 'VMCALL'),
    (19, 'VMCLEAR'),
    (20, 'VMLAUNCH'),
    (21, 'VMPTRLD'),
    (22, 'VMPTRST'),
    (23, 'VMREAD'),
    (24, 'VMRESUME'),
    (25, 'VMWRITE'),
    (26, 'VMOFF'),
    (27, 'VMON'),
    (28, 'CR_ACCESS'),
    (29, 'DR_ACCESS'),
    (30, 'IO_INSTRUCTION'),
    (31, 'MSR_READ'),
    (32, 'MSR_WRITE'),
    (33, 'INVALID_STATE'),
    (36, 'MWAIT_INSTRUCTION'),
    (39, 'MONITOR_INSTRUCTION'),
    (40, 'PAUSE_INSTRUCTION'),
    (41, 'MCE_DURING_VMENTRY'),
    (43, 'TPR_BELOW_THRESHOLD'),
    (44, 'APIC_ACCESS'),
    (48, 'EPT_VIOLATION'),
    (49, 'EPT_MISCONFIG'),
    (54, 'WBINVD'),
    (55, 'XSETBV'),
])
69
# Exit-reason number -> name table selected when the 'svm' CPU flag is found
# (see x86_exit_reasons).
svm_exit_reasons = {
    # control register reads
    0x000: 'READ_CR0',
    0x003: 'READ_CR3',
    0x004: 'READ_CR4',
    0x008: 'READ_CR8',

    # control register writes
    0x010: 'WRITE_CR0',
    0x013: 'WRITE_CR3',
    0x014: 'WRITE_CR4',
    0x018: 'WRITE_CR8',

    # debug register reads
    0x020: 'READ_DR0',
    0x021: 'READ_DR1',
    0x022: 'READ_DR2',
    0x023: 'READ_DR3',
    0x024: 'READ_DR4',
    0x025: 'READ_DR5',
    0x026: 'READ_DR6',
    0x027: 'READ_DR7',

    # debug register writes
    0x030: 'WRITE_DR0',
    0x031: 'WRITE_DR1',
    0x032: 'WRITE_DR2',
    0x033: 'WRITE_DR3',
    0x034: 'WRITE_DR4',
    0x035: 'WRITE_DR5',
    0x036: 'WRITE_DR6',
    0x037: 'WRITE_DR7',

    0x040: 'EXCP_BASE',

    # 0x060 - 0x06f
    0x060: 'INTR',
    0x061: 'NMI',
    0x062: 'SMI',
    0x063: 'INIT',
    0x064: 'VINTR',
    0x065: 'CR0_SEL_WRITE',
    0x066: 'IDTR_READ',
    0x067: 'GDTR_READ',
    0x068: 'LDTR_READ',
    0x069: 'TR_READ',
    0x06a: 'IDTR_WRITE',
    0x06b: 'GDTR_WRITE',
    0x06c: 'LDTR_WRITE',
    0x06d: 'TR_WRITE',
    0x06e: 'RDTSC',
    0x06f: 'RDPMC',

    # 0x070 - 0x07f
    0x070: 'PUSHF',
    0x071: 'POPF',
    0x072: 'CPUID',
    0x073: 'RSM',
    0x074: 'IRET',
    0x075: 'SWINT',
    0x076: 'INVD',
    0x077: 'PAUSE',
    0x078: 'HLT',
    0x079: 'INVLPG',
    0x07a: 'INVLPGA',
    0x07b: 'IOIO',
    0x07c: 'MSR',
    0x07d: 'TASK_SWITCH',
    0x07e: 'FERR_FREEZE',
    0x07f: 'SHUTDOWN',

    # 0x080 - 0x08c
    0x080: 'VMRUN',
    0x081: 'VMMCALL',
    0x082: 'VMLOAD',
    0x083: 'VMSAVE',
    0x084: 'STGI',
    0x085: 'CLGI',
    0x086: 'SKINIT',
    0x087: 'RDTSCP',
    0x088: 'ICEBP',
    0x089: 'WBINVD',
    0x08a: 'MONITOR',
    0x08b: 'MWAIT',
    0x08c: 'MWAIT_COND',

    0x400: 'NPF',
}
143
# From include/uapi/linux/kvm.h, KVM_EXIT_xxx
# The numbers are contiguous from 0, so the table is built by position.
userspace_exit_reasons = dict(enumerate((
    'UNKNOWN',          # 0
    'EXCEPTION',        # 1
    'IO',               # 2
    'HYPERCALL',        # 3
    'DEBUG',            # 4
    'HLT',              # 5
    'MMIO',             # 6
    'IRQ_WINDOW_OPEN',  # 7
    'SHUTDOWN',         # 8
    'FAIL_ENTRY',       # 9
    'INTR',             # 10
    'SET_TPR',          # 11
    'TPR_ACCESS',       # 12
    'S390_SIEIC',       # 13
    'S390_RESET',       # 14
    'DCR',              # 15
    'NMI',              # 16
    'INTERNAL_ERROR',   # 17
    'OSI',              # 18
    'PAPR_HCALL',       # 19
    'S390_UCONTROL',    # 20
    'WATCHDOG',         # 21
    'S390_TSCH',        # 22
    'EPR',              # 23
)))
171
# CPU flag (as it appears on the 'flags' line of /proc/cpuinfo) -> the
# exit-reason table to use on that kind of host.
x86_exit_reasons = dict(vmx=vmx_exit_reasons, svm=svm_exit_reasons)
176
# Both stay None until one of the platform init functions fills them in.
sc_perf_evt_open = None
exit_reasons = None

# ioctl request numbers issued on the perf event file descriptors (see Event).
ioctl_numbers = dict(
    SET_FILTER=0x40082406,
    ENABLE=0x00002400,
    DISABLE=0x00002401,
)
185
def x86_init(flag):
    """Set the module globals for an x86 host.

    flag -- key into x86_exit_reasons; an unknown key raises KeyError and
            leaves the globals untouched.
    """
    global sc_perf_evt_open, exit_reasons
    # Resolve the table first so a bad flag fails before anything is changed.
    reasons = x86_exit_reasons[flag]
    # NOTE(review): 298 looks like the x86-64 syscall number for
    # perf_event_open; confirm before relying on it for 32-bit x86.
    sc_perf_evt_open = 298
    exit_reasons = reasons
191
def s390_init():
    """Set the perf_event_open syscall number used on s390.

    Only sc_perf_evt_open is changed; exit_reasons is left as it is.
    """
    global sc_perf_evt_open
    sc_perf_evt_open = 331
196
def detect_platform():
    """Pick the platform init function from the content of /proc/cpuinfo.

    A 'flags' line containing a key of x86_exit_reasons selects x86_init()
    with that flag; a 'vendor_id' line containing 'IBM/S390' selects
    s390_init().  The first match wins and ends the scan.  When nothing
    matches, no init function is called and the module globals keep their
    initial values.
    """
    # open() works on Python 2 and 3 (file() does not); the with-block
    # closes the handle, and iterating the file avoids readlines().
    with open('/proc/cpuinfo') as cpuinfo:
        for line in cpuinfo:
            if line.startswith('flags'):
                for flag in line.split():
                    if flag in x86_exit_reasons:
                        x86_init(flag)
                        return
            elif line.startswith('vendor_id'):
                for flag in line.split():
                    if flag == 'IBM/S390':
                        s390_init()
                        return

detect_platform()
Jan Kiszka626c4272011-10-07 09:37:49 +0200211
def invert(d):
    """Return a new dict that maps every value of *d* back to its key.

    When several keys share a value, the one seen last during iteration
    is kept.  *d* itself is not modified.
    """
    # items() exists on Python 2 and 3; iteritems() is Python-2-only.
    return dict((value, key) for key, value in d.items())
214
# tracepoint name -> (name of the field to filter on, {reason name: number})
filters = {
    'kvm_userspace_exit': ('reason', invert(userspace_exit_reasons)),
}
# exit_reasons is only set on platforms that have an exit-reason table.
if exit_reasons:
    filters['kvm_exit'] = ('exit_reason', invert(exit_reasons))
Jan Kiszka626c4272011-10-07 09:37:49 +0200219
220import ctypes, struct, array
221
# Handle on the C library; its syscall() entry point is what
# _perf_event_open() calls.
libc = ctypes.cdll.LoadLibrary('libc.so.6')
syscall = libc.syscall
class perf_event_attr(ctypes.Structure):
    """ctypes structure handed to perf_event_open via _perf_event_open().

    Only the members listed in _fields_ exist in the structure's memory;
    the declared layout ends at bp_len.
    """
    _fields_ = [
        # 32-bit header
        ('type', ctypes.c_uint32),
        ('size', ctypes.c_uint32),
        # 64-bit members
        ('config', ctypes.c_uint64),
        ('sample_freq', ctypes.c_uint64),
        ('sample_type', ctypes.c_uint64),
        ('read_format', ctypes.c_uint64),
        ('flags', ctypes.c_uint64),
        # two more 32-bit members
        ('wakeup_events', ctypes.c_uint32),
        ('bp_type', ctypes.c_uint32),
        # trailing 64-bit members
        ('bp_addr', ctypes.c_uint64),
        ('bp_len', ctypes.c_uint64),
    ]
def _perf_event_open(attr, pid, cpu, group_fd, flags):
    """Issue the perf_event_open system call through libc's syscall().

    attr is passed by pointer; pid, cpu and group_fd are passed as C ints
    and flags as a C long.  The syscall number comes from the module global
    sc_perf_evt_open.  Returns whatever syscall() returns.
    """
    c_args = (
        ctypes.pointer(attr),
        ctypes.c_int(pid),
        ctypes.c_int(cpu),
        ctypes.c_int(group_fd),
        ctypes.c_long(flags),
    )
    return syscall(sc_perf_evt_open, *c_args)
241
# Values for perf_event_attr.type, numbered consecutively from 0.
(PERF_TYPE_HARDWARE,
 PERF_TYPE_SOFTWARE,
 PERF_TYPE_TRACEPOINT,
 PERF_TYPE_HW_CACHE,
 PERF_TYPE_RAW,
 PERF_TYPE_BREAKPOINT) = range(6)

# Bit flags for perf_event_attr.sample_type (bits 0 to 10).
PERF_SAMPLE_IP = 0x001
PERF_SAMPLE_TID = 0x002
PERF_SAMPLE_TIME = 0x004
PERF_SAMPLE_ADDR = 0x008
PERF_SAMPLE_READ = 0x010
PERF_SAMPLE_CALLCHAIN = 0x020
PERF_SAMPLE_ID = 0x040
PERF_SAMPLE_CPU = 0x080
PERF_SAMPLE_PERIOD = 0x100
PERF_SAMPLE_STREAM_ID = 0x200
PERF_SAMPLE_RAW = 0x400

# Bit flags for perf_event_attr.read_format (bits 0 to 3).
PERF_FORMAT_TOTAL_TIME_ENABLED = 0x1
PERF_FORMAT_TOTAL_TIME_RUNNING = 0x2
PERF_FORMAT_ID = 0x4
PERF_FORMAT_GROUP = 0x8

import re

# Root of the tracing directory; event ids are read from below it.
sys_tracing = '/sys/kernel/debug/tracing'
269
class Group(object):
    """A set of Event objects opened for one CPU and read with a single call.

    The first event added provides the file descriptor that read() uses.
    """

    def __init__(self, cpu):
        """Create an empty group for *cpu*."""
        self.events = []
        self.group_leader = None
        self.cpu = cpu

    def add_event(self, name, event_set, tracepoint, filter = None):
        """Open a new Event in this group and append it to self.events.

        name       -- key under which read() reports the counter
        event_set  -- tracing subsystem directory
        tracepoint -- tracepoint name inside event_set
        filter     -- optional filter string handed to Event
        """
        self.events.append(Event(group = self,
                                 name = name, event_set = event_set,
                                 tracepoint = tracepoint, filter = filter))
        if len(self.events) == 1:
            # Binary and unbuffered: the data is decoded with struct, so it
            # must come back as bytes (text mode breaks this on Python 3),
            # and every read() should hit the descriptor with exactly the
            # requested size.
            self.file = os.fdopen(self.events[0].fd, 'rb', 0)

    def read(self):
        """Return a dict mapping each event name to its current counter.

        Reads 8 bytes per event plus an 8-byte header that is skipped.
        """
        # NOTE(review): with PERF_FORMAT_GROUP the skipped leading 8 bytes
        # are presumably the number of values that follow; confirm.
        size = 8 * (1 + len(self.events))
        fmt = 'xxxxxxxx' + 'q' * len(self.events)
        return dict(zip([event.name for event in self.events],
                        struct.unpack(fmt, self.file.read(size))))
286
class Event(object):
    """One tracepoint counter opened through perf_event_open.

    Attributes set by the constructor: name (reporting key) and fd (the
    descriptor returned by _perf_event_open).
    """

    def __init__(self, group, name, event_set, tracepoint, filter = None):
        """Open the tracepoint on group.cpu, joining the group's first event.

        group      -- Group this event belongs to; its first event, if any,
                      is passed as the group leader descriptor
        name       -- key under which the counter is reported
        event_set  -- tracing subsystem directory below sys_tracing/events
        tracepoint -- tracepoint directory below event_set
        filter     -- optional filter string applied with the SET_FILTER ioctl

        Raises Exception('perf_event_open failed') when the call returns -1.
        """
        self.name = name
        attr = perf_event_attr()
        attr.type = PERF_TYPE_TRACEPOINT
        attr.size = ctypes.sizeof(attr)
        id_path = os.path.join(sys_tracing, 'events', event_set,
                               tracepoint, 'id')
        # open() works on Python 2 and 3 (file() does not) and the handle is
        # closed right away; the old local named 'id' shadowed the builtin.
        with open(id_path) as id_file:
            attr.config = int(id_file.read())
        attr.sample_type = (PERF_SAMPLE_RAW
                            | PERF_SAMPLE_TIME
                            | PERF_SAMPLE_CPU)
        # NOTE(review): perf_event_attr as declared in this file has no
        # 'sample_period' member, so this only creates a Python attribute
        # and never reaches the structure passed to the kernel.  Kept to
        # preserve behaviour; decide whether to drop it or set sample_freq.
        attr.sample_period = 1
        attr.read_format = PERF_FORMAT_GROUP
        group_leader = -1
        if group.events:
            group_leader = group.events[0].fd
        fd = _perf_event_open(attr, -1, group.cpu, group_leader, 0)
        if fd == -1:
            raise Exception('perf_event_open failed')
        if filter:
            import fcntl
            try:
                fcntl.ioctl(fd, ioctl_numbers['SET_FILTER'], filter)
            except Exception:
                # Do not leak the descriptor when the filter is rejected.
                os.close(fd)
                raise
        self.fd = fd

    def enable(self):
        """Issue the ENABLE ioctl on this event's descriptor."""
        import fcntl
        fcntl.ioctl(self.fd, ioctl_numbers['ENABLE'], 0)

    def disable(self):
        """Issue the DISABLE ioctl on this event's descriptor."""
        import fcntl
        fcntl.ioctl(self.fd, ioctl_numbers['DISABLE'], 0)
Jan Kiszka626c4272011-10-07 09:37:49 +0200318
class TracepointProvider(object):
    """Statistics provider that counts kvm tracepoints with perf events.

    One Group is created per online CPU, each holding one Event per field.
    Fields are the kvm tracepoint names plus, for tracepoints listed in
    `filters`, one 'tracepoint(reason)' entry per known reason.
    """

    def __init__(self):
        """Discover the kvm tracepoints, open all events and enable them."""
        path = os.path.join(sys_tracing, 'events', 'kvm')
        fields = [f
                  for f in os.listdir(path)
                  if os.path.isdir(os.path.join(path, f))]
        extra = []
        for f in fields:
            if f in filters:
                subfield, values = filters[f]
                # Only the reason names are needed here; iterating the dict
                # directly works on Python 2 and 3 (iteritems() does not).
                for name in values:
                    extra.append(f + '(' + name + ')')
        fields += extra
        self._setup(fields)
        self.select(fields)

    def fields(self):
        """Return every field name this provider was set up with."""
        return self._fields

    def _online_cpus(self, basedir='/sys/devices/system/cpu'):
        """Return the numbers of the CPUs considered online.

        basedir -- directory containing the cpuN entries.

        An entry counts when its name starts with 'cpu' followed by digits
        and it either has no 'online' file or that file contains '1'.
        The result is in directory-listing order.
        """
        cpus = []
        pattern = r'cpu([0-9]+)'
        for entry in os.listdir(basedir):
            match = re.match(pattern, entry)
            if not match:
                continue
            path = os.path.join(basedir, entry, 'online')
            if os.path.exists(path):
                # with-block so the handle is closed deterministically
                with open(path) as online:
                    if online.read().strip() != '1':
                        continue
            cpus.append(int(match.group(1)))
        return cpus

    def _setup(self, _fields):
        """Open one event per field on every online CPU.

        Also sets RLIMIT_NOFILE (soft and hard) to 1000 descriptors per
        online CPU before opening anything.
        """
        self._fields = _fields
        cpus = self._online_cpus()
        import resource
        nfiles = len(cpus) * 1000
        resource.setrlimit(resource.RLIMIT_NOFILE, (nfiles, nfiles))
        self.group_leaders = []
        for cpu in cpus:
            group = Group(cpu)
            for name in _fields:
                tracepoint = name
                filter = None
                # 'tracepoint(reason)' fields become a filtered event on
                # the underlying tracepoint.
                m = re.match(r'(.*)\((.*)\)', name)
                if m:
                    tracepoint, sub = m.groups()
                    filter = '%s==%d\0' % (filters[tracepoint][0],
                                           filters[tracepoint][1][sub])
                group.add_event(name, event_set = 'kvm',
                                tracepoint = tracepoint,
                                filter = filter)
            self.group_leaders.append(group)

    def select(self, fields):
        """Enable the events named in *fields* and disable all others."""
        for group in self.group_leaders:
            for event in group.events:
                if event.name in fields:
                    event.enable()
                else:
                    event.disable()

    def read(self):
        """Return a defaultdict(int) of counters summed over all groups."""
        from collections import defaultdict
        ret = defaultdict(int)
        for group in self.group_leaders:
            # items() exists on Python 2 and 3; iteritems() is 2-only.
            for name, val in group.read().items():
                ret[name] += val
        return ret
387
class Stats(object):
    """Combine several providers and track value/delta per field.

    self.values maps a field name to None (not read yet) or to a tuple
    (latest value, change since the previous get()).
    """

    def __init__(self, providers, fields = None):
        """
        providers -- objects offering fields(), select(list) and read()
        fields    -- optional regex; only field names it matches (re.match)
                     are selected
        """
        self.providers = providers
        self.fields_filter = fields
        self._update()

    def _update(self):
        """Re-apply the field filter to every provider and reset values."""
        import re

        def wanted(key):
            if not self.fields_filter:
                return True
            return re.match(self.fields_filter, key) is not None

        self.values = dict()
        # Use the providers this instance was given; the previous code read
        # a module-level name 'providers' and only worked by coincidence.
        for d in self.providers:
            provider_fields = [key for key in d.fields() if wanted(key)]
            for key in provider_fields:
                self.values[key] = None
            d.select(provider_fields)

    def set_fields_filter(self, fields_filter):
        """Replace the field regex and re-select the providers' fields."""
        self.fields_filter = fields_filter
        self._update()

    def get(self):
        """Read all providers and return the updated self.values dict.

        The delta is None for a field whose previous entry was None, i.e.
        on the first read after construction or after a filter change.
        """
        for d in self.providers:
            new = d.read()
            for key in d.fields():
                oldval = self.values.get(key, (0, 0))
                newval = new[key]
                newdelta = None
                if oldval is not None:
                    newdelta = newval - oldval[0]
                self.values[key] = (newval, newdelta)
        return self.values
419
# Refuse to start when debugfs or its kvm directory is missing.
# print(...) with a single string argument produces the same output on
# Python 2 and is valid syntax on Python 3, unlike the print statement.
if not os.access('/sys/kernel/debug', os.F_OK):
    print('Please enable CONFIG_DEBUG_FS in your kernel')
    sys.exit(1)
if not os.access('/sys/kernel/debug/kvm', os.F_OK):
    print("Please mount debugfs ('mount -t debugfs debugfs /sys/kernel/debug')")
    print("and ensure the kvm modules are loaded")
    sys.exit(1)
427
# Column widths used by tui(): field name, then the running total.
label_width = 40
number_width = 10

def tui(screen, stats):
    """Run the interactive curses display until the user quits.

    screen -- curses window to draw on
    stats  -- object providing fields_filter, set_fields_filter() and get()

    Keys: 'x' toggles drill-down, 'q' or Ctrl-C leaves the loop.  The first
    refresh happens after 0.25 s, later ones every 3 s.
    """
    curses.use_default_colors()
    curses.noecho()
    drilldown = False
    fields_filter = stats.fields_filter

    def update_drilldown():
        # A filter supplied by the caller is never overridden.
        if fields_filter:
            return
        if drilldown:
            stats.set_fields_filter(None)
        else:
            # hide every field whose name contains '('
            stats.set_fields_filter(r'^[^\(]*$')

    update_drilldown()

    def refresh(sleeptime):
        screen.erase()
        screen.addstr(0, 0, 'kvm statistics')
        snapshot = stats.get()

        def sortkey(name):
            # Largest delta first, then largest total; fields without a
            # (non-zero) delta sort by total only.
            total, delta = snapshot[name]
            if delta:
                return (-delta, -total)
            return (0, -total)

        name_col = 1
        total_col = name_col + label_width
        delta_col = total_col + number_width
        # Rows 0 and 1 are the title and a blank line.
        for row, name in enumerate(sorted(snapshot.keys(), key = sortkey), 2):
            if row >= screen.getmaxyx()[0]:
                break
            total, delta = snapshot[name]
            if not total and not delta:
                # sorted order: everything after this is empty as well
                break
            screen.addstr(row, name_col, name)
            screen.addstr(row, total_col, '%10d' % (total,))
            if delta is not None:
                screen.addstr(row, delta_col, '%8d' % (delta / sleeptime,))
        screen.refresh()

    sleeptime = 0.25
    while True:
        refresh(sleeptime)
        curses.halfdelay(int(sleeptime * 10))
        sleeptime = 3
        try:
            pressed = screen.getkey()
            if pressed == 'x':
                drilldown = not drilldown
                update_drilldown()
            elif pressed == 'q':
                break
        except KeyboardInterrupt:
            break
        except curses.error:
            # no key within the half-delay period: just redraw
            continue
485
def batch(stats, interval=1):
    """Print one line per field with its total and its change over *interval*.

    stats    -- object whose get() returns {name: (value, delta)}
    interval -- seconds to wait between the two samples (default 1, the
                value that used to be hard-coded)
    """
    # The first sample only establishes the baseline for the deltas.
    stats.get()
    time.sleep(interval)
    s = stats.get()
    for key in sorted(s.keys()):
        values = s[key]
        # print(...) with one argument behaves the same on Python 2 and 3.
        print('%-22s%10d%10d' % (key, values[0], values[1]))
493
def log(stats, interval=1):
    """Print the per-interval deltas of all fields forever, one row per sample.

    stats    -- object whose get() returns {name: (value, delta)}
    interval -- seconds between rows (default 1, the value that used to be
                hard-coded)

    The set of columns is fixed by the first get() call.  A header row is
    printed before the first row and then again every 20 rows.  The function
    only returns through an exception (for example KeyboardInterrupt).
    """
    # sorted() over keys() works on Python 2 and 3; iterkeys() is 2-only.
    keys = sorted(stats.get().keys())

    def banner():
        # Joining with ' ' reproduces the separator that the Python 2
        # "print item," form inserted between items.
        print(' '.join('%10s' % k[0:9] for k in keys))

    def statline():
        s = stats.get()
        print(' '.join(' %9d' % s[k][1] for k in keys))

    line = 0
    banner_repeat = 20
    while True:
        time.sleep(interval)
        if line % banner_repeat == 0:
            banner()
        statline()
        line += 1
513
# Command line definition: (option strings, add_option keyword arguments).
options = optparse.OptionParser()
for _names, _attrs in (
        (('-1', '--once', '--batch'),
         dict(action='store_true', default=False, dest='once',
              help='run in batch mode for one second')),
        (('-l', '--log'),
         dict(action='store_true', default=False, dest='log',
              help='run in logging mode (like vmstat)')),
        (('-t', '--tracepoints'),
         dict(action='store_true', default=False, dest='tracepoints',
              help='retrieve statistics from tracepoints')),
        (('-d', '--debugfs'),
         dict(action='store_true', default=False, dest='debugfs',
              help='retrieve statistics from debugfs')),
        (('-f', '--fields'),
         dict(action='store', default=None, dest='fields',
              help='fields to display (regex)')),
):
    options.add_option(*_names, **_attrs)
del _names, _attrs
# From here on 'options' is the parsed result, no longer the parser.
(options, args) = options.parse_args(sys.argv)
546
# Build the list of statistics sources requested on the command line.
providers = []
if options.tracepoints:
    providers.append(TracepointProvider())
if options.debugfs:
    providers.append(DebugfsProvider())

if not providers:
    # Nothing requested explicitly: prefer tracepoints and fall back to
    # debugfs when they cannot be set up.  'except Exception' keeps the
    # fallback but no longer swallows KeyboardInterrupt or SystemExit the
    # way the bare 'except:' did.
    try:
        providers = [TracepointProvider()]
    except Exception:
        providers = [DebugfsProvider()]

stats = Stats(providers, fields = options.fields)
Jan Kiszka626c4272011-10-07 09:37:49 +0200560
# Pick the output mode: vmstat-like log, interactive curses UI (default),
# or a single batch sample.
if options.log:
    log(stats)
elif not options.once:
    # curses.wrapper is reachable through the top-level 'import curses';
    # the former 'import curses.wrapper' fails on Python 3, where wrapper
    # is a function of the curses package rather than a submodule.
    curses.wrapper(tui, stats)
else:
    batch(stats)
567 batch(stats)