blob: 8f6f00715e2b554df7aa6f80e4cc6c7f1c994d2f [file] [log] [blame]
Jan Kiszka626c4272011-10-07 09:37:49 +02001#!/usr/bin/python
2#
3# top-like utility for displaying kvm statistics
4#
5# Copyright 2006-2008 Qumranet Technologies
6# Copyright 2008-2011 Red Hat, Inc.
7#
8# Authors:
9# Avi Kivity <avi@redhat.com>
10#
11# This work is licensed under the terms of the GNU GPL, version 2. See
12# the COPYING file in the top-level directory.
13
14import curses
Michael Ellerman47253982014-06-17 17:54:35 +100015import sys, os, time, optparse, ctypes
Wei Huang874b1cf2015-01-21 16:15:31 -050016from ctypes import *
Jan Kiszka626c4272011-10-07 09:37:49 +020017
class DebugfsProvider(object):
    """Statistics provider backed by the kvm directory in debugfs.

    Every entry found under ``/sys/kernel/debug/kvm`` at construction time
    is treated as one field; reading a field parses the entry's content as
    an integer.
    """

    def __init__(self):
        self.base = '/sys/kernel/debug/kvm'
        self._fields = os.listdir(self.base)

    def fields(self):
        """Return the list of currently selected field names."""
        return self._fields

    def select(self, fields):
        """Restrict subsequent read() calls to the given field names."""
        self._fields = fields

    def read(self):
        """Return a dict mapping every selected field to its integer value.

        Raises whatever open()/int() raise if an entry is unreadable or
        does not contain an integer.
        """
        def val(key):
            # open() inside a with-block replaces the Python-2-only file()
            # builtin and closes the handle deterministically instead of
            # leaving that to the garbage collector.
            with open(self.base + '/' + key) as counter:
                return int(counter.read())
        return dict((key, val(key)) for key in self._fields)
30
# Exit reason number -> symbolic name, used when /proc/cpuinfo reports the
# 'vmx' CPU flag (looked up through x86_exit_reasons).  The inverted table
# is used to build per-reason 'kvm_exit' tracepoint filters.
vmx_exit_reasons = {
    0: 'EXCEPTION_NMI',
    1: 'EXTERNAL_INTERRUPT',
    2: 'TRIPLE_FAULT',
    7: 'PENDING_INTERRUPT',
    8: 'NMI_WINDOW',
    9: 'TASK_SWITCH',
    10: 'CPUID',
    12: 'HLT',
    14: 'INVLPG',
    15: 'RDPMC',
    16: 'RDTSC',
    18: 'VMCALL',
    19: 'VMCLEAR',
    20: 'VMLAUNCH',
    21: 'VMPTRLD',
    22: 'VMPTRST',
    23: 'VMREAD',
    24: 'VMRESUME',
    25: 'VMWRITE',
    26: 'VMOFF',
    27: 'VMON',
    28: 'CR_ACCESS',
    29: 'DR_ACCESS',
    30: 'IO_INSTRUCTION',
    31: 'MSR_READ',
    32: 'MSR_WRITE',
    33: 'INVALID_STATE',
    36: 'MWAIT_INSTRUCTION',
    39: 'MONITOR_INSTRUCTION',
    40: 'PAUSE_INSTRUCTION',
    41: 'MCE_DURING_VMENTRY',
    43: 'TPR_BELOW_THRESHOLD',
    44: 'APIC_ACCESS',
    48: 'EPT_VIOLATION',
    49: 'EPT_MISCONFIG',
    54: 'WBINVD',
    55: 'XSETBV',
    56: 'APIC_WRITE',
    58: 'INVPCID',
}
72
# Exit reason number -> symbolic name, used when /proc/cpuinfo reports the
# 'svm' CPU flag (looked up through x86_exit_reasons).  The inverted table
# is used to build per-reason 'kvm_exit' tracepoint filters.
svm_exit_reasons = {
    0x000: 'READ_CR0',
    0x003: 'READ_CR3',
    0x004: 'READ_CR4',
    0x008: 'READ_CR8',
    0x010: 'WRITE_CR0',
    0x013: 'WRITE_CR3',
    0x014: 'WRITE_CR4',
    0x018: 'WRITE_CR8',
    0x020: 'READ_DR0',
    0x021: 'READ_DR1',
    0x022: 'READ_DR2',
    0x023: 'READ_DR3',
    0x024: 'READ_DR4',
    0x025: 'READ_DR5',
    0x026: 'READ_DR6',
    0x027: 'READ_DR7',
    0x030: 'WRITE_DR0',
    0x031: 'WRITE_DR1',
    0x032: 'WRITE_DR2',
    0x033: 'WRITE_DR3',
    0x034: 'WRITE_DR4',
    0x035: 'WRITE_DR5',
    0x036: 'WRITE_DR6',
    0x037: 'WRITE_DR7',
    0x040: 'EXCP_BASE',
    0x060: 'INTR',
    0x061: 'NMI',
    0x062: 'SMI',
    0x063: 'INIT',
    0x064: 'VINTR',
    0x065: 'CR0_SEL_WRITE',
    0x066: 'IDTR_READ',
    0x067: 'GDTR_READ',
    0x068: 'LDTR_READ',
    0x069: 'TR_READ',
    0x06a: 'IDTR_WRITE',
    0x06b: 'GDTR_WRITE',
    0x06c: 'LDTR_WRITE',
    0x06d: 'TR_WRITE',
    0x06e: 'RDTSC',
    0x06f: 'RDPMC',
    0x070: 'PUSHF',
    0x071: 'POPF',
    0x072: 'CPUID',
    0x073: 'RSM',
    0x074: 'IRET',
    0x075: 'SWINT',
    0x076: 'INVD',
    0x077: 'PAUSE',
    0x078: 'HLT',
    0x079: 'INVLPG',
    0x07a: 'INVLPGA',
    0x07b: 'IOIO',
    0x07c: 'MSR',
    0x07d: 'TASK_SWITCH',
    0x07e: 'FERR_FREEZE',
    0x07f: 'SHUTDOWN',
    0x080: 'VMRUN',
    0x081: 'VMMCALL',
    0x082: 'VMLOAD',
    0x083: 'VMSAVE',
    0x084: 'STGI',
    0x085: 'CLGI',
    0x086: 'SKINIT',
    0x087: 'RDTSCP',
    0x088: 'ICEBP',
    0x089: 'WBINVD',
    0x08a: 'MONITOR',
    0x08b: 'MWAIT',
    0x08c: 'MWAIT_COND',
    0x08d: 'XSETBV',
    0x400: 'NPF',
}
147
# From include/uapi/linux/kvm.h, KVM_EXIT_xxx
# Exit reason number -> symbolic name (without the KVM_EXIT_ prefix).  The
# inverted table is used to build per-reason 'kvm_userspace_exit'
# tracepoint filters on every platform.
userspace_exit_reasons = {
    0: 'UNKNOWN',
    1: 'EXCEPTION',
    2: 'IO',
    3: 'HYPERCALL',
    4: 'DEBUG',
    5: 'HLT',
    6: 'MMIO',
    7: 'IRQ_WINDOW_OPEN',
    8: 'SHUTDOWN',
    9: 'FAIL_ENTRY',
    10: 'INTR',
    11: 'SET_TPR',
    12: 'TPR_ACCESS',
    13: 'S390_SIEIC',
    14: 'S390_RESET',
    15: 'DCR',
    16: 'NMI',
    17: 'INTERNAL_ERROR',
    18: 'OSI',
    19: 'PAPR_HCALL',
    20: 'S390_UCONTROL',
    21: 'WATCHDOG',
    22: 'S390_TSCH',
    23: 'EPR',
    24: 'SYSTEM_EVENT',
}
176
# CPU flag as it appears in /proc/cpuinfo -> exit reason table for that
# virtualization extension.
x86_exit_reasons = {
    'vmx': vmx_exit_reasons,
    'svm': svm_exit_reasons,
}

# Platform-dependent settings; both stay None until one of the *_init()
# functions below fills them in.
# sc_perf_evt_open: syscall number handed to syscall() by _perf_event_open.
sc_perf_evt_open = None
# exit_reasons: hardware exit reason table (only set by x86_init).
exit_reasons = None

# Default ioctl request codes issued on perf event file descriptors;
# ppc_init() replaces this table with platform-specific values.
ioctl_numbers = {
    'SET_FILTER' : 0x40082406,
    'ENABLE'     : 0x00002400,
    'DISABLE'    : 0x00002401,
}
190
def x86_init(flag):
    """Set the module-level platform settings for an x86 host.

    flag is a key of x86_exit_reasons ('vmx' or 'svm'); a KeyError is
    raised for anything else, in which case no global is modified.
    """
    global sc_perf_evt_open, exit_reasons
    # Look the table up first so a bad flag leaves both globals untouched.
    reasons = x86_exit_reasons[flag]
    sc_perf_evt_open = 298
    exit_reasons = reasons
196
def s390_init():
    """Set the module-level perf_event_open syscall number for s390."""
    global sc_perf_evt_open
    sc_perf_evt_open = 331
201
def ppc_init():
    """Set the module-level syscall number and ioctl codes for ppc.

    Replaces the default ioctl_numbers table; the SET_FILTER code embeds
    the size of a C char pointer in bits 16 and up.
    """
    global sc_perf_evt_open, ioctl_numbers
    pointer_size = ctypes.sizeof(ctypes.c_char_p)
    ppc_ioctls = {
        'SET_FILTER': 0x80002406 | (pointer_size << 16),
        'ENABLE': 0x20002400,
        'DISABLE': 0x20002401,
    }
    sc_perf_evt_open = 319
    ioctl_numbers = ppc_ioctls
211
def aarch64_init():
    """Set the module-level perf_event_open syscall number for aarch64."""
    global sc_perf_evt_open
    sc_perf_evt_open = 241
216
def detect_platform():
    """Detect the host architecture and run the matching *_init() function.

    ppc and aarch64 are recognised from the machine field of os.uname().
    Otherwise /proc/cpuinfo is scanned: a 'flags' line containing a key of
    x86_exit_reasons selects x86, a 'vendor_id' line containing 'IBM/S390'
    selects s390.  If nothing matches, no init function is called and the
    platform globals keep their defaults.
    """
    machine = os.uname()[4]
    if machine.startswith('ppc'):
        ppc_init()
        return
    if machine.startswith('aarch64'):
        aarch64_init()
        return

    # with-block: the handle is closed on every return path (the original
    # used the Python-2-only file() builtin and never closed it).
    with open('/proc/cpuinfo') as cpuinfo:
        for line in cpuinfo:
            if line.startswith('flags'):
                for flag in line.split():
                    if flag in x86_exit_reasons:
                        x86_init(flag)
                        return
            elif line.startswith('vendor_id'):
                if 'IBM/S390' in line.split():
                    s390_init()
                    return
236
# Run the detection at import time: the code below reads exit_reasons while
# building the tracepoint filter table.
detect_platform()
Jan Kiszka626c4272011-10-07 09:37:49 +0200238
def invert(d):
    """Return a new dict with the keys and values of d swapped.

    If several keys share a value, the pair visited last wins.  Uses
    items() rather than the Python-2-only iteritems() so the helper works
    on both Python 2 and Python 3.
    """
    return dict((value, key) for key, value in d.items())
241
# Tracepoint name -> (name of the filter field, {reason name: number}).
# 'kvm_exit' is only filterable when the platform set exit_reasons.
filters = {
    'kvm_userspace_exit': ('reason', invert(userspace_exit_reasons)),
}
if exit_reasons:
    filters['kvm_exit'] = ('exit_reason', invert(exit_reasons))
Jan Kiszka626c4272011-10-07 09:37:49 +0200246
Michael Ellerman47253982014-06-17 17:54:35 +1000247import struct, array
Jan Kiszka626c4272011-10-07 09:37:49 +0200248
# Raw libc bindings: syscall() issues perf_event_open by number, and
# __errno_location() yields a pointer to errno for error reporting.
libc = ctypes.CDLL('libc.so.6')
get_errno = libc.__errno_location
get_errno.restype = ctypes.POINTER(ctypes.c_int)
syscall = libc.syscall
253
class perf_event_attr(ctypes.Structure):
    """Attribute block passed by pointer to the perf_event_open syscall.

    Field order and widths fix the binary layout seen by the kernel, so
    they must not be reordered.
    NOTE(review): presumably mirrors the leading members of the kernel's
    struct perf_event_attr -- verify against linux/perf_event.h.
    """
    _fields_ = [('type', ctypes.c_uint32),
                ('size', ctypes.c_uint32),
                ('config', ctypes.c_uint64),
                ('sample_freq', ctypes.c_uint64),
                ('sample_type', ctypes.c_uint64),
                ('read_format', ctypes.c_uint64),
                ('flags', ctypes.c_uint64),
                ('wakeup_events', ctypes.c_uint32),
                ('bp_type', ctypes.c_uint32),
                ('bp_addr', ctypes.c_uint64),
                ('bp_len', ctypes.c_uint64),
                ]
def _perf_event_open(attr, pid, cpu, group_fd, flags):
    """Invoke the perf_event_open syscall through libc's syscall().

    attr is a perf_event_attr instance (passed by pointer); pid, cpu and
    group_fd are converted to C ints and flags to a C long.  Returns
    whatever syscall() returns; callers treat -1 as failure.
    """
    arguments = (
        ctypes.pointer(attr),
        ctypes.c_int(pid),
        ctypes.c_int(cpu),
        ctypes.c_int(group_fd),
        ctypes.c_long(flags),
    )
    return syscall(sc_perf_evt_open, *arguments)
271
# Values for perf_event_attr.type; this script only opens
# PERF_TYPE_TRACEPOINT events.
PERF_TYPE_HARDWARE              = 0
PERF_TYPE_SOFTWARE              = 1
PERF_TYPE_TRACEPOINT            = 2
PERF_TYPE_HW_CACHE              = 3
PERF_TYPE_RAW                   = 4
PERF_TYPE_BREAKPOINT            = 5

# Bit flags OR-ed together into perf_event_attr.sample_type.
PERF_SAMPLE_IP                  = 1 << 0
PERF_SAMPLE_TID                 = 1 << 1
PERF_SAMPLE_TIME                = 1 << 2
PERF_SAMPLE_ADDR                = 1 << 3
PERF_SAMPLE_READ                = 1 << 4
PERF_SAMPLE_CALLCHAIN           = 1 << 5
PERF_SAMPLE_ID                  = 1 << 6
PERF_SAMPLE_CPU                 = 1 << 7
PERF_SAMPLE_PERIOD              = 1 << 8
PERF_SAMPLE_STREAM_ID           = 1 << 9
PERF_SAMPLE_RAW                 = 1 << 10

# Bit flags for perf_event_attr.read_format; events here are opened with
# PERF_FORMAT_GROUP.
PERF_FORMAT_TOTAL_TIME_ENABLED  = 1 << 0
PERF_FORMAT_TOTAL_TIME_RUNNING  = 1 << 1
PERF_FORMAT_ID                  = 1 << 2
PERF_FORMAT_GROUP               = 1 << 3
295
296import re
297
# Root of the tracing directory in debugfs; tracepoint ids are read from
# <sys_tracing>/events/<event_set>/<tracepoint>/id.
sys_tracing = '/sys/kernel/debug/tracing'
299
class Group(object):
    """A set of perf events opened on one CPU and read back together.

    The first event added acts as the group leader: later events are
    opened with its file descriptor as group_fd (see Event), and all
    counters are read through the leader's descriptor.
    """

    def __init__(self, cpu):
        self.events = []
        self.group_leader = None
        self.cpu = cpu

    def add_event(self, name, event_set, tracepoint, filter=None):
        """Open a new Event in this group and append it to self.events.

        Returns None.  Any exception raised while opening the Event
        propagates to the caller.
        """
        self.events.append(Event(group=self,
                                 name=name, event_set=event_set,
                                 tracepoint=tracepoint, filter=filter))
        if len(self.events) == 1:
            # The descriptor delivers raw binary counters, so wrap it as an
            # unbuffered binary stream: every read() maps to exactly one
            # request of the size we ask for, on Python 2 and 3 alike.
            self.file = os.fdopen(self.events[0].fd, 'rb', 0)

    def read(self):
        """Return a dict mapping each event name to its current count.

        Reads one 8-byte header followed by one signed 64-bit value per
        event from the leader's descriptor; the header is skipped.
        NOTE(review): the header is presumably the event count of a
        PERF_FORMAT_GROUP read -- confirm against perf_event_open(2).
        """
        count = len(self.events)
        nbytes = 8 * (1 + count)
        fmt = 'xxxxxxxx' + 'q' * count
        values = struct.unpack(fmt, self.file.read(nbytes))
        return dict(zip([event.name for event in self.events], values))
316
class Event(object):
    """One tracepoint perf event opened on the CPU of its Group.

    Attributes:
        name: label under which the counter is reported.
        fd:   file descriptor returned by perf_event_open.
    """

    def __init__(self, group, name, event_set, tracepoint, filter=None):
        """Open the event and optionally attach a tracepoint filter.

        group      -- Group this event belongs to; if the group already
                      has events, the first one's fd is used as group_fd.
        name       -- label for the counter.
        event_set  -- tracing subsystem directory (e.g. 'kvm').
        tracepoint -- tracepoint directory inside event_set.
        filter     -- optional filter string passed to the SET_FILTER
                      ioctl.

        Raises Exception if perf_event_open returns -1; errors from
        reading the id file or from the ioctl propagate unchanged.
        """
        self.name = name
        attr = perf_event_attr()
        attr.type = PERF_TYPE_TRACEPOINT
        attr.size = ctypes.sizeof(attr)
        id_path = os.path.join(sys_tracing, 'events', event_set,
                               tracepoint, 'id')
        # with-block instead of the Python-2-only file() builtin, so the
        # handle is closed immediately.
        with open(id_path) as id_file:
            attr.config = int(id_file.read())
        attr.sample_type = (PERF_SAMPLE_RAW
                            | PERF_SAMPLE_TIME
                            | PERF_SAMPLE_CPU)
        # NOTE(review): perf_event_attr declares 'sample_freq' but no
        # 'sample_period' field, so this only sets a plain Python attribute
        # and does not reach the structure given to the kernel.  Kept as-is
        # to preserve the existing behaviour.
        attr.sample_period = 1
        attr.read_format = PERF_FORMAT_GROUP
        group_leader = -1
        if group.events:
            group_leader = group.events[0].fd
        fd = _perf_event_open(attr, -1, group.cpu, group_leader, 0)
        if fd == -1:
            err = get_errno()[0]
            raise Exception('perf_event_open failed, errno = ' + str(err))
        if filter:
            import fcntl
            try:
                fcntl.ioctl(fd, ioctl_numbers['SET_FILTER'], filter)
            except Exception:
                # Do not leak the freshly opened descriptor when the filter
                # is rejected.
                os.close(fd)
                raise
        self.fd = fd

    def enable(self):
        """Start counting: issue the ENABLE ioctl on the event's fd."""
        import fcntl
        fcntl.ioctl(self.fd, ioctl_numbers['ENABLE'], 0)

    def disable(self):
        """Stop counting: issue the DISABLE ioctl on the event's fd."""
        import fcntl
        fcntl.ioctl(self.fd, ioctl_numbers['DISABLE'], 0)
Jan Kiszka626c4272011-10-07 09:37:49 +0200349
class TracepointProvider(object):
    """Statistics provider that counts kvm tracepoints via perf events.

    One Group of events is opened per online CPU.  Besides the plain
    tracepoints, a filtered sub-event named 'tracepoint(reason)' is
    created for every entry of the module-level filters table.
    """

    def __init__(self):
        path = os.path.join(sys_tracing, 'events', 'kvm')
        fields = [f
                  for f in os.listdir(path)
                  if os.path.isdir(os.path.join(path, f))]
        extra = []
        for f in fields:
            if f in filters:
                subfield, values = filters[f]
                # Only the reason names are needed to build the labels.
                for name in values:
                    extra.append(f + '(' + name + ')')
        fields += extra
        self._setup(fields)
        self.select(fields)

    def fields(self):
        """Return the names of all events that were opened."""
        return self._fields

    def _online_cpus(self):
        """Return the numbers of all CPUs that are not marked offline.

        A cpuN directory without an 'online' file counts as online.
        """
        cpus = []
        pattern = r'cpu([0-9]+)'
        basedir = '/sys/devices/system/cpu'
        for entry in os.listdir(basedir):
            match = re.match(pattern, entry)
            if not match:
                continue
            path = os.path.join(basedir, entry, 'online')
            if os.path.exists(path):
                # Close the sysfs file right away instead of leaving the
                # handle to the garbage collector.
                with open(path) as online:
                    if online.read().strip() != '1':
                        continue
            cpus.append(int(match.group(1)))
        return cpus

    def _setup(self, _fields):
        """Open one event per field on every online CPU.

        Raises the file descriptor limit to 1000 per CPU first, since every
        event needs its own descriptor.
        """
        import resource
        self._fields = _fields
        cpus = self._online_cpus()
        nfiles = len(cpus) * 1000
        resource.setrlimit(resource.RLIMIT_NOFILE, (nfiles, nfiles))
        # 'tracepoint(sub)' names denote a filtered sub-event.
        sub_event = re.compile(r'(.*)\((.*)\)')
        self.group_leaders = []
        for cpu in cpus:
            group = Group(cpu)
            for name in _fields:
                tracepoint = name
                event_filter = None
                m = sub_event.match(name)
                if m:
                    tracepoint, sub = m.groups()
                    event_filter = '%s==%d\0' % (filters[tracepoint][0],
                                                 filters[tracepoint][1][sub])
                group.add_event(name, event_set='kvm',
                                tracepoint=tracepoint,
                                filter=event_filter)
            self.group_leaders.append(group)

    def select(self, fields):
        """Enable the events named in fields and disable all others."""
        for group in self.group_leaders:
            for event in group.events:
                if event.name in fields:
                    event.enable()
                else:
                    event.disable()

    def read(self):
        """Return a mapping of event name to its count summed over CPUs."""
        from collections import defaultdict
        ret = defaultdict(int)
        for group in self.group_leaders:
            for name, val in group.read().items():
                ret[name] += val
        return ret
418
class Stats(object):
    """Aggregate counters from several providers and track their deltas.

    self.values maps a field name to None (not sampled yet) or to a tuple
    (current value, delta since the previous sample).
    """

    def __init__(self, providers, fields=None):
        """providers: objects offering fields(), select() and read().
        fields: optional regex; only matching field names are selected.
        """
        self.providers = providers
        self.fields_filter = fields
        self._update()

    def _update(self):
        """Re-apply the field filter to every provider and reset values."""
        import re

        def wanted(key):
            if not self.fields_filter:
                return True
            return re.match(self.fields_filter, key) is not None

        self.values = dict()
        # Iterate the providers given to this instance, not whatever module
        # global happens to be called 'providers'.
        for d in self.providers:
            provider_fields = [key for key in d.fields() if wanted(key)]
            for key in provider_fields:
                self.values[key] = None
            d.select(provider_fields)

    def set_fields_filter(self, fields_filter):
        """Install a new filter regex (or None) and reset all values."""
        self.fields_filter = fields_filter
        self._update()

    def get(self):
        """Sample all providers and return the updated self.values dict.

        The delta of a field is None on its first sample after a reset.
        """
        for d in self.providers:
            new = d.read()
            for key in d.fields():
                oldval = self.values.get(key, (0, 0))
                newval = new[key]
                newdelta = None
                if oldval is not None:
                    newdelta = newval - oldval[0]
                self.values[key] = (newval, newdelta)
        return self.values
450
# Refuse to start when debugfs or the kvm directory inside it is missing;
# both checks print a hint and exit with status 1.
if not os.access('/sys/kernel/debug', os.F_OK):
    print 'Please enable CONFIG_DEBUG_FS in your kernel'
    sys.exit(1)
if not os.access('/sys/kernel/debug/kvm', os.F_OK):
    print "Please mount debugfs ('mount -t debugfs debugfs /sys/kernel/debug')"
    print "and ensure the kvm modules are loaded"
    sys.exit(1)
458
# Column layout of the curses view: the counter column starts label_width
# columns after the name, the rate column number_width columns after that.
label_width = 40
number_width = 10
461
def tui(screen, stats):
    """Interactive top-like display, meant to be run by curses.wrapper.

    screen -- curses window to draw on.
    stats  -- Stats instance supplying the counters.

    Keys: 'x' toggles drill-down (showing the 'name(reason)' sub-events),
    'q' or Ctrl-C quits.  The first refresh happens after 0.25 s, later
    ones every 3 s or on a key press.
    """
    curses.use_default_colors()
    curses.noecho()
    drilldown = False
    fields_filter = stats.fields_filter

    def update_drilldown():
        # A filter given by the caller always wins; drill-down only
        # switches between "everything" and "names without parentheses".
        if fields_filter:
            return
        if drilldown:
            stats.set_fields_filter(None)
        else:
            stats.set_fields_filter(r'^[^\(]*$')

    update_drilldown()

    def refresh(sleeptime):
        screen.erase()
        screen.addstr(0, 0, 'kvm statistics')
        current = stats.get()

        def sortkey(name):
            # Highest rate first, ties broken by highest total.
            total, delta = current[name]
            if delta:
                return (-delta, -total)
            return (0, -total)

        row = 2
        for name in sorted(current.keys(), key=sortkey):
            if row >= screen.getmaxyx()[0]:
                break
            total, delta = current[name]
            # Sorted order puts all-zero counters last, so stop here.
            if not total and not delta:
                break
            screen.addstr(row, 1, name)
            screen.addstr(row, 1 + label_width, '%10d' % (total,))
            if delta is not None:
                screen.addstr(row, 1 + label_width + number_width,
                              '%8d' % (delta / sleeptime,))
            row += 1
        screen.refresh()

    sleeptime = 0.25
    while True:
        refresh(sleeptime)
        # halfdelay takes tenths of a second; getkey() raises curses.error
        # when that timeout expires without input.
        curses.halfdelay(int(sleeptime * 10))
        sleeptime = 3
        try:
            pressed = screen.getkey()
            if pressed == 'x':
                drilldown = not drilldown
                update_drilldown()
            if pressed == 'q':
                break
        except KeyboardInterrupt:
            break
        except curses.error:
            continue
516
def batch(stats, interval=1):
    """Print every counter once with its change over one interval.

    stats    -- object whose get() returns {name: (value, delta)}.
    interval -- seconds to wait between the two samples (default 1, the
                previously hard-coded value).

    The first get() only establishes the baseline; the second one yields
    the deltas that are printed, one 'name value delta' line per counter
    in sorted name order.
    """
    stats.get()
    time.sleep(interval)
    s = stats.get()
    for key in sorted(s.keys()):
        values = s[key]
        # Single-argument print(...) behaves identically on Python 2 and 3.
        print('%-22s%10d%10d' % (key, values[0], values[1]))
524
def log(stats, interval=1):
    """Print one line of counter deltas per interval, vmstat style.

    stats    -- object whose get() returns {name: (value, delta)}.
    interval -- seconds between lines (default 1, the previously
                hard-coded value).

    The set of columns is fixed by the first sample; a banner with the
    column names (cut to 9 characters) is repeated every 20 lines.  Runs
    until interrupted.
    """
    keys = sorted(stats.get())

    def banner():
        # ' '.join reproduces the single space the Python 2
        # "print item," statement put between items.
        print(' '.join('%10s' % k[0:9] for k in keys))

    def statline():
        s = stats.get()
        print(' '.join(' %9d' % s[k][1] for k in keys))

    line = 0
    banner_repeat = 20
    while True:
        time.sleep(interval)
        if line % banner_repeat == 0:
            banner()
        statline()
        line += 1
544
# Command line interface.  Without -1 or -l the curses view is shown;
# -t/-d choose the statistics source(s) and -f restricts the fields.
options = optparse.OptionParser()
options.add_option('-1', '--once', '--batch',
                   action = 'store_true',
                   default = False,
                   dest = 'once',
                   help = 'run in batch mode for one second',
                   )
options.add_option('-l', '--log',
                   action = 'store_true',
                   default = False,
                   dest = 'log',
                   help = 'run in logging mode (like vmstat)',
                   )
options.add_option('-t', '--tracepoints',
                   action = 'store_true',
                   default = False,
                   dest = 'tracepoints',
                   help = 'retrieve statistics from tracepoints',
                   )
options.add_option('-d', '--debugfs',
                   action = 'store_true',
                   default = False,
                   dest = 'debugfs',
                   help = 'retrieve statistics from debugfs',
                   )
options.add_option('-f', '--fields',
                   action = 'store',
                   default = None,
                   dest = 'fields',
                   help = 'fields to display (regex)',
                   )
# From here on 'options' is rebound from the parser to the parsed values.
(options, args) = options.parse_args(sys.argv)
577
# Build the list of statistics sources requested on the command line.
providers = []
if options.tracepoints:
    providers.append(TracepointProvider())
if options.debugfs:
    providers.append(DebugfsProvider())

# Nothing requested explicitly: prefer tracepoints and fall back to debugfs
# when they cannot be set up.
if not providers:
    try:
        providers = [TracepointProvider()]
    except Exception:
        # 'except Exception' keeps the best-effort fallback but, unlike a
        # bare 'except:', lets Ctrl-C and sys.exit() through.
        providers = [DebugfsProvider()]

stats = Stats(providers, fields=options.fields)
Jan Kiszka626c4272011-10-07 09:37:49 +0200591
# Pick the output mode: vmstat-like log, interactive curses view (default)
# or a single batch sample.
if options.log:
    log(stats)
elif not options.once:
    # curses.wrapper is exposed by the curses package itself; the former
    # 'import curses.wrapper' was redundant and fails on Python 3, where
    # wrapper is a function rather than a submodule.
    curses.wrapper(tui, stats)
else:
    batch(stats)
598 batch(stats)