kvm: Set the perf exclude_host attribute if available

The performance counting framework in Linux 3.2 and onwards supports
an attribute to exclude events generated by the host when running
KVM. Setting this attribute allows us to get more reliable
measurements of the guest machine. For example, on a highly loaded
system, the instruction counts from the guest can be severely
distorted by the host kernel (e.g., by page fault handlers).

This changeset introduces a check for the attribute and enables it in
the KVM CPU if present.
This commit is contained in:
Andreas Sandberg 2013-10-15 10:09:23 +02:00
parent d4f205ea2f
commit 4b8be6a90b
3 changed files with 86 additions and 2 deletions

View file

@ -794,12 +794,35 @@ def CheckLeading(context):
context.Result(ret) context.Result(ret)
return ret return ret
# Add a custom Check function to test for structure members.
def CheckMember(context, include, decl, member, include_quotes="<>"):
context.Message("Checking for member %s in %s..." %
(member, decl))
text = """
#include %(header)s
int main(){
%(decl)s test;
(void)test.%(member)s;
return 0;
};
""" % { "header" : include_quotes[0] + include + include_quotes[1],
"decl" : decl,
"member" : member,
}
ret = context.TryCompile(text, extension=".cc")
context.Result(ret)
return ret
# Platform-specific configuration. Note again that we assume that all # Platform-specific configuration. Note again that we assume that all
# builds under a given build root run on the same host platform. # builds under a given build root run on the same host platform.
conf = Configure(main, conf = Configure(main,
conf_dir = joinpath(build_root, '.scons_config'), conf_dir = joinpath(build_root, '.scons_config'),
log_file = joinpath(build_root, 'scons_config.log'), log_file = joinpath(build_root, 'scons_config.log'),
custom_tests = { 'CheckLeading' : CheckLeading }) custom_tests = {
'CheckLeading' : CheckLeading,
'CheckMember' : CheckMember,
})
# Check for leading underscores. Don't really need to worry either # Check for leading underscores. Don't really need to worry either
# way so don't need to check the return code. # way so don't need to check the return code.
@ -964,6 +987,12 @@ def is_isa_kvm_compatible(isa):
return host_isa in isa_comp_table.get(isa, []) return host_isa in isa_comp_table.get(isa, [])
# Check if the exclude_host attribute is available. We want this to
# get accurate instruction counts in KVM.
main['HAVE_PERF_ATTR_EXCLUDE_HOST'] = conf.CheckMember(
'linux/perf_event.h', 'struct perf_event_attr', 'exclude_host')
###################################################################### ######################################################################
# #
# Finish the configuration # Finish the configuration
@ -1065,7 +1094,8 @@ sticky_vars.AddVariables(
# These variables get exported to #defines in config/*.hh (see src/SConscript). # These variables get exported to #defines in config/*.hh (see src/SConscript).
export_vars += ['USE_FENV', 'SS_COMPATIBLE_FP', 'TARGET_ISA', 'CP_ANNOTATE', export_vars += ['USE_FENV', 'SS_COMPATIBLE_FP', 'TARGET_ISA', 'CP_ANNOTATE',
'USE_POSIX_CLOCK', 'PROTOCOL', 'HAVE_PROTOBUF'] 'USE_POSIX_CLOCK', 'PROTOCOL', 'HAVE_PROTOBUF',
'HAVE_PERF_ATTR_EXCLUDE_HOST']
################################################### ###################################################
# #
@ -1243,6 +1273,13 @@ for variant_path in variant_paths:
"target ISA combination" "target ISA combination"
env['USE_KVM'] = False env['USE_KVM'] = False
# Warn about missing optional functionality
if env['USE_KVM']:
if not main['HAVE_PERF_ATTR_EXCLUDE_HOST']:
print "Warning: perf_event headers lack support for the " \
"exclude_host attribute. KVM instruction counts will " \
"be inaccurate."
# Save sticky variable settings back to current variables file # Save sticky variable settings back to current variables file
sticky_vars.Save(current_vars_file, env) sticky_vars.Save(current_vars_file, env)

View file

@ -1133,6 +1133,12 @@ BaseKvmCPU::setupCounters()
cfgCycles.disabled(true) cfgCycles.disabled(true)
.pinned(true); .pinned(true);
// Try to exclude the host. We set both exclude_hv and
// exclude_host since different architectures use slightly
// different APIs in the kernel.
cfgCycles.exclude_hv(true)
.exclude_host(true);
if (perfControlledByTimer) { if (perfControlledByTimer) {
// We need to configure the cycles counter to send overflows // We need to configure the cycles counter to send overflows
// since we are going to use it to trigger timer signals that // since we are going to use it to trigger timer signals that
@ -1206,6 +1212,12 @@ BaseKvmCPU::setupInstCounter(uint64_t period)
PerfKvmCounterConfig cfgInstructions(PERF_TYPE_HARDWARE, PerfKvmCounterConfig cfgInstructions(PERF_TYPE_HARDWARE,
PERF_COUNT_HW_INSTRUCTIONS); PERF_COUNT_HW_INSTRUCTIONS);
// Try to exclude the host. We set both exclude_hv and
// exclude_host since different architectures use slightly
// different APIs in the kernel.
cfgInstructions.exclude_hv(true)
.exclude_host(true);
if (period) { if (period) {
// Setup a sampling counter if that has been requested. // Setup a sampling counter if that has been requested.
cfgInstructions.wakeupEvents(1) cfgInstructions.wakeupEvents(1)

View file

@ -45,6 +45,8 @@
#include <inttypes.h> #include <inttypes.h>
#include "config/have_perf_attr_exclude_host.hh"
/** /**
* PerfEvent counter configuration. * PerfEvent counter configuration.
*/ */
@ -125,6 +127,39 @@ class PerfKvmCounterConfig
return *this; return *this;
} }
/**
* Exclude the events from the host (i.e., only include events
* from the guest system).
*
* Intel CPUs seem to support this attribute from Linux 3.2 and
* onwards. Non-x86 architectures currently ignore this attribute
* (Linux 3.12-rc5).
*
* @warn This attribute is ignored if it isn't present in the
* kernel headers or if the kernel doesn't support it.
*
* @param val true to exclude host events
*/
PerfKvmCounterConfig &exclude_host(bool val) {
#if HAVE_PERF_ATTR_EXCLUDE_HOST == 1
attr.exclude_host = val;
#endif
return *this;
}
/**
* Exclude the hyper visor (i.e., only include events from the
* guest system).
*
* @warn This is attribute only seems to be ignored on Intel.
*
* @param val true to exclude host events
*/
PerfKvmCounterConfig &exclude_hv(bool val) {
attr.exclude_hv = val;
return *this;
}
/** Underlying perf_event_attr structure describing the counter */ /** Underlying perf_event_attr structure describing the counter */
struct perf_event_attr attr; struct perf_event_attr attr;
}; };