kvm: Set the perf exclude_host attribute if available
The performance counting framework in Linux 3.2 and onwards supports an attribute to exclude events generated by the host when running KVM. Setting this attribute allows us to get more reliable measurements of the guest machine. For example, on a highly loaded system, the instruction counts from the guest can be severely distorted by the host kernel (e.g., by page fault handlers). This changeset introduces a check for the attribute and enables it in the KVM CPU if present.
This commit is contained in:
parent
d4f205ea2f
commit
4b8be6a90b
3 changed files with 86 additions and 2 deletions
41
SConstruct
41
SConstruct
|
@ -794,12 +794,35 @@ def CheckLeading(context):
|
||||||
context.Result(ret)
|
context.Result(ret)
|
||||||
return ret
|
return ret
|
||||||
|
|
||||||
|
# Add a custom Check function to test for structure members.
|
||||||
|
def CheckMember(context, include, decl, member, include_quotes="<>"):
|
||||||
|
context.Message("Checking for member %s in %s..." %
|
||||||
|
(member, decl))
|
||||||
|
text = """
|
||||||
|
#include %(header)s
|
||||||
|
int main(){
|
||||||
|
%(decl)s test;
|
||||||
|
(void)test.%(member)s;
|
||||||
|
return 0;
|
||||||
|
};
|
||||||
|
""" % { "header" : include_quotes[0] + include + include_quotes[1],
|
||||||
|
"decl" : decl,
|
||||||
|
"member" : member,
|
||||||
|
}
|
||||||
|
|
||||||
|
ret = context.TryCompile(text, extension=".cc")
|
||||||
|
context.Result(ret)
|
||||||
|
return ret
|
||||||
|
|
||||||
# Platform-specific configuration. Note again that we assume that all
|
# Platform-specific configuration. Note again that we assume that all
|
||||||
# builds under a given build root run on the same host platform.
|
# builds under a given build root run on the same host platform.
|
||||||
conf = Configure(main,
|
conf = Configure(main,
|
||||||
conf_dir = joinpath(build_root, '.scons_config'),
|
conf_dir = joinpath(build_root, '.scons_config'),
|
||||||
log_file = joinpath(build_root, 'scons_config.log'),
|
log_file = joinpath(build_root, 'scons_config.log'),
|
||||||
custom_tests = { 'CheckLeading' : CheckLeading })
|
custom_tests = {
|
||||||
|
'CheckLeading' : CheckLeading,
|
||||||
|
'CheckMember' : CheckMember,
|
||||||
|
})
|
||||||
|
|
||||||
# Check for leading underscores. Don't really need to worry either
|
# Check for leading underscores. Don't really need to worry either
|
||||||
# way so don't need to check the return code.
|
# way so don't need to check the return code.
|
||||||
|
@ -964,6 +987,12 @@ def is_isa_kvm_compatible(isa):
|
||||||
return host_isa in isa_comp_table.get(isa, [])
|
return host_isa in isa_comp_table.get(isa, [])
|
||||||
|
|
||||||
|
|
||||||
|
# Check if the exclude_host attribute is available. We want this to
|
||||||
|
# get accurate instruction counts in KVM.
|
||||||
|
main['HAVE_PERF_ATTR_EXCLUDE_HOST'] = conf.CheckMember(
|
||||||
|
'linux/perf_event.h', 'struct perf_event_attr', 'exclude_host')
|
||||||
|
|
||||||
|
|
||||||
######################################################################
|
######################################################################
|
||||||
#
|
#
|
||||||
# Finish the configuration
|
# Finish the configuration
|
||||||
|
@ -1065,7 +1094,8 @@ sticky_vars.AddVariables(
|
||||||
|
|
||||||
# These variables get exported to #defines in config/*.hh (see src/SConscript).
|
# These variables get exported to #defines in config/*.hh (see src/SConscript).
|
||||||
export_vars += ['USE_FENV', 'SS_COMPATIBLE_FP', 'TARGET_ISA', 'CP_ANNOTATE',
|
export_vars += ['USE_FENV', 'SS_COMPATIBLE_FP', 'TARGET_ISA', 'CP_ANNOTATE',
|
||||||
'USE_POSIX_CLOCK', 'PROTOCOL', 'HAVE_PROTOBUF']
|
'USE_POSIX_CLOCK', 'PROTOCOL', 'HAVE_PROTOBUF',
|
||||||
|
'HAVE_PERF_ATTR_EXCLUDE_HOST']
|
||||||
|
|
||||||
###################################################
|
###################################################
|
||||||
#
|
#
|
||||||
|
@ -1243,6 +1273,13 @@ for variant_path in variant_paths:
|
||||||
"target ISA combination"
|
"target ISA combination"
|
||||||
env['USE_KVM'] = False
|
env['USE_KVM'] = False
|
||||||
|
|
||||||
|
# Warn about missing optional functionality
|
||||||
|
if env['USE_KVM']:
|
||||||
|
if not main['HAVE_PERF_ATTR_EXCLUDE_HOST']:
|
||||||
|
print "Warning: perf_event headers lack support for the " \
|
||||||
|
"exclude_host attribute. KVM instruction counts will " \
|
||||||
|
"be inaccurate."
|
||||||
|
|
||||||
# Save sticky variable settings back to current variables file
|
# Save sticky variable settings back to current variables file
|
||||||
sticky_vars.Save(current_vars_file, env)
|
sticky_vars.Save(current_vars_file, env)
|
||||||
|
|
||||||
|
|
|
@ -1133,6 +1133,12 @@ BaseKvmCPU::setupCounters()
|
||||||
cfgCycles.disabled(true)
|
cfgCycles.disabled(true)
|
||||||
.pinned(true);
|
.pinned(true);
|
||||||
|
|
||||||
|
// Try to exclude the host. We set both exclude_hv and
|
||||||
|
// exclude_host since different architectures use slightly
|
||||||
|
// different APIs in the kernel.
|
||||||
|
cfgCycles.exclude_hv(true)
|
||||||
|
.exclude_host(true);
|
||||||
|
|
||||||
if (perfControlledByTimer) {
|
if (perfControlledByTimer) {
|
||||||
// We need to configure the cycles counter to send overflows
|
// We need to configure the cycles counter to send overflows
|
||||||
// since we are going to use it to trigger timer signals that
|
// since we are going to use it to trigger timer signals that
|
||||||
|
@ -1206,6 +1212,12 @@ BaseKvmCPU::setupInstCounter(uint64_t period)
|
||||||
PerfKvmCounterConfig cfgInstructions(PERF_TYPE_HARDWARE,
|
PerfKvmCounterConfig cfgInstructions(PERF_TYPE_HARDWARE,
|
||||||
PERF_COUNT_HW_INSTRUCTIONS);
|
PERF_COUNT_HW_INSTRUCTIONS);
|
||||||
|
|
||||||
|
// Try to exclude the host. We set both exclude_hv and
|
||||||
|
// exclude_host since different architectures use slightly
|
||||||
|
// different APIs in the kernel.
|
||||||
|
cfgInstructions.exclude_hv(true)
|
||||||
|
.exclude_host(true);
|
||||||
|
|
||||||
if (period) {
|
if (period) {
|
||||||
// Setup a sampling counter if that has been requested.
|
// Setup a sampling counter if that has been requested.
|
||||||
cfgInstructions.wakeupEvents(1)
|
cfgInstructions.wakeupEvents(1)
|
||||||
|
|
|
@ -45,6 +45,8 @@
|
||||||
|
|
||||||
#include <inttypes.h>
|
#include <inttypes.h>
|
||||||
|
|
||||||
|
#include "config/have_perf_attr_exclude_host.hh"
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* PerfEvent counter configuration.
|
* PerfEvent counter configuration.
|
||||||
*/
|
*/
|
||||||
|
@ -125,6 +127,39 @@ class PerfKvmCounterConfig
|
||||||
return *this;
|
return *this;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Exclude the events from the host (i.e., only include events
|
||||||
|
* from the guest system).
|
||||||
|
*
|
||||||
|
* Intel CPUs seem to support this attribute from Linux 3.2 and
|
||||||
|
* onwards. Non-x86 architectures currently ignore this attribute
|
||||||
|
* (Linux 3.12-rc5).
|
||||||
|
*
|
||||||
|
* @warn This attribute is ignored if it isn't present in the
|
||||||
|
* kernel headers or if the kernel doesn't support it.
|
||||||
|
*
|
||||||
|
* @param val true to exclude host events
|
||||||
|
*/
|
||||||
|
PerfKvmCounterConfig &exclude_host(bool val) {
|
||||||
|
#if HAVE_PERF_ATTR_EXCLUDE_HOST == 1
|
||||||
|
attr.exclude_host = val;
|
||||||
|
#endif
|
||||||
|
return *this;
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Exclude the hyper visor (i.e., only include events from the
|
||||||
|
* guest system).
|
||||||
|
*
|
||||||
|
* @warn This is attribute only seems to be ignored on Intel.
|
||||||
|
*
|
||||||
|
* @param val true to exclude host events
|
||||||
|
*/
|
||||||
|
PerfKvmCounterConfig &exclude_hv(bool val) {
|
||||||
|
attr.exclude_hv = val;
|
||||||
|
return *this;
|
||||||
|
}
|
||||||
|
|
||||||
/** Underlying perf_event_attr structure describing the counter */
|
/** Underlying perf_event_attr structure describing the counter */
|
||||||
struct perf_event_attr attr;
|
struct perf_event_attr attr;
|
||||||
};
|
};
|
||||||
|
|
Loading…
Reference in a new issue