blob: 71551b7527cceae1be3c1369236b319ba53373f7 [file] [log] [blame] [edit]
use perf_event::events::{Cache, CacheOp, CacheResult, Hardware, WhichCache};
use perf_event::{Builder, Group};
fn main() -> std::io::Result<()> {
const ACCESS: Cache = Cache {
which: WhichCache::L1D,
operation: CacheOp::READ,
result: CacheResult::ACCESS,
};
const MISS: Cache = Cache {
result: CacheResult::MISS,
..ACCESS
};
let mut group = Group::new()?;
let access_counter = Builder::new().group(&mut group).kind(ACCESS).build()?;
let miss_counter = Builder::new().group(&mut group).kind(MISS).build()?;
let branches = Builder::new()
.group(&mut group)
.kind(Hardware::BRANCH_INSTRUCTIONS)
.build()?;
let missed_branches = Builder::new()
.group(&mut group)
.kind(Hardware::BRANCH_MISSES)
.build()?;
let insns = Builder::new()
.group(&mut group)
.kind(Hardware::INSTRUCTIONS)
.build()?;
let cycles = Builder::new()
.group(&mut group)
.kind(Hardware::CPU_CYCLES)
.build()?;
// Note that if you add more counters than you actually have hardware for,
// the kernel will time-slice them, which means you may get no coverage for
// short measurements. See the documentation.
//
// On my machine, this program won't collect any data unless I disable the
// NMI watchdog, as described in the documentation for `Group`. My machine
// has four counters, and this program tries to use all of them, but the NMI
// watchdog uses one up.
let mut vec = (0..=100000).collect::<Vec<_>>();
group.enable()?;
vec.sort();
println!("{:?}", &vec[0..10]);
group.disable()?;
let counts = group.read()?;
println!(
"enabled for {}ns, actually running for {}ns",
counts.time_enabled(),
counts.time_running()
);
if counts.time_running() == 0 {
println!("Group was never running; no results available.");
return Ok(());
}
if counts.time_running() < counts.time_enabled() {
println!("Counts cover only a portion of the execution.");
}
println!(
"L1D cache misses/references: {} / {} ({:.0}%)",
counts[&miss_counter],
counts[&access_counter],
(counts[&miss_counter] as f64 / counts[&access_counter] as f64) * 100.0
);
println!(
"branch prediction misses/total: {} / {} ({:.0}%)",
counts[&missed_branches],
counts[&branches],
(counts[&missed_branches] as f64 / counts[&branches] as f64) * 100.0
);
println!(
"{} instructions, {} cycles ({:.2} cpi)",
counts[&insns],
counts[&cycles],
counts[&cycles] as f64 / counts[&insns] as f64
);
// You can iterate over a `Counts` value:
for (id, value) in &counts {
println!("Counter id {} has value {}", id, value);
}
Ok(())
}