use perf_event::{Builder, Group}; use perf_event::events::{Cache, CacheOp, CacheResult, Hardware, WhichCache}; fn main() -> std::io::Result<()> { const ACCESS: Cache = Cache { which: WhichCache::L1D, operation: CacheOp::READ, result: CacheResult::ACCESS, }; const MISS: Cache = Cache { result: CacheResult::MISS, ..ACCESS }; let mut group = Group::new()?; let access_counter = Builder::new().group(&mut group).kind(ACCESS).build()?; let miss_counter = Builder::new().group(&mut group).kind(MISS).build()?; let branches = Builder::new().group(&mut group).kind(Hardware::BRANCH_INSTRUCTIONS).build()?; let missed_branches = Builder::new().group(&mut group).kind(Hardware::BRANCH_MISSES).build()?; // Note that if you add more counters than you actually have hardware for, // the kernel will time-slice them, which means you may get no coverage for // short measurements. See the documentation. let vec = (0..=51).collect::>(); group.enable()?; println!("{:?}", vec); group.disable()?; let counts = group.read()?; println!("L1D cache misses/references: {} / {} ({:.0}%)", counts[&miss_counter], counts[&access_counter], (counts[&miss_counter] as f64 / counts[&access_counter] as f64) * 100.0); println!("branch prediction misses/total: {} / {} ({:.0}%)", counts[&missed_branches], counts[&branches], (counts[&missed_branches] as f64 / counts[&branches] as f64) * 100.0); // You can iterate over a `Counts` value: for (id, value) in &counts { println!("Counter id {} has value {}", id, value); } Ok(()) }