summaryrefslogtreecommitdiffstats
path: root/compiler/rustc_codegen_llvm/src/coverageinfo/mapgen.rs
diff options
context:
space:
mode:
Diffstat (limited to 'compiler/rustc_codegen_llvm/src/coverageinfo/mapgen.rs')
-rw-r--r--compiler/rustc_codegen_llvm/src/coverageinfo/mapgen.rs287
1 files changed, 204 insertions, 83 deletions
diff --git a/compiler/rustc_codegen_llvm/src/coverageinfo/mapgen.rs b/compiler/rustc_codegen_llvm/src/coverageinfo/mapgen.rs
index d4e775256..274e0aeaa 100644
--- a/compiler/rustc_codegen_llvm/src/coverageinfo/mapgen.rs
+++ b/compiler/rustc_codegen_llvm/src/coverageinfo/mapgen.rs
@@ -1,18 +1,20 @@
use crate::common::CodegenCx;
use crate::coverageinfo;
use crate::coverageinfo::ffi::CounterMappingRegion;
-use crate::coverageinfo::map_data::FunctionCoverage;
+use crate::coverageinfo::map_data::{FunctionCoverage, FunctionCoverageCollector};
use crate::llvm;
-use rustc_codegen_ssa::traits::ConstMethods;
-use rustc_data_structures::fx::FxIndexSet;
+use itertools::Itertools as _;
+use rustc_codegen_ssa::traits::{BaseTypeMethods, ConstMethods};
+use rustc_data_structures::fx::{FxIndexMap, FxIndexSet};
use rustc_hir::def::DefKind;
use rustc_hir::def_id::DefId;
use rustc_index::IndexVec;
use rustc_middle::bug;
-use rustc_middle::middle::codegen_fn_attrs::CodegenFnAttrFlags;
+use rustc_middle::mir;
use rustc_middle::mir::coverage::CodeRegion;
-use rustc_middle::ty::TyCtxt;
+use rustc_middle::ty::{self, TyCtxt};
+use rustc_span::def_id::DefIdSet;
use rustc_span::Symbol;
/// Generates and exports the Coverage Map.
@@ -56,21 +58,40 @@ pub fn finalize(cx: &CodegenCx<'_, '_>) {
return;
}
- let mut global_file_table = GlobalFileTable::new(tcx);
+ let function_coverage_entries = function_coverage_map
+ .into_iter()
+ .map(|(instance, function_coverage)| (instance, function_coverage.into_finished()))
+ .collect::<Vec<_>>();
+
+ let all_file_names =
+ function_coverage_entries.iter().flat_map(|(_, fn_cov)| fn_cov.all_file_names());
+ let global_file_table = GlobalFileTable::new(all_file_names);
+
+ // Encode all filenames referenced by coverage mappings in this CGU.
+ let filenames_buffer = global_file_table.make_filenames_buffer(tcx);
+
+ let filenames_size = filenames_buffer.len();
+ let filenames_val = cx.const_bytes(&filenames_buffer);
+ let filenames_ref = coverageinfo::hash_bytes(&filenames_buffer);
+
+ // Generate the coverage map header, which contains the filenames used by
+ // this CGU's coverage mappings, and store it in a well-known global.
+ let cov_data_val = generate_coverage_map(cx, version, filenames_size, filenames_val);
+ coverageinfo::save_cov_data_to_mod(cx, cov_data_val);
+
+ let mut unused_function_names = Vec::new();
+ let covfun_section_name = coverageinfo::covfun_section_name(cx);
// Encode coverage mappings and generate function records
- let mut function_data = Vec::new();
- for (instance, mut function_coverage) in function_coverage_map {
+ for (instance, function_coverage) in function_coverage_entries {
debug!("Generate function coverage for {}, {:?}", cx.codegen_unit.name(), instance);
- function_coverage.simplify_expressions();
- let function_coverage = function_coverage;
let mangled_function_name = tcx.symbol_name(instance).name;
let source_hash = function_coverage.source_hash();
let is_used = function_coverage.is_used();
let coverage_mapping_buffer =
- encode_mappings_for_function(&mut global_file_table, &function_coverage);
+ encode_mappings_for_function(&global_file_table, &function_coverage);
if coverage_mapping_buffer.is_empty() {
if function_coverage.is_used() {
@@ -84,21 +105,10 @@ pub fn finalize(cx: &CodegenCx<'_, '_>) {
}
}
- function_data.push((mangled_function_name, source_hash, is_used, coverage_mapping_buffer));
- }
-
- // Encode all filenames referenced by counters/expressions in this module
- let filenames_buffer = global_file_table.into_filenames_buffer();
-
- let filenames_size = filenames_buffer.len();
- let filenames_val = cx.const_bytes(&filenames_buffer);
- let filenames_ref = coverageinfo::hash_bytes(&filenames_buffer);
-
- // Generate the LLVM IR representation of the coverage map and store it in a well-known global
- let cov_data_val = generate_coverage_map(cx, version, filenames_size, filenames_val);
+ if !is_used {
+ unused_function_names.push(mangled_function_name);
+ }
- let covfun_section_name = coverageinfo::covfun_section_name(cx);
- for (mangled_function_name, source_hash, is_used, coverage_mapping_buffer) in function_data {
save_function_record(
cx,
&covfun_section_name,
@@ -110,90 +120,143 @@ pub fn finalize(cx: &CodegenCx<'_, '_>) {
);
}
- // Save the coverage data value to LLVM IR
- coverageinfo::save_cov_data_to_mod(cx, cov_data_val);
+ // For unused functions, we need to take their mangled names and store them
+ // in a specially-named global array. LLVM's `InstrProfiling` pass will
+ // detect this global and include those names in its `__llvm_prf_names`
+ // section. (See `llvm/lib/Transforms/Instrumentation/InstrProfiling.cpp`.)
+ if !unused_function_names.is_empty() {
+ assert!(cx.codegen_unit.is_code_coverage_dead_code_cgu());
+
+ let name_globals = unused_function_names
+ .into_iter()
+ .map(|mangled_function_name| cx.const_str(mangled_function_name).0)
+ .collect::<Vec<_>>();
+ let initializer = cx.const_array(cx.type_ptr(), &name_globals);
+
+ let array = llvm::add_global(cx.llmod, cx.val_ty(initializer), "__llvm_coverage_names");
+ llvm::set_global_constant(array, true);
+ llvm::set_linkage(array, llvm::Linkage::InternalLinkage);
+ llvm::set_initializer(array, initializer);
+ }
}
+/// Maps "global" (per-CGU) file ID numbers to their underlying filenames.
struct GlobalFileTable {
- global_file_table: FxIndexSet<Symbol>,
+ /// This "raw" table doesn't include the working dir, so a filename's
+ /// global ID is its index in this set **plus one**.
+ raw_file_table: FxIndexSet<Symbol>,
}
impl GlobalFileTable {
- fn new(tcx: TyCtxt<'_>) -> Self {
- let mut global_file_table = FxIndexSet::default();
+ fn new(all_file_names: impl IntoIterator<Item = Symbol>) -> Self {
+ // Collect all of the filenames into a set. Filenames usually come in
+ // contiguous runs, so we can dedup adjacent ones to save work.
+ let mut raw_file_table = all_file_names.into_iter().dedup().collect::<FxIndexSet<Symbol>>();
+
+ // Sort the file table by its actual string values, not the arbitrary
+ // ordering of its symbols.
+ raw_file_table.sort_unstable_by(|a, b| a.as_str().cmp(b.as_str()));
+
+ Self { raw_file_table }
+ }
+
+ fn global_file_id_for_file_name(&self, file_name: Symbol) -> u32 {
+ let raw_id = self.raw_file_table.get_index_of(&file_name).unwrap_or_else(|| {
+ bug!("file name not found in prepared global file table: {file_name}");
+ });
+ // The raw file table doesn't include an entry for the working dir
+ // (which has ID 0), so add 1 to get the correct ID.
+ (raw_id + 1) as u32
+ }
+
+ fn make_filenames_buffer(&self, tcx: TyCtxt<'_>) -> Vec<u8> {
// LLVM Coverage Mapping Format version 6 (zero-based encoded as 5)
// requires setting the first filename to the compilation directory.
// Since rustc generates coverage maps with relative paths, the
// compilation directory can be combined with the relative paths
// to get absolute paths, if needed.
- let working_dir = Symbol::intern(
- &tcx.sess.opts.working_dir.remapped_path_if_available().to_string_lossy(),
- );
- global_file_table.insert(working_dir);
- Self { global_file_table }
- }
-
- fn global_file_id_for_file_name(&mut self, file_name: Symbol) -> u32 {
- let (global_file_id, _) = self.global_file_table.insert_full(file_name);
- global_file_id as u32
- }
-
- fn into_filenames_buffer(self) -> Vec<u8> {
- // This method takes `self` so that the caller can't accidentally
- // modify the original file table after encoding it into a buffer.
+ use rustc_session::RemapFileNameExt;
+ let working_dir: &str = &tcx.sess.opts.working_dir.for_codegen(&tcx.sess).to_string_lossy();
llvm::build_byte_buffer(|buffer| {
coverageinfo::write_filenames_section_to_buffer(
- self.global_file_table.iter().map(Symbol::as_str),
+ // Insert the working dir at index 0, before the other filenames.
+ std::iter::once(working_dir).chain(self.raw_file_table.iter().map(Symbol::as_str)),
buffer,
);
})
}
}
+rustc_index::newtype_index! {
+ // Tell the newtype macro to not generate `Encode`/`Decode` impls.
+ #[custom_encodable]
+ struct LocalFileId {}
+}
+
+/// Holds a mapping from "local" (per-function) file IDs to "global" (per-CGU)
+/// file IDs.
+#[derive(Default)]
+struct VirtualFileMapping {
+ local_to_global: IndexVec<LocalFileId, u32>,
+ global_to_local: FxIndexMap<u32, LocalFileId>,
+}
+
+impl VirtualFileMapping {
+ fn local_id_for_global(&mut self, global_file_id: u32) -> LocalFileId {
+ *self
+ .global_to_local
+ .entry(global_file_id)
+ .or_insert_with(|| self.local_to_global.push(global_file_id))
+ }
+
+ fn into_vec(self) -> Vec<u32> {
+ self.local_to_global.raw
+ }
+}
+
/// Using the expressions and counter regions collected for a single function,
/// generate the variable-sized payload of its corresponding `__llvm_covfun`
/// entry. The payload is returned as a vector of bytes.
///
/// Newly-encountered filenames will be added to the global file table.
fn encode_mappings_for_function(
- global_file_table: &mut GlobalFileTable,
+ global_file_table: &GlobalFileTable,
function_coverage: &FunctionCoverage<'_>,
) -> Vec<u8> {
- let (expressions, counter_regions) = function_coverage.get_expressions_and_counter_regions();
-
- let mut counter_regions = counter_regions.collect::<Vec<_>>();
+ let counter_regions = function_coverage.counter_regions();
if counter_regions.is_empty() {
return Vec::new();
}
- let mut virtual_file_mapping = IndexVec::<u32, u32>::new();
+ let expressions = function_coverage.counter_expressions().collect::<Vec<_>>();
+
+ let mut virtual_file_mapping = VirtualFileMapping::default();
let mut mapping_regions = Vec::with_capacity(counter_regions.len());
- // Sort the list of (counter, region) mapping pairs by region, so that they
- // can be grouped by filename. Prepare file IDs for each filename, and
- // prepare the mapping data so that we can pass it through FFI to LLVM.
- counter_regions.sort_by_key(|(_counter, region)| *region);
- for counter_regions_for_file in
- counter_regions.group_by(|(_, a), (_, b)| a.file_name == b.file_name)
+ // Group mappings into runs with the same filename, preserving the order
+ // yielded by `FunctionCoverage`.
+ // Prepare file IDs for each filename, and prepare the mapping data so that
+ // we can pass it through FFI to LLVM.
+ for (file_name, counter_regions_for_file) in
+ &counter_regions.group_by(|(_counter, region)| region.file_name)
{
- // Look up (or allocate) the global file ID for this filename.
- let file_name = counter_regions_for_file[0].1.file_name;
+ // Look up the global file ID for this filename.
let global_file_id = global_file_table.global_file_id_for_file_name(file_name);
// Associate that global file ID with a local file ID for this function.
- let local_file_id: u32 = virtual_file_mapping.push(global_file_id);
- debug!(" file id: local {local_file_id} => global {global_file_id} = '{file_name:?}'");
+ let local_file_id = virtual_file_mapping.local_id_for_global(global_file_id);
+ debug!(" file id: {local_file_id:?} => global {global_file_id} = '{file_name:?}'");
// For each counter/region pair in this function+file, convert it to a
// form suitable for FFI.
- for &(counter, region) in counter_regions_for_file {
+ for (counter, region) in counter_regions_for_file {
let CodeRegion { file_name: _, start_line, start_col, end_line, end_col } = *region;
debug!("Adding counter {counter:?} to map for {region:?}");
mapping_regions.push(CounterMappingRegion::code_region(
counter,
- local_file_id,
+ local_file_id.as_u32(),
start_line,
start_col,
end_line,
@@ -205,7 +268,7 @@ fn encode_mappings_for_function(
// Encode the function's coverage mappings into a buffer.
llvm::build_byte_buffer(|buffer| {
coverageinfo::write_mapping_to_buffer(
- virtual_file_mapping.raw,
+ virtual_file_mapping.into_vec(),
expressions,
mapping_regions,
buffer,
@@ -289,13 +352,12 @@ fn save_function_record(
/// `-Clink-dead-code` will not generate code for unused generic functions.)
///
/// We can find the unused functions (including generic functions) by the set difference of all MIR
-/// `DefId`s (`tcx` query `mir_keys`) minus the codegenned `DefId`s (`tcx` query
-/// `codegened_and_inlined_items`).
+/// `DefId`s (`tcx` query `mir_keys`) minus the codegenned `DefId`s (`codegenned_and_inlined_items`).
///
-/// These unused functions are then codegen'd in one of the CGUs which is marked as the
-/// "code coverage dead code cgu" during the partitioning process. This prevents us from generating
-/// code regions for the same function more than once which can lead to linker errors regarding
-/// duplicate symbols.
+/// These unused functions don't need to be codegenned, but we do need to add them to the function
+/// coverage map (in a single designated CGU) so that we still emit coverage mappings for them.
+/// We also end up adding their symbol names to a special global array that LLVM will include in
+/// its embedded coverage data.
fn add_unused_functions(cx: &CodegenCx<'_, '_>) {
assert!(cx.codegen_unit.is_code_coverage_dead_code_cgu());
@@ -315,7 +377,7 @@ fn add_unused_functions(cx: &CodegenCx<'_, '_>) {
// generic functions from consideration as well.
if !matches!(
kind,
- DefKind::Fn | DefKind::AssocFn | DefKind::Closure | DefKind::Generator
+ DefKind::Fn | DefKind::AssocFn | DefKind::Closure | DefKind::Coroutine
) {
return None;
}
@@ -326,21 +388,80 @@ fn add_unused_functions(cx: &CodegenCx<'_, '_>) {
})
.collect();
- let codegenned_def_ids = tcx.codegened_and_inlined_items(());
+ let codegenned_def_ids = codegenned_and_inlined_items(tcx);
- for non_codegenned_def_id in
- eligible_def_ids.into_iter().filter(|id| !codegenned_def_ids.contains(id))
- {
- let codegen_fn_attrs = tcx.codegen_fn_attrs(non_codegenned_def_id);
-
- // If a function is marked `#[coverage(off)]`, then skip generating a
- // dead code stub for it.
- if codegen_fn_attrs.flags.contains(CodegenFnAttrFlags::NO_COVERAGE) {
- debug!("skipping unused fn marked #[coverage(off)]: {:?}", non_codegenned_def_id);
+ // For each `DefId` that should have coverage instrumentation but wasn't
+ // codegenned, add it to the function coverage map as an unused function.
+ for def_id in eligible_def_ids.into_iter().filter(|id| !codegenned_def_ids.contains(id)) {
+ // Skip any function that didn't have coverage data added to it by the
+ // coverage instrumentor.
+ let body = tcx.instance_mir(ty::InstanceDef::Item(def_id));
+ let Some(function_coverage_info) = body.function_coverage_info.as_deref() else {
continue;
+ };
+
+ debug!("generating unused fn: {def_id:?}");
+ let instance = declare_unused_fn(tcx, def_id);
+ add_unused_function_coverage(cx, instance, function_coverage_info);
+ }
+}
+
+/// All items participating in code generation together with (instrumented)
+/// items inlined into them.
+fn codegenned_and_inlined_items(tcx: TyCtxt<'_>) -> DefIdSet {
+ let (items, cgus) = tcx.collect_and_partition_mono_items(());
+ let mut visited = DefIdSet::default();
+ let mut result = items.clone();
+
+ for cgu in cgus {
+ for item in cgu.items().keys() {
+ if let mir::mono::MonoItem::Fn(ref instance) = item {
+ let did = instance.def_id();
+ if !visited.insert(did) {
+ continue;
+ }
+ let body = tcx.instance_mir(instance.def);
+ for block in body.basic_blocks.iter() {
+ for statement in &block.statements {
+ let mir::StatementKind::Coverage(_) = statement.kind else { continue };
+ let scope = statement.source_info.scope;
+ if let Some(inlined) = scope.inlined_instance(&body.source_scopes) {
+ result.insert(inlined.def_id());
+ }
+ }
+ }
+ }
}
+ }
- debug!("generating unused fn: {:?}", non_codegenned_def_id);
- cx.define_unused_fn(non_codegenned_def_id);
+ result
+}
+
+fn declare_unused_fn<'tcx>(tcx: TyCtxt<'tcx>, def_id: DefId) -> ty::Instance<'tcx> {
+ ty::Instance::new(
+ def_id,
+ ty::GenericArgs::for_item(tcx, def_id, |param, _| {
+ if let ty::GenericParamDefKind::Lifetime = param.kind {
+ tcx.lifetimes.re_erased.into()
+ } else {
+ tcx.mk_param_from_def(param)
+ }
+ }),
+ )
+}
+
+fn add_unused_function_coverage<'tcx>(
+ cx: &CodegenCx<'_, 'tcx>,
+ instance: ty::Instance<'tcx>,
+ function_coverage_info: &'tcx mir::coverage::FunctionCoverageInfo,
+) {
+ // An unused function's mappings will automatically be rewritten to map to
+ // zero, because none of its counters/expressions are marked as seen.
+ let function_coverage = FunctionCoverageCollector::unused(instance, function_coverage_info);
+
+ if let Some(coverage_context) = cx.coverage_context() {
+ coverage_context.function_coverage_map.borrow_mut().insert(instance, function_coverage);
+ } else {
+ bug!("Could not get the `coverage_context`");
}
}