Skip to content

Commit adf9b5f

Browse files
authored
Rollup merge of #133418 - Zalathar:spans, r=jieyouxu
coverage: Store coverage source regions as `Span` until codegen. Historically, coverage spans were converted into line/column coordinates during the MIR instrumentation pass. This PR moves that conversion step into codegen, so that coverage spans spend most of their time stored as `Span` instead. In addition to being conceptually nicer, this also reduces the size of coverage mappings in MIR, because `Span` is smaller than 4x `u32`. --- There should be no changes to coverage output.
2 parents af1ca15 + 2748009 commit adf9b5f

13 files changed

+251
-285
lines changed

compiler/rustc_codegen_llvm/src/coverageinfo/ffi.rs

+10-26
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,4 @@
1-
use rustc_middle::mir::coverage::{CounterId, CovTerm, ExpressionId, SourceRegion};
2-
3-
use crate::coverageinfo::mapgen::LocalFileId;
1+
use rustc_middle::mir::coverage::{CounterId, CovTerm, ExpressionId};
42

53
/// Must match the layout of `LLVMRustCounterKind`.
64
#[derive(Copy, Clone, Debug)]
@@ -126,45 +124,31 @@ pub(crate) struct CoverageSpan {
126124
/// Local index into the function's local-to-global file ID table.
127125
/// The value at that index is itself an index into the coverage filename
128126
/// table in the CGU's `__llvm_covmap` section.
129-
file_id: u32,
127+
pub(crate) file_id: u32,
130128

131129
/// 1-based starting line of the source code span.
132-
start_line: u32,
130+
pub(crate) start_line: u32,
133131
/// 1-based starting column of the source code span.
134-
start_col: u32,
132+
pub(crate) start_col: u32,
135133
/// 1-based ending line of the source code span.
136-
end_line: u32,
134+
pub(crate) end_line: u32,
137135
/// 1-based ending column of the source code span. High bit must be unset.
138-
end_col: u32,
139-
}
140-
141-
impl CoverageSpan {
142-
pub(crate) fn from_source_region(
143-
local_file_id: LocalFileId,
144-
code_region: &SourceRegion,
145-
) -> Self {
146-
let file_id = local_file_id.as_u32();
147-
let &SourceRegion { start_line, start_col, end_line, end_col } = code_region;
148-
// Internally, LLVM uses the high bit of `end_col` to distinguish between
149-
// code regions and gap regions, so it can't be used by the column number.
150-
assert!(end_col & (1u32 << 31) == 0, "high bit of `end_col` must be unset: {end_col:#X}");
151-
Self { file_id, start_line, start_col, end_line, end_col }
152-
}
136+
pub(crate) end_col: u32,
153137
}
154138

155139
/// Must match the layout of `LLVMRustCoverageCodeRegion`.
156140
#[derive(Clone, Debug)]
157141
#[repr(C)]
158142
pub(crate) struct CodeRegion {
159-
pub(crate) span: CoverageSpan,
143+
pub(crate) cov_span: CoverageSpan,
160144
pub(crate) counter: Counter,
161145
}
162146

163147
/// Must match the layout of `LLVMRustCoverageBranchRegion`.
164148
#[derive(Clone, Debug)]
165149
#[repr(C)]
166150
pub(crate) struct BranchRegion {
167-
pub(crate) span: CoverageSpan,
151+
pub(crate) cov_span: CoverageSpan,
168152
pub(crate) true_counter: Counter,
169153
pub(crate) false_counter: Counter,
170154
}
@@ -173,7 +157,7 @@ pub(crate) struct BranchRegion {
173157
#[derive(Clone, Debug)]
174158
#[repr(C)]
175159
pub(crate) struct MCDCBranchRegion {
176-
pub(crate) span: CoverageSpan,
160+
pub(crate) cov_span: CoverageSpan,
177161
pub(crate) true_counter: Counter,
178162
pub(crate) false_counter: Counter,
179163
pub(crate) mcdc_branch_params: mcdc::BranchParameters,
@@ -183,6 +167,6 @@ pub(crate) struct MCDCBranchRegion {
183167
#[derive(Clone, Debug)]
184168
#[repr(C)]
185169
pub(crate) struct MCDCDecisionRegion {
186-
pub(crate) span: CoverageSpan,
170+
pub(crate) cov_span: CoverageSpan,
187171
pub(crate) mcdc_decision_params: mcdc::DecisionParameters,
188172
}

compiler/rustc_codegen_llvm/src/coverageinfo/map_data.rs

+7-7
Original file line number | Diff line number | Diff line change
@@ -3,9 +3,9 @@ use rustc_data_structures::fx::FxIndexSet;
33
use rustc_index::bit_set::BitSet;
44
use rustc_middle::mir::coverage::{
55
CounterId, CovTerm, Expression, ExpressionId, FunctionCoverageInfo, Mapping, MappingKind, Op,
6-
SourceRegion,
76
};
87
use rustc_middle::ty::Instance;
8+
use rustc_span::Span;
99
use tracing::{debug, instrument};
1010

1111
use crate::coverageinfo::ffi::{Counter, CounterExpression, ExprKind};
@@ -220,16 +220,16 @@ impl<'tcx> FunctionCoverage<'tcx> {
220220
})
221221
}
222222

223-
/// Converts this function's coverage mappings into an intermediate form
224-
/// that will be used by `mapgen` when preparing for FFI.
225-
pub(crate) fn counter_regions(
223+
/// Yields all this function's coverage mappings, after simplifying away
224+
/// unused counters and counter expressions.
225+
pub(crate) fn mapping_spans(
226226
&self,
227-
) -> impl Iterator<Item = (MappingKind, &SourceRegion)> + ExactSizeIterator {
227+
) -> impl Iterator<Item = (MappingKind, Span)> + ExactSizeIterator + Captures<'_> {
228228
self.function_coverage_info.mappings.iter().map(move |mapping| {
229-
let Mapping { kind, source_region } = mapping;
229+
let &Mapping { ref kind, span } = mapping;
230230
let kind =
231231
kind.map_terms(|term| if self.is_zero_term(term) { CovTerm::Zero } else { term });
232-
(kind, source_region)
232+
(kind, span)
233233
})
234234
}
235235

compiler/rustc_codegen_llvm/src/coverageinfo/mapgen.rs

+66-63
Original file line number | Diff line number | Diff line change
@@ -1,12 +1,14 @@
1+
mod spans;
2+
13
use std::ffi::CString;
2-
use std::iter;
4+
use std::sync::Arc;
35

46
use itertools::Itertools as _;
57
use rustc_abi::Align;
68
use rustc_codegen_ssa::traits::{
79
BaseTypeCodegenMethods, ConstCodegenMethods, StaticCodegenMethods,
810
};
9-
use rustc_data_structures::fx::{FxHashSet, FxIndexMap, FxIndexSet};
11+
use rustc_data_structures::fx::{FxHashSet, FxIndexMap};
1012
use rustc_hir::def_id::{DefId, LocalDefId};
1113
use rustc_index::IndexVec;
1214
use rustc_middle::mir::coverage::MappingKind;
@@ -15,7 +17,7 @@ use rustc_middle::{bug, mir};
1517
use rustc_session::RemapFileNameExt;
1618
use rustc_session::config::RemapPathScopeComponents;
1719
use rustc_span::def_id::DefIdSet;
18-
use rustc_span::{Span, Symbol};
20+
use rustc_span::{SourceFile, StableSourceFileId};
1921
use rustc_target::spec::HasTargetSpec;
2022
use tracing::debug;
2123

@@ -72,11 +74,11 @@ pub(crate) fn finalize(cx: &CodegenCx<'_, '_>) {
7274
.map(|(instance, function_coverage)| (instance, function_coverage.into_finished()))
7375
.collect::<Vec<_>>();
7476

75-
let all_file_names = function_coverage_entries
77+
let all_files = function_coverage_entries
7678
.iter()
7779
.map(|(_, fn_cov)| fn_cov.function_coverage_info.body_span)
78-
.map(|span| span_file_name(tcx, span));
79-
let global_file_table = GlobalFileTable::new(all_file_names);
80+
.map(|span| tcx.sess.source_map().lookup_source_file(span.lo()));
81+
let global_file_table = GlobalFileTable::new(all_files);
8082

8183
// Encode all filenames referenced by coverage mappings in this CGU.
8284
let filenames_buffer = global_file_table.make_filenames_buffer(tcx);
@@ -103,15 +105,8 @@ pub(crate) fn finalize(cx: &CodegenCx<'_, '_>) {
103105
encode_mappings_for_function(tcx, &global_file_table, &function_coverage);
104106

105107
if coverage_mapping_buffer.is_empty() {
106-
if function_coverage.is_used() {
107-
bug!(
108-
"A used function should have had coverage mapping data but did not: {}",
109-
mangled_function_name
110-
);
111-
} else {
112-
debug!("unused function had no coverage mapping data: {}", mangled_function_name);
113-
continue;
114-
}
108+
debug!("function has no mappings to embed; skipping");
109+
continue;
115110
}
116111

117112
if !is_used {
@@ -148,54 +143,62 @@ pub(crate) fn finalize(cx: &CodegenCx<'_, '_>) {
148143
}
149144
}
150145

151-
/// Maps "global" (per-CGU) file ID numbers to their underlying filenames.
146+
/// Maps "global" (per-CGU) file ID numbers to their underlying source files.
152147
struct GlobalFileTable {
153-
/// This "raw" table doesn't include the working dir, so a filename's
148+
/// This "raw" table doesn't include the working dir, so a file's
154149
/// global ID is its index in this set **plus one**.
155-
raw_file_table: FxIndexSet<Symbol>,
150+
raw_file_table: FxIndexMap<StableSourceFileId, Arc<SourceFile>>,
156151
}
157152

158153
impl GlobalFileTable {
159-
fn new(all_file_names: impl IntoIterator<Item = Symbol>) -> Self {
160-
// Collect all of the filenames into a set. Filenames usually come in
161-
// contiguous runs, so we can dedup adjacent ones to save work.
162-
let mut raw_file_table = all_file_names.into_iter().dedup().collect::<FxIndexSet<Symbol>>();
154+
fn new(all_files: impl IntoIterator<Item = Arc<SourceFile>>) -> Self {
155+
// Collect all of the files into a set. Files usually come in contiguous
156+
// runs, so we can dedup adjacent ones to save work.
157+
let mut raw_file_table = all_files
158+
.into_iter()
159+
.dedup_by(|a, b| a.stable_id == b.stable_id)
160+
.map(|f| (f.stable_id, f))
161+
.collect::<FxIndexMap<StableSourceFileId, Arc<SourceFile>>>();
163162

164-
// Sort the file table by its actual string values, not the arbitrary
165-
// ordering of its symbols.
166-
raw_file_table.sort_unstable_by(|a, b| a.as_str().cmp(b.as_str()));
163+
// Sort the file table by its underlying filenames.
164+
raw_file_table.sort_unstable_by(|_, a, _, b| {
165+
Ord::cmp(&a.name, &b.name).then_with(|| Ord::cmp(&a.stable_id, &b.stable_id))
166+
});
167167

168168
Self { raw_file_table }
169169
}
170170

171-
fn global_file_id_for_file_name(&self, file_name: Symbol) -> GlobalFileId {
172-
let raw_id = self.raw_file_table.get_index_of(&file_name).unwrap_or_else(|| {
173-
bug!("file name not found in prepared global file table: {file_name}");
171+
fn global_file_id_for_file(&self, file: &SourceFile) -> GlobalFileId {
172+
let raw_id = self.raw_file_table.get_index_of(&file.stable_id).unwrap_or_else(|| {
173+
bug!("file not found in prepared global file table: {:?}", file.name);
174174
});
175175
// The raw file table doesn't include an entry for the working dir
176176
// (which has ID 0), so add 1 to get the correct ID.
177177
GlobalFileId::from_usize(raw_id + 1)
178178
}
179179

180180
fn make_filenames_buffer(&self, tcx: TyCtxt<'_>) -> Vec<u8> {
181+
let mut table = Vec::with_capacity(self.raw_file_table.len() + 1);
182+
181183
// LLVM Coverage Mapping Format version 6 (zero-based encoded as 5)
182184
// requires setting the first filename to the compilation directory.
183185
// Since rustc generates coverage maps with relative paths, the
184186
// compilation directory can be combined with the relative paths
185187
// to get absolute paths, if needed.
186-
use rustc_session::RemapFileNameExt;
187-
use rustc_session::config::RemapPathScopeComponents;
188-
let working_dir: &str = &tcx
189-
.sess
190-
.opts
191-
.working_dir
192-
.for_scope(tcx.sess, RemapPathScopeComponents::MACRO)
193-
.to_string_lossy();
194-
195-
// Insert the working dir at index 0, before the other filenames.
196-
let filenames =
197-
iter::once(working_dir).chain(self.raw_file_table.iter().map(Symbol::as_str));
198-
llvm_cov::write_filenames_to_buffer(filenames)
188+
table.push(
189+
tcx.sess
190+
.opts
191+
.working_dir
192+
.for_scope(tcx.sess, RemapPathScopeComponents::MACRO)
193+
.to_string_lossy(),
194+
);
195+
196+
// Add the regular entries after the base directory.
197+
table.extend(self.raw_file_table.values().map(|file| {
198+
file.name.for_scope(tcx.sess, RemapPathScopeComponents::MACRO).to_string_lossy()
199+
}));
200+
201+
llvm_cov::write_filenames_to_buffer(table.iter().map(|f| f.as_ref()))
199202
}
200203
}
201204

@@ -208,7 +211,7 @@ rustc_index::newtype_index! {
208211
/// An index into a function's list of global file IDs. That underlying list
209212
/// of local-to-global mappings will be embedded in the function's record in
210213
/// the `__llvm_covfun` linker section.
211-
pub(crate) struct LocalFileId {}
214+
struct LocalFileId {}
212215
}
213216

214217
/// Holds a mapping from "local" (per-function) file IDs to "global" (per-CGU)
@@ -234,13 +237,6 @@ impl VirtualFileMapping {
234237
}
235238
}
236239

237-
fn span_file_name(tcx: TyCtxt<'_>, span: Span) -> Symbol {
238-
let source_file = tcx.sess.source_map().lookup_source_file(span.lo());
239-
let name =
240-
source_file.name.for_scope(tcx.sess, RemapPathScopeComponents::MACRO).to_string_lossy();
241-
Symbol::intern(&name)
242-
}
243-
244240
/// Using the expressions and counter regions collected for a single function,
245241
/// generate the variable-sized payload of its corresponding `__llvm_covfun`
246242
/// entry. The payload is returned as a vector of bytes.
@@ -251,11 +247,13 @@ fn encode_mappings_for_function(
251247
global_file_table: &GlobalFileTable,
252248
function_coverage: &FunctionCoverage<'_>,
253249
) -> Vec<u8> {
254-
let counter_regions = function_coverage.counter_regions();
255-
if counter_regions.is_empty() {
250+
let mapping_spans = function_coverage.mapping_spans();
251+
if mapping_spans.is_empty() {
256252
return Vec::new();
257253
}
258254

255+
let fn_cov_info = function_coverage.function_coverage_info;
256+
259257
let expressions = function_coverage.counter_expressions().collect::<Vec<_>>();
260258

261259
let mut virtual_file_mapping = VirtualFileMapping::default();
@@ -265,42 +263,47 @@ fn encode_mappings_for_function(
265263
let mut mcdc_decision_regions = vec![];
266264

267265
// Currently a function's mappings must all be in the same file as its body span.
268-
let file_name = span_file_name(tcx, function_coverage.function_coverage_info.body_span);
266+
let source_map = tcx.sess.source_map();
267+
let source_file = source_map.lookup_source_file(fn_cov_info.body_span.lo());
269268

270-
// Look up the global file ID for that filename.
271-
let global_file_id = global_file_table.global_file_id_for_file_name(file_name);
269+
// Look up the global file ID for that file.
270+
let global_file_id = global_file_table.global_file_id_for_file(&source_file);
272271

273272
// Associate that global file ID with a local file ID for this function.
274273
let local_file_id = virtual_file_mapping.local_id_for_global(global_file_id);
275-
debug!(" file id: {local_file_id:?} => {global_file_id:?} = '{file_name:?}'");
276274

277-
// For each counter/region pair in this function+file, convert it to a
275+
let make_cov_span = |span| {
276+
spans::make_coverage_span(local_file_id, source_map, fn_cov_info, &source_file, span)
277+
};
278+
279+
// For each coverage mapping span in this function+file, convert it to a
278280
// form suitable for FFI.
279-
for (mapping_kind, region) in counter_regions {
280-
debug!("Adding counter {mapping_kind:?} to map for {region:?}");
281-
let span = ffi::CoverageSpan::from_source_region(local_file_id, region);
281+
for (mapping_kind, span) in mapping_spans {
282+
debug!("Adding counter {mapping_kind:?} to map for {span:?}");
283+
let Some(cov_span) = make_cov_span(span) else { continue };
282284
match mapping_kind {
283285
MappingKind::Code(term) => {
284-
code_regions.push(ffi::CodeRegion { span, counter: ffi::Counter::from_term(term) });
286+
code_regions
287+
.push(ffi::CodeRegion { cov_span, counter: ffi::Counter::from_term(term) });
285288
}
286289
MappingKind::Branch { true_term, false_term } => {
287290
branch_regions.push(ffi::BranchRegion {
288-
span,
291+
cov_span,
289292
true_counter: ffi::Counter::from_term(true_term),
290293
false_counter: ffi::Counter::from_term(false_term),
291294
});
292295
}
293296
MappingKind::MCDCBranch { true_term, false_term, mcdc_params } => {
294297
mcdc_branch_regions.push(ffi::MCDCBranchRegion {
295-
span,
298+
cov_span,
296299
true_counter: ffi::Counter::from_term(true_term),
297300
false_counter: ffi::Counter::from_term(false_term),
298301
mcdc_branch_params: ffi::mcdc::BranchParameters::from(mcdc_params),
299302
});
300303
}
301304
MappingKind::MCDCDecision(mcdc_decision_params) => {
302305
mcdc_decision_regions.push(ffi::MCDCDecisionRegion {
303-
span,
306+
cov_span,
304307
mcdc_decision_params: ffi::mcdc::DecisionParameters::from(mcdc_decision_params),
305308
});
306309
}

0 commit comments

Comments
 (0)