Skip to content

Commit 8e21bd0

Browse files
committed
Auto merge of #75416 - richkadel:llvm-coverage-map-gen-5.3, r=richkadel
LLVM IR coverage encoding aligns closer to Clang's I found some areas for improvement while attempting to debug the SegFault issue when running rust programs compiled using MSVC, with coverage instrumentation. I discovered that LLVM's coverage writer was generating incomplete function name variable names (that's not a typo: the name of the variable that holds a function name). The existing implementation used one-up numbers to distinguish variables, and correcting the names did not fix the MSVC coverage bug, but the fix in this PR makes the names and resulting LLVM IR easier to follow and more consistent with Clang's implementation. I also changed the way the `-Zinstrument-coverage` option is supported in symbol_export.rs. The original implementation was incorrect, and the corrected version matches the handling for `-Zprofile-generate`, as it turns out. (An argument could be made that maybe `-Zinstrument-coverage` should automatically enable `-Cprofile-generate`. In fact, if `-Cprofile-generate` is analogous to Clang's `-fprofile-generate`, as some documentation implies, Clang always requires this flag for its implementation of source-based code coverage. This would require a little more validation, and if implemented, would probably require updating some of the user-facing messages related to `-Cprofile-generate` to not be so specific to the PGO use case.) None of these changes fixed the MSVC coverage problems, but they should still be welcome improvements. Lastly, I added some additional FIXME comments in instrument_coverage.rs describing issues I found with the generated LLVM IR that would be resolved if the coverage instrumentation is injected with a `Statement` instead of as a new `BasicBlock`. I describe seven advantages of this change, but it requires some discussion before making a change like this. r? @tmandry
2 parents 55b9adf + ba18978 commit 8e21bd0

File tree

12 files changed

+161
-39
lines changed

12 files changed

+161
-39
lines changed

src/librustc_codegen_llvm/coverageinfo/mod.rs

+11-1
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,7 @@ use llvm::coverageinfo::CounterMappingRegion;
88
use log::debug;
99
use rustc_codegen_ssa::coverageinfo::map::{CounterExpression, ExprKind, FunctionCoverage, Region};
1010
use rustc_codegen_ssa::traits::{
11-
BaseTypeMethods, CoverageInfoBuilderMethods, CoverageInfoMethods, StaticMethods,
11+
BaseTypeMethods, CoverageInfoBuilderMethods, CoverageInfoMethods, MiscMethods, StaticMethods,
1212
};
1313
use rustc_data_structures::fx::FxHashMap;
1414
use rustc_llvm::RustString;
@@ -44,6 +44,16 @@ impl CoverageInfoMethods for CodegenCx<'ll, 'tcx> {
4444
}
4545

4646
impl CoverageInfoBuilderMethods<'tcx> for Builder<'a, 'll, 'tcx> {
47+
/// Calls llvm::createPGOFuncNameVar() with the given function instance's mangled function name.
48+
/// The LLVM API returns an llvm::GlobalVariable containing the function name, with the specific
49+
/// variable name and linkage required by LLVM InstrProf source-based coverage instrumentation.
50+
fn create_pgo_func_name_var(&self, instance: Instance<'tcx>) -> Self::Value {
51+
let llfn = self.cx.get_fn(instance);
52+
let mangled_fn_name = CString::new(self.tcx.symbol_name(instance).name)
53+
.expect("error converting function name to C string");
54+
unsafe { llvm::LLVMRustCoverageCreatePGOFuncNameVar(llfn, mangled_fn_name.as_ptr()) }
55+
}
56+
4757
fn add_counter_region(
4858
&mut self,
4959
instance: Instance<'tcx>,

src/librustc_codegen_llvm/intrinsic.rs

+7-7
Original file line numberDiff line numberDiff line change
@@ -215,19 +215,19 @@ impl IntrinsicCallMethods<'tcx> for Builder<'a, 'll, 'tcx> {
215215
self.call(llfn, &[], None)
216216
}
217217
sym::count_code_region => {
218-
let coverageinfo = tcx.coverageinfo(caller_instance.def_id());
219-
let mangled_fn = tcx.symbol_name(caller_instance);
220-
let (mangled_fn_name, _len_val) = self.const_str(Symbol::intern(mangled_fn.name));
221-
let num_counters = self.const_u32(coverageinfo.num_counters);
222218
use coverage::count_code_region_args::*;
219+
let coverageinfo = tcx.coverageinfo(caller_instance.def_id());
220+
221+
let fn_name = self.create_pgo_func_name_var(caller_instance);
223222
let hash = args[FUNCTION_SOURCE_HASH].immediate();
223+
let num_counters = self.const_u32(coverageinfo.num_counters);
224224
let index = args[COUNTER_ID].immediate();
225225
debug!(
226226
"translating Rust intrinsic `count_code_region()` to LLVM intrinsic: \
227-
instrprof.increment(fn_name={}, hash={:?}, num_counters={:?}, index={:?})",
228-
mangled_fn.name, hash, num_counters, index,
227+
instrprof.increment(fn_name={:?}, hash={:?}, num_counters={:?}, index={:?})",
228+
fn_name, hash, num_counters, index,
229229
);
230-
self.instrprof_increment(mangled_fn_name, hash, num_counters, index)
230+
self.instrprof_increment(fn_name, hash, num_counters, index)
231231
}
232232
sym::va_start => self.va_start(args[0].immediate()),
233233
sym::va_end => self.va_end(args[0].immediate()),

src/librustc_codegen_llvm/llvm/ffi.rs

+2
Original file line numberDiff line numberDiff line change
@@ -1786,6 +1786,8 @@ extern "C" {
17861786
BufferOut: &RustString,
17871787
);
17881788

1789+
pub fn LLVMRustCoverageCreatePGOFuncNameVar(F: &'a Value, FuncName: *const c_char)
1790+
-> &'a Value;
17891791
pub fn LLVMRustCoverageComputeHash(Name: *const c_char) -> u64;
17901792

17911793
#[allow(improper_ctypes)]

src/librustc_codegen_ssa/back/symbol_export.rs

+3-12
Original file line numberDiff line numberDiff line change
@@ -190,7 +190,9 @@ fn exported_symbols_provider_local(
190190
}
191191
}
192192

193-
if tcx.sess.opts.cg.profile_generate.enabled() {
193+
if tcx.sess.opts.debugging_opts.instrument_coverage
194+
|| tcx.sess.opts.cg.profile_generate.enabled()
195+
{
194196
// These are weak symbols that point to the profile version and the
195197
// profile name, which need to be treated as exported so LTO doesn't nix
196198
// them.
@@ -203,17 +205,6 @@ fn exported_symbols_provider_local(
203205
}));
204206
}
205207

206-
if tcx.sess.opts.debugging_opts.instrument_coverage {
207-
// Similar to PGO profiling, preserve symbols used by LLVM InstrProf coverage profiling.
208-
const COVERAGE_WEAK_SYMBOLS: [&str; 3] =
209-
["__llvm_profile_filename", "__llvm_coverage_mapping", "__llvm_covmap"];
210-
211-
symbols.extend(COVERAGE_WEAK_SYMBOLS.iter().map(|sym| {
212-
let exported_symbol = ExportedSymbol::NoDefId(SymbolName::new(tcx, sym));
213-
(exported_symbol, SymbolExportLevel::C)
214-
}));
215-
}
216-
217208
if tcx.sess.opts.debugging_opts.sanitizer.contains(SanitizerSet::MEMORY) {
218209
// Similar to profiling, preserve weak msan symbol during LTO.
219210
const MSAN_WEAK_SYMBOLS: [&str; 2] = ["__msan_track_origins", "__msan_keep_going"];

src/librustc_codegen_ssa/traits/coverageinfo.rs

+2
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,8 @@ pub trait CoverageInfoMethods: BackendTypes {
77
}
88

99
pub trait CoverageInfoBuilderMethods<'tcx>: BackendTypes {
10+
fn create_pgo_func_name_var(&self, instance: Instance<'tcx>) -> Self::Value;
11+
1012
fn add_counter_region(
1113
&mut self,
1214
instance: Instance<'tcx>,

src/librustc_mir/transform/instrument_coverage.rs

+15
Original file line numberDiff line numberDiff line change
@@ -295,6 +295,21 @@ impl<'a, 'tcx> Instrumentor<'a, 'tcx> {
295295

296296
let (file_name, start_line, start_col, end_line, end_col) = self.code_region(&span);
297297

298+
// FIXME(richkadel): Note that `const_str()` results in the creation of an `Allocation` to
299+
// hold one copy of each unique filename. It looks like that `Allocation` may translate into
300+
// the creation of an `@alloc` in LLVM IR that is never actually used by runtime code.
301+
//
302+
// Example LLVM IR:
303+
//
304+
// @alloc4 = private unnamed_addr constant <{ [43 x i8] }> \
305+
// <{ [43 x i8] c"C:\\msys64\\home\\richkadel\\rust\\rust_basic.rs" }>, align 1
306+
//
307+
// Can I flag the alloc as something not to be added to codegen? Or somehow remove it before
308+
// it gets added to the LLVM IR? Do we need some kind of reference counting to know it's
309+
// not used by any runtime code?
310+
//
311+
// This question is moot if I convert the Call Terminators to Statements, I believe:
312+
// https://rust-lang.zulipchat.com/#narrow/stream/233931-t-compiler.2Fmajor-changes/topic/Implement.20LLVM-compatible.20source-based.20cod.20compiler-team.23278/near/206731748
298313
args.push(self.const_str(&file_name, inject_at));
299314
args.push(self.const_u32(start_line, inject_at));
300315
args.push(self.const_u32(start_col, inject_at));

src/rustllvm/CoverageMappingWrapper.cpp

+5
Original file line numberDiff line numberDiff line change
@@ -38,6 +38,11 @@ extern "C" void LLVMRustCoverageWriteMappingToBuffer(
3838
CoverageMappingWriter.write(OS);
3939
}
4040

41+
extern "C" LLVMValueRef LLVMRustCoverageCreatePGOFuncNameVar(LLVMValueRef F, const char *FuncName) {
42+
StringRef FuncNameRef(FuncName);
43+
return wrap(createPGOFuncNameVar(*cast<Function>(unwrap(F)), FuncNameRef));
44+
}
45+
4146
extern "C" uint64_t LLVMRustCoverageComputeHash(const char *Name) {
4247
StringRef NameRef(Name);
4348
return IndexedInstrProf::ComputeHash(NameRef);

src/test/run-make-fulldeps/instrument-coverage/Makefile

+62-16
Original file line numberDiff line numberDiff line change
@@ -3,55 +3,101 @@
33

44
# FIXME(richkadel): Debug the following problem, and reenable on Windows (by
55
# removing the `# ignore-msvc` directive above). The current implementation
6-
# generates a segfault when running the instrumented `main` executable,
7-
# after the `main` program code executes, but before the process terminates.
8-
# This most likely points to a problem generating the LLVM "main.profraw"
6+
# generates a segfault when running the instrumented `testprog` executable,
7+
# after the `main()` function completes, but before the process terminates.
8+
# This most likely points to a problem generating the LLVM "testprog.profraw"
99
# file.
1010

1111
-include ../tools.mk
1212

13+
UNAME = $(shell uname)
14+
15+
ifeq ($(UNAME),Darwin)
16+
INSTR_PROF_DATA_SUFFIX=,regular,live_support
17+
DATA_SECTION_PREFIX=__DATA,
18+
LLVM_COV_SECTION_PREFIX=__LLVM_COV,
19+
else
20+
INSTR_PROF_DATA_SUFFIX=
21+
DATA_SECTION_PREFIX=
22+
LLVM_COV_SECTION_PREFIX=
23+
endif
24+
1325
# This test makes sure that LLVM coverage maps are generated in LLVM IR.
1426

1527
COMMON_FLAGS=-Zinstrument-coverage
1628

1729
all:
1830
# Compile the test program with instrumentation, and also generate LLVM IR
19-
$(RUSTC) $(COMMON_FLAGS) main.rs
31+
$(RUSTC) $(COMMON_FLAGS) testprog.rs \
32+
--emit=link,llvm-ir
33+
34+
# check the LLVM IR
35+
ifdef IS_WIN32
36+
cat "$(TMPDIR)"/testprog.ll | "$(LLVM_FILECHECK)" filecheck-patterns.txt \
37+
-check-prefixes=CHECK,WIN32 \
38+
-DPRIVATE_GLOBAL="internal global" \
39+
-DINSTR_PROF_DATA=".lprfd$$M" \
40+
-DINSTR_PROF_NAME=".lprfn$$M" \
41+
-DINSTR_PROF_CNTS=".lprfc$$M" \
42+
-DINSTR_PROF_VALS=".lprfv$$M" \
43+
-DINSTR_PROF_VNODES=".lprfnd$$M" \
44+
-DINSTR_PROF_COVMAP=".lcovmap$$M" \
45+
-DINSTR_PROF_ORDERFILE=".lorderfile$$M"
46+
else
47+
cat "$(TMPDIR)"/testprog.ll | "$(LLVM_FILECHECK)" filecheck-patterns.txt \
48+
-check-prefixes=CHECK \
49+
-DPRIVATE_GLOBAL="private global" \
50+
-DINSTR_PROF_DATA="$(DATA_SECTION_PREFIX)__llvm_prf_data$(INSTR_PROF_DATA_SUFFIX)" \
51+
-DINSTR_PROF_NAME="$(DATA_SECTION_PREFIX)__llvm_prf_names" \
52+
-DINSTR_PROF_CNTS="$(DATA_SECTION_PREFIX)__llvm_prf_cnts" \
53+
-DINSTR_PROF_VALS="$(DATA_SECTION_PREFIX)__llvm_prf_vals" \
54+
-DINSTR_PROF_VNODES="$(DATA_SECTION_PREFIX)__llvm_prf_vnds" \
55+
-DINSTR_PROF_COVMAP="$(LLVM_COV_SECTION_PREFIX)__llvm_covmap" \
56+
-DINSTR_PROF_ORDERFILE="$(DATA_SECTION_PREFIX)__llvm_orderfile"
57+
endif
2058

2159
# Run it in order to generate some profiling data,
2260
# with `LLVM_PROFILE_FILE=<profdata_file>` environment variable set to
2361
# output the coverage stats for this run.
24-
LLVM_PROFILE_FILE="$(TMPDIR)"/main.profraw \
25-
$(call RUN,main)
62+
LLVM_PROFILE_FILE="$(TMPDIR)"/testprog.profraw \
63+
$(call RUN,testprog)
2664

2765
# Postprocess the profiling data so it can be used by the llvm-cov tool
2866
"$(LLVM_BIN_DIR)"/llvm-profdata merge --sparse \
29-
"$(TMPDIR)"/main.profraw \
30-
-o "$(TMPDIR)"/main.profdata
67+
"$(TMPDIR)"/testprog.profraw \
68+
-o "$(TMPDIR)"/testprog.profdata
3169

3270
# Generate a coverage report using `llvm-cov show`. The output ordering
3371
# can be non-deterministic, so ignore the return status. If the test fails
3472
# when comparing the JSON `export`, the `show` output may be useful when
3573
# debugging.
3674
"$(LLVM_BIN_DIR)"/llvm-cov show \
37-
--Xdemangler="$(RUST_DEMANGLER)" \
38-
--show-line-counts-or-regions \
39-
--instr-profile="$(TMPDIR)"/main.profdata \
40-
$(call BIN,"$(TMPDIR)"/main) \
75+
--Xdemangler="$(RUST_DEMANGLER)" \
76+
--show-line-counts-or-regions \
77+
--instr-profile="$(TMPDIR)"/testprog.profdata \
78+
$(call BIN,"$(TMPDIR)"/testprog) \
4179
> "$(TMPDIR)"/actual_show_coverage.txt
4280

81+
ifdef RUSTC_BLESS_TEST
82+
cp "$(TMPDIR)"/actual_show_coverage.txt typical_show_coverage.txt
83+
else
4384
# Compare the show coverage output
4485
$(DIFF) typical_show_coverage.txt "$(TMPDIR)"/actual_show_coverage.txt || \
45-
>&2 echo 'diff failed for `llvm-cov show` (might not be an error)'
86+
>&2 echo 'diff failed for `llvm-cov show` (might not be an error)'
87+
endif
4688

4789
# Generate a coverage report in JSON, using `llvm-cov export`, and fail if
4890
# there are differences from the expected output.
4991
"$(LLVM_BIN_DIR)"/llvm-cov export \
50-
--summary-only \
51-
--instr-profile="$(TMPDIR)"/main.profdata \
52-
$(call BIN,"$(TMPDIR)"/main) \
92+
--summary-only \
93+
--instr-profile="$(TMPDIR)"/testprog.profdata \
94+
$(call BIN,"$(TMPDIR)"/testprog) \
5395
| "$(PYTHON)" prettify_json.py \
5496
> "$(TMPDIR)"/actual_export_coverage.json
5597

98+
ifdef RUSTC_BLESS_TEST
99+
cp "$(TMPDIR)"/actual_export_coverage.json expected_export_coverage.json
100+
else
56101
# Check that the exported JSON coverage data matches what we expect
57102
$(DIFF) expected_export_coverage.json "$(TMPDIR)"/actual_export_coverage.json
103+
endif

src/test/run-make-fulldeps/instrument-coverage/expected_export_coverage.json

+1-1
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,7 @@
33
{
44
"files": [
55
{
6-
"filename": "main.rs",
6+
"filename": "testprog.rs",
77
"summary": {
88
"functions": {
99
"count": 7,
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,51 @@
1+
# Check for metadata, variables, declarations, and function definitions injected
2+
# into LLVM IR when compiling with -Zinstrument-coverage.
3+
4+
WIN32: $__llvm_profile_runtime_user = comdat any
5+
6+
CHECK: @__llvm_coverage_mapping = internal constant
7+
CHECK-SAME: section "[[INSTR_PROF_COVMAP]]", align 8
8+
9+
WIN32: @__llvm_profile_runtime = external global i32
10+
11+
CHECK: @__profc__R{{[a-zA-Z0-9_]+}}testprog14will_be_called = [[PRIVATE_GLOBAL]]
12+
CHECK-SAME: section "[[INSTR_PROF_CNTS]]", align 8
13+
14+
CHECK: @__profd__R{{[a-zA-Z0-9_]+}}testprog14will_be_called = [[PRIVATE_GLOBAL]]
15+
CHECK-SAME: @__profc__R{{[a-zA-Z0-9_]+}}testprog14will_be_called,
16+
CHECK-SAME: ()* @_R{{[a-zA-Z0-9_]+}}testprog14will_be_called to i8*),
17+
CHECK-SAME: section "[[INSTR_PROF_DATA]]", align 8
18+
19+
CHECK: @__profc__R{{[a-zA-Z0-9_]+}}testprog4main = [[PRIVATE_GLOBAL]]
20+
CHECK-SAME: section "[[INSTR_PROF_CNTS]]", align 8
21+
22+
CHECK: @__profd__R{{[a-zA-Z0-9_]+}}testprog4main = [[PRIVATE_GLOBAL]]
23+
CHECK-SAME: @__profc__R{{[a-zA-Z0-9_]+}}testprog4main,
24+
CHECK-SAME: ()* @_R{{[a-zA-Z0-9_]+}}testprog4main to i8*),
25+
CHECK-SAME: section "[[INSTR_PROF_DATA]]", align 8
26+
27+
CHECK: @__llvm_prf_nm = private constant
28+
CHECK-SAME: section "[[INSTR_PROF_NAME]]", align 1
29+
30+
CHECK: @llvm.used = appending global
31+
CHECK-SAME: i8* bitcast ({ {{.*}} }* @__llvm_coverage_mapping to i8*)
32+
WIN32-SAME: i8* bitcast (i32 ()* @__llvm_profile_runtime_user to i8*)
33+
CHECK-SAME: i8* bitcast ({ {{.*}} }* @__profd__R{{[a-zA-Z0-9_]*}}testprog4main to i8*)
34+
CHECK-SAME: i8* getelementptr inbounds ({{.*}}* @__llvm_prf_nm, i32 0, i32 0)
35+
CHECK-SAME: section "llvm.metadata"
36+
37+
CHECK: define hidden { {{.*}} } @_R{{[a-zA-Z0-9_]+}}testprog14will_be_called() unnamed_addr #{{[0-9]+}} {
38+
CHECK-NEXT: start:
39+
CHECK-NOT: bb{{[0-9]+}}:
40+
CHECK: %pgocount = load i64, i64* getelementptr inbounds
41+
CHECK-SAME: * @__profc__R{{[a-zA-Z0-9_]+}}testprog14will_be_called,
42+
43+
CHECK: declare void @llvm.instrprof.increment(i8*, i64, i32, i32) #[[LLVM_INSTRPROF_INCREMENT_ATTR:[0-9]+]]
44+
45+
WIN32: define linkonce_odr hidden i32 @__llvm_profile_runtime_user() #[[LLVM_PROFILE_RUNTIME_USER_ATTR:[0-9]+]] comdat {
46+
WIN32-NEXT: %1 = load i32, i32* @__llvm_profile_runtime
47+
WIN32-NEXT: ret i32 %1
48+
WIN32-NEXT: }
49+
50+
CHECK: attributes #[[LLVM_INSTRPROF_INCREMENT_ATTR]] = { nounwind }
51+
WIN32: attributes #[[LLVM_PROFILE_RUNTIME_USER_ATTR]] = { noinline }

src/test/run-make-fulldeps/instrument-coverage/typical_show_coverage.txt

+2-2
Original file line numberDiff line numberDiff line change
@@ -25,14 +25,14 @@
2525
25| 2| }
2626
26| 2|}
2727
------------------
28-
| main[317d481089b8c8fe]::wrap_with::<main[317d481089b8c8fe]::main::{closure#0}, &str>:
28+
| testprog[317d481089b8c8fe]::wrap_with::<testprog[317d481089b8c8fe]::main::{closure#0}, &str>:
2929
| 22| 1|{
3030
| 23| 1| if should_wrap {
3131
| 24| 1| wrapper(&inner)
3232
| 25| 1| }
3333
| 26| 1|}
3434
------------------
35-
| main[317d481089b8c8fe]::wrap_with::<main[317d481089b8c8fe]::main::{closure#1}, &str>:
35+
| testprog[317d481089b8c8fe]::wrap_with::<testprog[317d481089b8c8fe]::main::{closure#1}, &str>:
3636
| 22| 1|{
3737
| 23| 1| if should_wrap {
3838
| 24| 1| wrapper(&inner)

0 commit comments

Comments
 (0)