@@ -4,6 +4,7 @@ use crate::coverageinfo::ffi::CounterMappingRegion;
4
4
use crate :: coverageinfo:: map_data:: { FunctionCoverage , FunctionCoverageCollector } ;
5
5
use crate :: llvm;
6
6
7
+ use itertools:: Itertools as _;
7
8
use rustc_codegen_ssa:: traits:: { BaseTypeMethods , ConstMethods } ;
8
9
use rustc_data_structures:: fx:: FxIndexSet ;
9
10
use rustc_hir:: def:: DefKind ;
@@ -57,20 +58,26 @@ pub fn finalize(cx: &CodegenCx<'_, '_>) {
57
58
return ;
58
59
}
59
60
60
- let mut global_file_table = GlobalFileTable :: new ( tcx) ;
61
+ let function_coverage_entries = function_coverage_map
62
+ . into_iter ( )
63
+ . map ( |( instance, function_coverage) | ( instance, function_coverage. into_finished ( ) ) )
64
+ . collect :: < Vec < _ > > ( ) ;
65
+
66
+ let all_file_names =
67
+ function_coverage_entries. iter ( ) . flat_map ( |( _, fn_cov) | fn_cov. all_file_names ( ) ) ;
68
+ let global_file_table = GlobalFileTable :: new ( tcx, all_file_names) ;
61
69
62
70
// Encode coverage mappings and generate function records
63
71
let mut function_data = Vec :: new ( ) ;
64
- for ( instance, function_coverage) in function_coverage_map {
65
- let function_coverage = function_coverage. into_finished ( ) ;
72
+ for ( instance, function_coverage) in function_coverage_entries {
66
73
debug ! ( "Generate function coverage for {}, {:?}" , cx. codegen_unit. name( ) , instance) ;
67
74
68
75
let mangled_function_name = tcx. symbol_name ( instance) . name ;
69
76
let source_hash = function_coverage. source_hash ( ) ;
70
77
let is_used = function_coverage. is_used ( ) ;
71
78
72
79
let coverage_mapping_buffer =
73
- encode_mappings_for_function ( & mut global_file_table, & function_coverage) ;
80
+ encode_mappings_for_function ( & global_file_table, & function_coverage) ;
74
81
75
82
if coverage_mapping_buffer. is_empty ( ) {
76
83
if function_coverage. is_used ( ) {
@@ -88,11 +95,11 @@ pub fn finalize(cx: &CodegenCx<'_, '_>) {
88
95
}
89
96
90
97
// Encode all filenames referenced by counters/expressions in this module
91
- let filenames_buffer = global_file_table. into_filenames_buffer ( ) ;
98
+ let filenames_buffer = global_file_table. filenames_buffer ( ) ;
92
99
93
100
let filenames_size = filenames_buffer. len ( ) ;
94
- let filenames_val = cx. const_bytes ( & filenames_buffer) ;
95
- let filenames_ref = coverageinfo:: hash_bytes ( & filenames_buffer) ;
101
+ let filenames_val = cx. const_bytes ( filenames_buffer) ;
102
+ let filenames_ref = coverageinfo:: hash_bytes ( filenames_buffer) ;
96
103
97
104
// Generate the LLVM IR representation of the coverage map and store it in a well-known global
98
105
let cov_data_val = generate_coverage_map ( cx, version, filenames_size, filenames_val) ;
@@ -140,39 +147,62 @@ pub fn finalize(cx: &CodegenCx<'_, '_>) {
140
147
}
141
148
142
149
struct GlobalFileTable {
143
- global_file_table : FxIndexSet < Symbol > ,
150
+ /// This "raw" table doesn't include the working dir, so a filename's
151
+ /// global ID is its index in this set **plus one**.
152
+ raw_file_table : FxIndexSet < Symbol > ,
153
+ filenames_buffer : Vec < u8 > ,
144
154
}
145
155
146
156
impl GlobalFileTable {
147
- fn new ( tcx : TyCtxt < ' _ > ) -> Self {
148
- let mut global_file_table = FxIndexSet :: default ( ) ;
157
+ fn new ( tcx : TyCtxt < ' _ > , all_file_names : impl IntoIterator < Item = Symbol > ) -> Self {
149
158
// LLVM Coverage Mapping Format version 6 (zero-based encoded as 5)
150
159
// requires setting the first filename to the compilation directory.
151
160
// Since rustc generates coverage maps with relative paths, the
152
161
// compilation directory can be combined with the relative paths
153
162
// to get absolute paths, if needed.
154
- let working_dir = Symbol :: intern (
155
- & tcx. sess . opts . working_dir . remapped_path_if_available ( ) . to_string_lossy ( ) ,
156
- ) ;
157
- global_file_table . insert ( working_dir ) ;
158
- Self { global_file_table }
159
- }
160
-
161
- fn global_file_id_for_file_name ( & mut self , file_name : Symbol ) -> u32 {
162
- let ( global_file_id , _ ) = self . global_file_table . insert_full ( file_name ) ;
163
- global_file_id as u32
164
- }
163
+ let working_dir: & str =
164
+ & tcx. sess . opts . working_dir . remapped_path_if_available ( ) . to_string_lossy ( ) ;
165
+
166
+ // Prepare a map from filename symbols to their underlying strings, so
167
+ // that we can sort by the strings.
168
+ let mut raw_file_table = FxIndexMap :: < Symbol , & str > :: default ( ) ;
169
+ // Filenames usually come in contiguous runs, so dedup to save work.
170
+ let all_file_names = all_file_names . into_iter ( ) . dedup ( ) . collect :: < Vec < _ > > ( ) ;
171
+ for file_name in & all_file_names {
172
+ raw_file_table . entry ( * file_name ) . or_insert_with ( || file_name . as_str ( ) ) ;
173
+ }
165
174
166
- fn into_filenames_buffer ( self ) -> Vec < u8 > {
167
- // This method takes `self` so that the caller can't accidentally
168
- // modify the original file table after encoding it into a buffer.
175
+ // Sort the file table by its actual string values, not the arbitrary
176
+ // ordering of its symbols.
177
+ raw_file_table . sort_unstable_by ( |_ , a , _ , b| str :: cmp ( a , b ) ) ;
169
178
170
- llvm:: build_byte_buffer ( |buffer| {
179
+ // Build the LLVM filenames buffer ahead of time, so that we can discard
180
+ // the string references afterwards.
181
+ let filenames_buffer = llvm:: build_byte_buffer ( |buffer| {
171
182
coverageinfo:: write_filenames_section_to_buffer (
172
- self . global_file_table . iter ( ) . map ( Symbol :: as_str) ,
183
+ // Insert the working dir at index 0, before the other filenames.
184
+ std:: iter:: once ( working_dir) . chain ( raw_file_table. values ( ) . copied ( ) ) ,
173
185
buffer,
174
186
) ;
175
- } )
187
+ } ) ;
188
+
189
+ // Discard the string reference values, leaving only a set of symbols.
190
+ let raw_file_table = raw_file_table. into_keys ( ) . collect :: < FxIndexSet < _ > > ( ) ;
191
+
192
+ Self { raw_file_table, filenames_buffer }
193
+ }
194
+
195
+ fn global_file_id_for_file_name ( & self , file_name : Symbol ) -> u32 {
196
+ let raw_id = self . raw_file_table . get_index_of ( & file_name) . unwrap_or_else ( || {
197
+ bug ! ( "file name not found in prepared global file table: {file_name}" ) ;
198
+ } ) ;
199
+ // The raw file table doesn't include an entry for the working dir
200
+ // (which has ID 0), so add 1 to get the correct ID.
201
+ ( raw_id + 1 ) as u32
202
+ }
203
+
204
+ fn filenames_buffer ( & self ) -> & [ u8 ] {
205
+ & self . filenames_buffer
176
206
}
177
207
}
178
208
@@ -182,7 +212,7 @@ impl GlobalFileTable {
182
212
///
183
213
/// Newly-encountered filenames will be added to the global file table.
184
214
fn encode_mappings_for_function (
185
- global_file_table : & mut GlobalFileTable ,
215
+ global_file_table : & GlobalFileTable ,
186
216
function_coverage : & FunctionCoverage < ' _ > ,
187
217
) -> Vec < u8 > {
188
218
let mut counter_regions = function_coverage. counter_regions ( ) . collect :: < Vec < _ > > ( ) ;
@@ -203,7 +233,7 @@ fn encode_mappings_for_function(
203
233
for counter_regions_for_file in
204
234
counter_regions. group_by ( |( _, a) , ( _, b) | a. file_name == b. file_name )
205
235
{
206
- // Look up (or allocate) the global file ID for this filename.
236
+ // Look up the global file ID for this filename.
207
237
let file_name = counter_regions_for_file[ 0 ] . 1 . file_name ;
208
238
let global_file_id = global_file_table. global_file_id_for_file_name ( file_name) ;
209
239
0 commit comments