diff options
| author | bors <bors@rust-lang.org> | 2021-06-22 14:53:58 +0000 |
|---|---|---|
| committer | bors <bors@rust-lang.org> | 2021-06-22 14:53:58 +0000 |
| commit | 80926fc409d671e7da13f08c90642b1e71f800d9 (patch) | |
| tree | 726ca593e13f10dfc8c0ec3eb38aa40c2e27403a /compiler/rustc_middle/src | |
| parent | 3487be11d5f3c9afc4d8e44438cdd2af1e98c859 (diff) | |
| parent | c3c4ab5ed204b09a8446f9abbdb4d49b278756be (diff) | |
| download | rust-80926fc409d671e7da13f08c90642b1e71f800d9.tar.gz rust-80926fc409d671e7da13f08c90642b1e71f800d9.zip | |
Auto merge of #86368 - michaelwoerister:lexing-ice, r=davidtwco
Disambiguate between SourceFiles from different crates even if they have the same path This PR fixes an ICE that can occur when the compiler encounters a source file that is part of both the local crate and an upstream crate: 1. While importing source files from an upstream crate the compiler creates a `SourceFile` entry for `foo.rs` in the `SourceMap`. Since this is an imported source file its `src` field is `None`. 2. At a later point the parser encounters `foo.rs` again. It tells the `SourceMap` to load the file but because we already have an entry for `foo.rs` the `SourceMap` will return the existing version with `src == None`. 3. The parser proceeds under the assumption that `src.is_some()` and panics when actually trying to use the file's contents. This PR fixes the issue by adding the source file's associated `CrateNum` to the `SourceMap`'s interning key. As a consequence the two instances of the file will each have a separate entry in the `SourceMap`. They just happen to share the same file path. This approach seemed less problematic to me than trying to mutate the `SourceFile` after it had already been created. Another, more involved, approach might be to merge the `src` and the `external_src` field. Fixes #85955
Diffstat (limited to 'compiler/rustc_middle/src')
| -rw-r--r-- | compiler/rustc_middle/src/ty/query/on_disk_cache.rs | 38 |
1 files changed, 33 insertions, 5 deletions
diff --git a/compiler/rustc_middle/src/ty/query/on_disk_cache.rs b/compiler/rustc_middle/src/ty/query/on_disk_cache.rs index ebaef347f42..6df8e64fada 100644 --- a/compiler/rustc_middle/src/ty/query/on_disk_cache.rs +++ b/compiler/rustc_middle/src/ty/query/on_disk_cache.rs @@ -54,7 +54,7 @@ pub struct OnDiskCache<'sess> { cnum_map: OnceCell<UnhashMap<StableCrateId, CrateNum>>, source_map: &'sess SourceMap, - file_index_to_stable_id: FxHashMap<SourceFileIndex, StableSourceFileId>, + file_index_to_stable_id: FxHashMap<SourceFileIndex, EncodedSourceFileId>, // Caches that are populated lazily during decoding. file_index_to_file: Lock<FxHashMap<SourceFileIndex, Lrc<SourceFile>>>, @@ -111,7 +111,7 @@ pub struct OnDiskCache<'sess> { // This type is used only for serialization and deserialization. #[derive(Encodable, Decodable)] struct Footer { - file_index_to_stable_id: FxHashMap<SourceFileIndex, StableSourceFileId>, + file_index_to_stable_id: FxHashMap<SourceFileIndex, EncodedSourceFileId>, query_result_index: EncodedQueryResultIndex, diagnostics_index: EncodedQueryResultIndex, // The location of all allocations. @@ -157,6 +157,32 @@ crate struct RawDefId { pub index: u32, } +/// An `EncodedSourceFileId` is the same as a `StableSourceFileId` except that +/// the source crate is represented as a [StableCrateId] instead of as a +/// `CrateNum`. This way `EncodedSourceFileId` can be encoded and decoded +/// without any additional context, i.e. with a simple `opaque::Decoder` (which +/// is the only thing available when decoding the cache's [Footer]. +#[derive(Encodable, Decodable, Clone, Debug)] +struct EncodedSourceFileId { + file_name_hash: u64, + stable_crate_id: StableCrateId, +} + +impl EncodedSourceFileId { + fn translate(&self, cnum_map: &UnhashMap<StableCrateId, CrateNum>) -> StableSourceFileId { + let cnum = cnum_map[&self.stable_crate_id]; + StableSourceFileId { file_name_hash: self.file_name_hash, cnum } + } + + fn new(tcx: TyCtxt<'_>, file: &SourceFile) -> EncodedSourceFileId { + let source_file_id = StableSourceFileId::new(file); + EncodedSourceFileId { + file_name_hash: source_file_id.file_name_hash, + stable_crate_id: tcx.stable_crate_id(source_file_id.cnum), + } + } +} + impl<'sess> OnDiskCache<'sess> { /// Creates a new `OnDiskCache` instance from the serialized data in `data`. pub fn new(sess: &'sess Session, data: Vec<u8>, start_pos: usize) -> Self { @@ -238,7 +264,8 @@ impl<'sess> OnDiskCache<'sess> { let index = SourceFileIndex(index as u32); let file_ptr: *const SourceFile = &**file as *const _; file_to_file_index.insert(file_ptr, index); - file_index_to_stable_id.insert(index, StableSourceFileId::new(&file)); + let source_file_id = EncodedSourceFileId::new(tcx, &file); + file_index_to_stable_id.insert(index, source_file_id); } (file_to_file_index, file_index_to_stable_id) @@ -605,7 +632,7 @@ pub struct CacheDecoder<'a, 'tcx> { source_map: &'a SourceMap, cnum_map: &'a UnhashMap<StableCrateId, CrateNum>, file_index_to_file: &'a Lock<FxHashMap<SourceFileIndex, Lrc<SourceFile>>>, - file_index_to_stable_id: &'a FxHashMap<SourceFileIndex, StableSourceFileId>, + file_index_to_stable_id: &'a FxHashMap<SourceFileIndex, EncodedSourceFileId>, alloc_decoding_session: AllocDecodingSession<'a>, syntax_contexts: &'a FxHashMap<u32, AbsoluteBytePos>, expn_data: &'a FxHashMap<u32, AbsoluteBytePos>, @@ -618,6 +645,7 @@ impl<'a, 'tcx> CacheDecoder<'a, 'tcx> { ref file_index_to_file, ref file_index_to_stable_id, ref source_map, + ref cnum_map, .. } = *self; @@ -625,7 +653,7 @@ impl<'a, 'tcx> CacheDecoder<'a, 'tcx> { .borrow_mut() .entry(index) .or_insert_with(|| { - let stable_id = file_index_to_stable_id[&index]; + let stable_id = file_index_to_stable_id[&index].translate(cnum_map); source_map .source_file_by_stable_id(stable_id) .expect("failed to lookup `SourceFile` in new context") |
