Skip to content

Commit 3243ea0

Browse files
committedJun 9, 2024
feat: Compute native diagnostics in parallel
1 parent 994a9b8 commit 3243ea0

File tree

3 files changed

+73
-26
lines changed

3 files changed

+73
-26
lines changed
 

‎src/tools/rust-analyzer/crates/rust-analyzer/src/diagnostics.rs

+36-12
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,7 @@ use ide_db::FxHashMap;
88
use itertools::Itertools;
99
use nohash_hasher::{IntMap, IntSet};
1010
use rustc_hash::FxHashSet;
11+
use stdx::iter_eq_by;
1112
use triomphe::Arc;
1213

1314
use crate::{global_state::GlobalStateSnapshot, lsp, lsp_ext};
@@ -22,14 +23,21 @@ pub struct DiagnosticsMapConfig {
2223
pub check_ignore: FxHashSet<String>,
2324
}
2425

26+
pub(crate) type DiagnosticsGeneration = usize;
27+
2528
#[derive(Debug, Default, Clone)]
2629
pub(crate) struct DiagnosticCollection {
2730
// FIXME: should be IntMap<FileId, Vec<ra_id::Diagnostic>>
28-
pub(crate) native: IntMap<FileId, Vec<lsp_types::Diagnostic>>,
31+
pub(crate) native: IntMap<FileId, (DiagnosticsGeneration, Vec<lsp_types::Diagnostic>)>,
2932
// FIXME: should be Vec<flycheck::Diagnostic>
3033
pub(crate) check: IntMap<usize, IntMap<FileId, Vec<lsp_types::Diagnostic>>>,
3134
pub(crate) check_fixes: CheckFixes,
3235
changes: IntSet<FileId>,
36+
/// Counter for supplying a new generation number for diagnostics.
37+
/// This is used to keep track of when to clear the diagnostics for a given file as we compute
38+
/// diagnostics on multiple worker threads simultaneously which may result in multiple diagnostics
39+
/// updates for the same file in a single generation update (due to macros affecting multiple files).
40+
generation: DiagnosticsGeneration,
3341
}
3442

3543
#[derive(Debug, Clone)]
@@ -82,29 +90,39 @@ impl DiagnosticCollection {
8290

8391
pub(crate) fn set_native_diagnostics(
8492
&mut self,
93+
generation: DiagnosticsGeneration,
8594
file_id: FileId,
86-
diagnostics: Vec<lsp_types::Diagnostic>,
95+
mut diagnostics: Vec<lsp_types::Diagnostic>,
8796
) {
88-
if let Some(existing_diagnostics) = self.native.get(&file_id) {
97+
diagnostics.sort_by_key(|it| (it.range.start, it.range.end));
98+
if let Some((old_gen, existing_diagnostics)) = self.native.get_mut(&file_id) {
8999
if existing_diagnostics.len() == diagnostics.len()
90-
&& diagnostics
91-
.iter()
92-
.zip(existing_diagnostics)
93-
.all(|(new, existing)| are_diagnostics_equal(new, existing))
100+
&& iter_eq_by(&diagnostics, &*existing_diagnostics, |new, existing| {
101+
are_diagnostics_equal(new, existing)
102+
})
94103
{
104+
// don't signal an update if the diagnostics are the same
95105
return;
96106
}
107+
if *old_gen < generation || generation == 0 {
108+
self.native.insert(file_id, (generation, diagnostics));
109+
} else {
110+
existing_diagnostics.extend(diagnostics);
111+
// FIXME: Doing the merge step of a merge sort here would be a bit more performant
112+
// but eh
113+
existing_diagnostics.sort_by_key(|it| (it.range.start, it.range.end))
114+
}
115+
} else {
116+
self.native.insert(file_id, (generation, diagnostics));
97117
}
98-
99-
self.native.insert(file_id, diagnostics);
100118
self.changes.insert(file_id);
101119
}
102120

103121
pub(crate) fn diagnostics_for(
104122
&self,
105123
file_id: FileId,
106124
) -> impl Iterator<Item = &lsp_types::Diagnostic> {
107-
let native = self.native.get(&file_id).into_iter().flatten();
125+
let native = self.native.get(&file_id).into_iter().map(|(_, d)| d).flatten();
108126
let check = self.check.values().filter_map(move |it| it.get(&file_id)).flatten();
109127
native.chain(check)
110128
}
@@ -115,6 +133,11 @@ impl DiagnosticCollection {
115133
}
116134
Some(mem::take(&mut self.changes))
117135
}
136+
137+
pub(crate) fn next_generation(&mut self) -> usize {
138+
self.generation += 1;
139+
self.generation
140+
}
118141
}
119142

120143
fn are_diagnostics_equal(left: &lsp_types::Diagnostic, right: &lsp_types::Diagnostic) -> bool {
@@ -126,7 +149,8 @@ fn are_diagnostics_equal(left: &lsp_types::Diagnostic, right: &lsp_types::Diagno
126149

127150
pub(crate) fn fetch_native_diagnostics(
128151
snapshot: GlobalStateSnapshot,
129-
subscriptions: Vec<FileId>,
152+
subscriptions: std::sync::Arc<[FileId]>,
153+
slice: std::ops::Range<usize>,
130154
) -> Vec<(FileId, Vec<lsp_types::Diagnostic>)> {
131155
let _p = tracing::info_span!("fetch_native_diagnostics").entered();
132156
let _ctx = stdx::panic_context::enter("fetch_native_diagnostics".to_owned());
@@ -149,7 +173,7 @@ pub(crate) fn fetch_native_diagnostics(
149173
// the diagnostics produced may point to different files not requested by the concrete request,
150174
// put those into here and filter later
151175
let mut odd_ones = Vec::new();
152-
let mut diagnostics = subscriptions
176+
let mut diagnostics = subscriptions[slice]
153177
.iter()
154178
.copied()
155179
.filter_map(|file_id| {

‎src/tools/rust-analyzer/crates/rust-analyzer/src/global_state.rs

+3-1
Original file line numberDiff line numberDiff line change
@@ -163,7 +163,9 @@ pub(crate) struct GlobalStateSnapshot {
163163
pub(crate) semantic_tokens_cache: Arc<Mutex<FxHashMap<Url, SemanticTokens>>>,
164164
vfs: Arc<RwLock<(vfs::Vfs, IntMap<FileId, LineEndings>)>>,
165165
pub(crate) workspaces: Arc<Vec<ProjectWorkspace>>,
166-
// used to signal semantic highlighting to fall back to syntax based highlighting until proc-macros have been loaded
166+
// used to signal semantic highlighting to fall back to syntax based highlighting until
167+
// proc-macros have been loaded
168+
// FIXME: Can we derive this from somewhere else?
167169
pub(crate) proc_macros_loaded: bool,
168170
pub(crate) flycheck: Arc<[FlycheckHandle]>,
169171
}

‎src/tools/rust-analyzer/crates/rust-analyzer/src/main_loop.rs

+34-13
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@ use vfs::FileId;
1717

1818
use crate::{
1919
config::Config,
20-
diagnostics::fetch_native_diagnostics,
20+
diagnostics::{fetch_native_diagnostics, DiagnosticsGeneration},
2121
dispatch::{NotificationDispatcher, RequestDispatcher},
2222
global_state::{file_id_to_url, url_to_file_id, GlobalState},
2323
hack_recover_crate_name,
@@ -87,7 +87,7 @@ pub(crate) enum Task {
8787
Response(lsp_server::Response),
8888
ClientNotification(lsp_ext::UnindexedProjectParams),
8989
Retry(lsp_server::Request),
90-
Diagnostics(Vec<(FileId, Vec<lsp_types::Diagnostic>)>),
90+
Diagnostics(DiagnosticsGeneration, Vec<(FileId, Vec<lsp_types::Diagnostic>)>),
9191
DiscoverTest(lsp_ext::DiscoverTestResults),
9292
PrimeCaches(PrimeCachesProgress),
9393
FetchWorkspace(ProjectWorkspaceProgress),
@@ -479,7 +479,7 @@ impl GlobalState {
479479

480480
fn update_diagnostics(&mut self) {
481481
let db = self.analysis_host.raw_database();
482-
// spawn a task per subscription?
482+
let generation = self.diagnostics.next_generation();
483483
let subscriptions = {
484484
let vfs = &self.vfs.read().0;
485485
self.mem_docs
@@ -494,16 +494,37 @@ impl GlobalState {
494494
// forever if we emitted them here.
495495
!db.source_root(source_root).is_library
496496
})
497-
.collect::<Vec<_>>()
497+
.collect::<std::sync::Arc<_>>()
498498
};
499499
tracing::trace!("updating notifications for {:?}", subscriptions);
500-
501-
// Diagnostics are triggered by the user typing
502-
// so we run them on a latency sensitive thread.
503-
self.task_pool.handle.spawn(ThreadIntent::LatencySensitive, {
504-
let snapshot = self.snapshot();
505-
move || Task::Diagnostics(fetch_native_diagnostics(snapshot, subscriptions))
506-
});
500+
// Split up the work on multiple threads, but we don't wanna fill the entire task pool with
501+
// diagnostic tasks, so we limit the number of tasks to a quarter of the total thread pool.
502+
let max_tasks = self.config.main_loop_num_threads() / 4;
503+
let chunk_length = subscriptions.len() / max_tasks;
504+
let remainder = subscriptions.len() % max_tasks;
505+
506+
let mut start = 0;
507+
for task_idx in 0..max_tasks {
508+
let extra = if task_idx < remainder { 1 } else { 0 };
509+
let end = start + chunk_length + extra;
510+
let slice = start..end;
511+
if slice.is_empty() {
512+
break;
513+
}
514+
// Diagnostics are triggered by the user typing
515+
// so we run them on a latency sensitive thread.
516+
self.task_pool.handle.spawn(ThreadIntent::LatencySensitive, {
517+
let snapshot = self.snapshot();
518+
let subscriptions = subscriptions.clone();
519+
move || {
520+
Task::Diagnostics(
521+
generation,
522+
fetch_native_diagnostics(snapshot, subscriptions, slice),
523+
)
524+
}
525+
});
526+
start = end;
527+
}
507528
}
508529

509530
fn update_tests(&mut self) {
@@ -590,9 +611,9 @@ impl GlobalState {
590611
// Only retry requests that haven't been cancelled. Otherwise we do unnecessary work.
591612
Task::Retry(req) if !self.is_completed(&req) => self.on_request(req),
592613
Task::Retry(_) => (),
593-
Task::Diagnostics(diagnostics_per_file) => {
614+
Task::Diagnostics(generation, diagnostics_per_file) => {
594615
for (file_id, diagnostics) in diagnostics_per_file {
595-
self.diagnostics.set_native_diagnostics(file_id, diagnostics)
616+
self.diagnostics.set_native_diagnostics(generation, file_id, diagnostics)
596617
}
597618
}
598619
Task::PrimeCaches(progress) => match progress {

0 commit comments

Comments
 (0)