Skip to content

Commit

Permalink
Deduplicate compiler diagnostics.
Browse files Browse the repository at this point in the history
  • Loading branch information
ehuss committed Jul 9, 2021
1 parent cc80b40 commit 493e8b7
Show file tree
Hide file tree
Showing 8 changed files with 281 additions and 77 deletions.
2 changes: 1 addition & 1 deletion src/cargo/core/compiler/custom_build.rs
Original file line number Diff line number Diff line change
Expand Up @@ -129,7 +129,7 @@ pub fn prepare(cx: &mut Context<'_, '_>, unit: &Unit) -> CargoResult<Job> {
}

fn emit_build_output(
state: &JobState<'_>,
state: &JobState<'_, '_>,
output: &BuildOutput,
out_dir: &Path,
package_id: PackageId,
Expand Down
8 changes: 4 additions & 4 deletions src/cargo/core/compiler/job.rs
Original file line number Diff line number Diff line change
Expand Up @@ -12,13 +12,13 @@ pub struct Job {
/// Each proc should send its description before starting.
/// It should send either once or close immediately.
pub struct Work {
inner: Box<dyn FnOnce(&JobState<'_>) -> CargoResult<()> + Send>,
inner: Box<dyn FnOnce(&JobState<'_, '_>) -> CargoResult<()> + Send>,
}

impl Work {
pub fn new<F>(f: F) -> Work
where
F: FnOnce(&JobState<'_>) -> CargoResult<()> + Send + 'static,
F: FnOnce(&JobState<'_, '_>) -> CargoResult<()> + Send + 'static,
{
Work { inner: Box::new(f) }
}
Expand All @@ -27,7 +27,7 @@ impl Work {
Work::new(|_| Ok(()))
}

pub fn call(self, tx: &JobState<'_>) -> CargoResult<()> {
pub fn call(self, tx: &JobState<'_, '_>) -> CargoResult<()> {
(self.inner)(tx)
}

Expand Down Expand Up @@ -58,7 +58,7 @@ impl Job {

/// Consumes this job by running it, returning the result of the
/// computation.
pub fn run(self, state: &JobState<'_>) -> CargoResult<()> {
pub fn run(self, state: &JobState<'_, '_>) -> CargoResult<()> {
self.work.call(state)
}

Expand Down
137 changes: 127 additions & 10 deletions src/cargo/core/compiler/job_queue.rs
Original file line number Diff line number Diff line change
Expand Up @@ -49,8 +49,9 @@
//! The current scheduling algorithm is relatively primitive and could likely be
//! improved.
use std::cell::Cell;
use std::cell::{Cell, RefCell};
use std::collections::{BTreeMap, BTreeSet, HashMap, HashSet};
use std::fmt::Write as _;
use std::io;
use std::marker;
use std::sync::Arc;
Expand Down Expand Up @@ -125,6 +126,14 @@ struct DrainState<'cfg> {

queue: DependencyQueue<Unit, Artifact, Job>,
messages: Arc<Queue<Message>>,
/// Diagnostic deduplication support.
diag_dedupe: DiagDedupe<'cfg>,
/// Count of warnings, used to print a summary after the job succeeds.
///
/// First value is the total number of warnings, and the second value is
/// the number that were suppressed because they were duplicates of a
/// previous warning.
warning_count: HashMap<JobId, (usize, usize)>,
active: HashMap<JobId, Unit>,
compiled: HashSet<PackageId>,
documented: HashSet<PackageId>,
Expand Down Expand Up @@ -174,7 +183,7 @@ impl std::fmt::Display for JobId {
///
/// The job may execute on either a dedicated thread or the main thread. If the job executes on the
/// main thread, the `output` field must be set to prevent a deadlock.
pub struct JobState<'a> {
pub struct JobState<'a, 'cfg> {
/// Channel back to the main thread to coordinate messages and such.
///
/// When the `output` field is `Some`, care must be taken to avoid calling `push_bounded` on
Expand All @@ -191,7 +200,7 @@ pub struct JobState<'a> {
/// interleaved. In the future, it may be wrapped in a `Mutex` instead. In this case
/// interleaving is still prevented as the lock would be held for the whole printing of an
/// output message.
output: Option<&'a Config>,
output: Option<&'a DiagDedupe<'cfg>>,

/// The job id that this state is associated with, used when sending
/// messages back to the main thread.
Expand All @@ -207,6 +216,36 @@ pub struct JobState<'a> {
_marker: marker::PhantomData<&'a ()>,
}

/// Handler for deduplicating diagnostics.
struct DiagDedupe<'cfg> {
seen: RefCell<HashSet<u64>>,
config: &'cfg Config,
}

impl<'cfg> DiagDedupe<'cfg> {
fn new(config: &'cfg Config) -> Self {
DiagDedupe {
seen: RefCell::new(HashSet::new()),
config,
}
}

/// Emits a diagnostic message.
///
/// Returns `true` if the message was emitted, or `false` if it was
/// suppressed for being a duplicate.
fn emit_diag(&self, diag: &str) -> CargoResult<bool> {
let h = util::hash_u64(diag);
if !self.seen.borrow_mut().insert(h) {
return Ok(false);
}
let mut shell = self.config.shell();
shell.print_ansi_stderr(diag.as_bytes())?;
shell.err().write_all(b"\n")?;
Ok(true)
}
}

/// Possible artifacts that can be produced by compilations, used as edge values
/// in the dependency graph.
///
Expand All @@ -232,6 +271,15 @@ enum Message {
BuildPlanMsg(String, ProcessBuilder, Arc<Vec<OutputFile>>),
Stdout(String),
Stderr(String),
Diagnostic {
id: JobId,
level: String,
diag: String,
},
WarningCount {
id: JobId,
emitted: bool,
},
FixDiagnostic(diagnostic_server::Message),
Token(io::Result<Acquired>),
Finish(JobId, Artifact, CargoResult<()>),
Expand All @@ -244,7 +292,7 @@ enum Message {
ReleaseToken(JobId),
}

impl<'a> JobState<'a> {
impl<'a, 'cfg> JobState<'a, 'cfg> {
pub fn running(&self, cmd: &ProcessBuilder) {
self.messages.push(Message::Run(self.id, cmd.to_string()));
}
Expand All @@ -260,17 +308,17 @@ impl<'a> JobState<'a> {
}

pub fn stdout(&self, stdout: String) -> CargoResult<()> {
if let Some(config) = self.output {
writeln!(config.shell().out(), "{}", stdout)?;
if let Some(dedupe) = self.output {
writeln!(dedupe.config.shell().out(), "{}", stdout)?;
} else {
self.messages.push_bounded(Message::Stdout(stdout));
}
Ok(())
}

pub fn stderr(&self, stderr: String) -> CargoResult<()> {
if let Some(config) = self.output {
let mut shell = config.shell();
if let Some(dedupe) = self.output {
let mut shell = dedupe.config.shell();
shell.print_ansi_stderr(stderr.as_bytes())?;
shell.err().write_all(b"\n")?;
} else {
Expand All @@ -279,6 +327,25 @@ impl<'a> JobState<'a> {
Ok(())
}

pub fn emit_diag(&self, level: String, diag: String) -> CargoResult<()> {
if let Some(dedupe) = self.output {
let emitted = dedupe.emit_diag(&diag)?;
if level == "warning" {
self.messages.push(Message::WarningCount {
id: self.id,
emitted,
});
}
} else {
self.messages.push_bounded(Message::Diagnostic {
id: self.id,
level,
diag,
});
}
Ok(())
}

/// A method used to signal to the coordinator thread that the rmeta file
/// for an rlib has been produced. This is only called for some rmeta
/// builds when required, and can be called at any time before a job ends.
Expand Down Expand Up @@ -410,6 +477,8 @@ impl<'cfg> JobQueue<'cfg> {
// typical messages. If you change this, please update the test
// caching_large_output, too.
messages: Arc::new(Queue::new(100)),
diag_dedupe: DiagDedupe::new(cx.bcx.config),
warning_count: HashMap::new(),
active: HashMap::new(),
compiled: HashSet::new(),
documented: HashSet::new(),
Expand Down Expand Up @@ -563,6 +632,15 @@ impl<'cfg> DrainState<'cfg> {
shell.print_ansi_stderr(err.as_bytes())?;
shell.err().write_all(b"\n")?;
}
Message::Diagnostic { id, level, diag } => {
let emitted = self.diag_dedupe.emit_diag(&diag)?;
if level == "warning" {
self.bump_warning_count(id, emitted);
}
}
Message::WarningCount { id, emitted } => {
self.bump_warning_count(id, emitted);
}
Message::FixDiagnostic(msg) => {
self.print.print(&msg)?;
}
Expand All @@ -586,6 +664,7 @@ impl<'cfg> DrainState<'cfg> {
self.tokens.extend(rustc_tokens);
}
self.to_send_clients.remove(&id);
self.report_warning_count(cx.bcx.config, id);
self.active.remove(&id).unwrap()
}
// ... otherwise if it hasn't finished we leave it
Expand Down Expand Up @@ -936,7 +1015,7 @@ impl<'cfg> DrainState<'cfg> {
let fresh = job.freshness();
let rmeta_required = cx.rmeta_required(unit);

let doit = move |state: JobState<'_>| {
let doit = move |state: JobState<'_, '_>| {
let mut sender = FinishOnDrop {
messages: &state.messages,
id,
Expand Down Expand Up @@ -992,7 +1071,7 @@ impl<'cfg> DrainState<'cfg> {
doit(JobState {
id,
messages,
output: Some(cx.bcx.config),
output: Some(&self.diag_dedupe),
rmeta_required: Cell::new(rmeta_required),
_marker: marker::PhantomData,
});
Expand Down Expand Up @@ -1044,6 +1123,44 @@ impl<'cfg> DrainState<'cfg> {
Ok(())
}

fn bump_warning_count(&mut self, id: JobId, emitted: bool) {
let cnts = self.warning_count.entry(id).or_default();
cnts.0 += 1;
if !emitted {
cnts.1 += 1;
}
}

/// Displays a final report of the warnings emitted by a particular job.
fn report_warning_count(&mut self, config: &Config, id: JobId) {
let count = match self.warning_count.remove(&id) {
Some(count) => count,
None => return,
};
let unit = &self.active[&id];
let mut message = format!("`{}` ({}", unit.pkg.name(), unit.target.description_named());
if unit.mode.is_rustc_test() && !(unit.target.is_test() || unit.target.is_bench()) {
message.push_str(" test");
} else if unit.mode.is_doc_test() {
message.push_str(" doctest");
} else if unit.mode.is_doc() {
message.push_str(" doc");
}
message.push_str(") generated ");
match count.0 {
1 => message.push_str("1 warning"),
n => drop(write!(message, "{} warnings", n)),
};
match count.1 {
0 => {}
1 => message.push_str(" (1 duplicate)"),
n => drop(write!(message, " ({} duplicates)", n)),
}
// Errors are ignored here because it is tricky to handle them
// correctly, and they aren't important.
drop(config.shell().warn(message));
}

fn finish(
&mut self,
id: JobId,
Expand Down
27 changes: 16 additions & 11 deletions src/cargo/core/compiler/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -347,6 +347,8 @@ fn rustc(cx: &mut Context<'_, '_>, unit: &Unit, exec: &Arc<dyn Executor>) -> Car
};
format!("could not compile `{}`{}{}", name, errors, warnings)
})?;
// Exec should never return with success *and* generate an error.
debug_assert_eq!(output_options.errors_seen, 0);
}

if rustc_dep_info_loc.exists() {
Expand Down Expand Up @@ -1199,7 +1201,7 @@ impl OutputOptions {
}

fn on_stdout_line(
state: &JobState<'_>,
state: &JobState<'_, '_>,
line: &str,
_package_id: PackageId,
_target: &Target,
Expand All @@ -1209,7 +1211,7 @@ fn on_stdout_line(
}

fn on_stderr_line(
state: &JobState<'_>,
state: &JobState<'_, '_>,
line: &str,
package_id: PackageId,
manifest_path: &std::path::Path,
Expand All @@ -1231,7 +1233,7 @@ fn on_stderr_line(

/// Returns true if the line should be cached.
fn on_stderr_line_inner(
state: &JobState<'_>,
state: &JobState<'_, '_>,
line: &str,
package_id: PackageId,
manifest_path: &std::path::Path,
Expand Down Expand Up @@ -1296,27 +1298,30 @@ fn on_stderr_line_inner(
message: String,
level: String,
}
if let Ok(mut error) = serde_json::from_str::<CompilerMessage>(compiler_message.get()) {
if error.level == "error" && error.message.starts_with("aborting due to") {
if let Ok(mut msg) = serde_json::from_str::<CompilerMessage>(compiler_message.get()) {
if msg.message.starts_with("aborting due to")
|| msg.message.ends_with("warning emitted")
|| msg.message.ends_with("warnings emitted")
{
// Skip this line; we'll print our own summary at the end.
return Ok(true);
}
// state.stderr will add a newline
if error.rendered.ends_with('\n') {
error.rendered.pop();
if msg.rendered.ends_with('\n') {
msg.rendered.pop();
}
let rendered = if options.color {
error.rendered
msg.rendered
} else {
// Strip only fails if the the Writer fails, which is Cursor
// on a Vec, which should never fail.
strip_ansi_escapes::strip(&error.rendered)
strip_ansi_escapes::strip(&msg.rendered)
.map(|v| String::from_utf8(v).expect("utf8"))
.expect("strip should never fail")
};
if options.show_warnings {
count_diagnostic(&error.level, options);
state.stderr(rendered)?;
count_diagnostic(&msg.level, options);
state.emit_diag(msg.level, rendered)?;
}
return Ok(true);
}
Expand Down
2 changes: 1 addition & 1 deletion src/cargo/core/manifest.rs
Original file line number Diff line number Diff line change
Expand Up @@ -925,7 +925,7 @@ impl Target {
TargetKind::ExampleLib(..) | TargetKind::ExampleBin => {
format!("example \"{}\"", self.name())
}
TargetKind::CustomBuild => "custom-build".to_string(),
TargetKind::CustomBuild => "build script".to_string(),
}
}
}
Expand Down
Loading

0 comments on commit 493e8b7

Please sign in to comment.