Merge pull request #1298 from Kobzol/profile-local-parallel

Kobzol · web-flow · commit 74d70ed1b050 · 2022-04-21T08:37:44.000+02:00
Add option to parallelize profiling across benchmarks
diff --git a/Cargo.lock b/Cargo.lock
diff --git a/collector/Cargo.toml b/collector/Cargo.toml
@@ -32,6 +32,7 @@ snap = "1"
 filetime = "0.2.14"
 walkdir = "2"
 flate2 = { version = "1.0.22", features = ["rust_backend"] }
+rayon = "1.5.2"
 
 [target.'cfg(windows)'.dependencies]
 miow = "0.3"
diff --git a/collector/README.md b/collector/README.md
@@ -425,6 +425,8 @@ The following options alter the behaviour of the `profile_local` subcommand.
   diff files will also be produced.
 - `--rustdoc <RUSTDOC>` as for `bench_local`.
 - `--scenarios <SCENARIOS>`: as for `bench_local`.
+- `--jobs <JOB-COUNT>`: execute `<JOB-COUNT>` benchmarks in parallel. This is only allowed for certain
+  profilers whose results are not affected by system noise (e.g. `callgrind` or `eprintln`).
 
 `RUST_LOG=debug` can be specified to enable verbose logging, which is useful
 for debugging `collector` itself.
diff --git a/collector/src/execute.rs b/collector/src/execute.rs
@@ -177,6 +177,25 @@ pub enum Profiler {
     LlvmIr,
 }
 
+impl Profiler {
+    /// Returns true if this profiler can be executed
+    /// in parallel without distorting the profile results.
+    pub fn supports_parallel_execution(&self) -> bool {
+        matches!(
+            self,
+            Profiler::Cachegrind
+                | Profiler::Callgrind
+                | Profiler::Dhat
+                | Profiler::DhatCopy
+                | Profiler::Eprintln
+                | Profiler::LlvmLines
+                | Profiler::LlvmIr
+                | Profiler::MonoItems
+                | Profiler::DepGraph
+        )
+    }
+}
+
 #[derive(Clone, Copy, Debug, PartialEq)]
 pub enum PerfTool {
     BenchTool(Bencher),
diff --git a/collector/src/main.rs b/collector/src/main.rs
@@ -5,6 +5,7 @@ use clap::Parser;
 use collector::category::Category;
 use database::{ArtifactId, Commit};
 use log::debug;
+use rayon::iter::{IndexedParallelIterator, IntoParallelRefIterator, ParallelIterator};
 use std::collections::HashMap;
 use std::fs;
 use std::fs::File;
@@ -134,6 +135,10 @@ impl BenchmarkErrors {
         self.0 += 1;
     }
 
+    fn add(&mut self, count: usize) {
+        self.0 += count;
+    }
+
     fn fail_if_nonzero(self) -> anyhow::Result<()> {
         if self.0 > 0 {
             anyhow::bail!("{} benchmarks failed", self.0)
@@ -684,18 +689,30 @@ fn profile(
     if let Profiler::SelfProfile = profiler {
         check_measureme_installed().unwrap();
     }
-    for (i, benchmark) in benchmarks.iter().enumerate() {
-        eprintln!("{}", n_normal_benchmarks_remaining(benchmarks.len() - i));
-        let mut processor = ProfileProcessor::new(profiler, out_dir, id);
-        let result = benchmark.measure(&mut processor, &profiles, &scenarios, compiler, Some(1));
-        if let Err(ref s) = result {
-            errors.incr();
-            eprintln!(
-                "collector error: Failed to profile '{}' with {:?}, recorded: {:?}",
-                benchmark.name, profiler, s
-            );
-        }
-    }
+
+    let error_count: usize = benchmarks
+        .par_iter()
+        .enumerate()
+        .map(|(i, benchmark)| {
+            let benchmark_id = format!("{} ({}/{})", benchmark.name, i + 1, benchmarks.len());
+            eprintln!("Executing benchmark {benchmark_id}");
+            let mut processor = ProfileProcessor::new(profiler, out_dir, id);
+            let result =
+                benchmark.measure(&mut processor, &profiles, &scenarios, compiler, Some(1));
+            eprintln!("Finished benchmark {benchmark_id}");
+
+            if let Err(ref s) = result {
+                eprintln!(
+                    "collector error: Failed to profile '{}' with {:?}, recorded: {:?}",
+                    benchmark.name, profiler, s
+                );
+                1
+            } else {
+                0
+            }
+        })
+        .sum();
+    errors.add(error_count);
 }
 
 fn main() {
@@ -859,6 +876,11 @@ enum Commands {
         // toolchain name, and `PathBuf` doesn't work well for the latter.
         #[clap(long)]
         rustc2: Option<String>,
+
+        /// How many benchmarks should be profiled in parallel.
+        /// This flag is only supported for certain profilers.
+        #[clap(long, short = 'j', default_value = "1")]
+        jobs: u64,
     },
 
     /// Installs the next commit for perf.rust-lang.org
@@ -1089,7 +1111,16 @@ fn main_result() -> anyhow::Result<i32> {
             local,
             out_dir,
             rustc2,
+            jobs,
         } => {
+            let jobs = jobs.max(1);
+            if jobs > 1 && !profiler.supports_parallel_execution() {
+                anyhow::bail!(
+                    "Profiler {:?} does not support parallel execution.",
+                    profiler
+                );
+            }
+
             let profiles = Profile::expand_all(&local.profiles);
             let scenarios = Scenario::expand_all(&local.scenarios);
 
@@ -1102,6 +1133,12 @@ fn main_result() -> anyhow::Result<i32> {
 
             let mut errors = BenchmarkErrors::new();
 
+            eprintln!("Running with {jobs} job(s)");
+            rayon::ThreadPoolBuilder::new()
+                .num_threads(jobs as usize)
+                .build_global()
+                .unwrap();
+
             let mut get_toolchain_and_profile =
                 |rustc: &str, suffix: &str| -> anyhow::Result<String> {
                     let (rustc, rustdoc, cargo, id) = get_local_toolchain(