Skip to content

Commit 4fba586

Browse files
Authored by: gui1117, github-actions[bot], shawntabrizi, bkchr
frame-omni-bencher: better diagnostic on insufficient data points (#11510)
When a benchmark is run with too few steps and too many data points are skipped, the analysis can panic. This PR improves the panic message and gives precise information about which benchmark is at fault. --------- Co-authored-by: cmd[bot] <41898282+github-actions[bot]@users.noreply.github.com> Co-authored-by: Shawn Tabrizi <shawntabrizi@gmail.com> Co-authored-by: Bastian Köcher <git@kchr.de>
1 parent cd3eb6d commit 4fba586

File tree

7 files changed

+112
-70
lines changed

7 files changed

+112
-70
lines changed

Cargo.lock

Lines changed: 2 additions & 0 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

prdoc/pr_11510.prdoc

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,11 @@
1+
title: 'frame-omni-bencher: better diagnostic on insufficient data points'
2+
doc:
3+
- audience: Runtime Dev
4+
description: When a benchmark is run with not enough steps and too many points are
5+
skipped then it can make the analysis panic. This PR improves the panic message
6+
and gives precise information about which benchmark is at fault.
7+
crates:
8+
- name: frame-benchmarking
9+
bump: major
10+
- name: frame-benchmarking-cli
11+
bump: major

substrate/frame/benchmarking/Cargo.toml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,7 @@ workspace = true
1616
targets = ["x86_64-unknown-linux-gnu"]
1717

1818
[dependencies]
19+
anyhow = { optional = true, workspace = true }
1920
codec = { workspace = true }
2021
frame-support = { workspace = true }
2122
frame-support-procedural = { workspace = true }
@@ -45,6 +46,7 @@ sp-state-machine = { workspace = true }
4546
[features]
4647
default = ["std"]
4748
std = [
49+
"anyhow/std",
4850
"codec/std",
4951
"frame-support-procedural/std",
5052
"frame-support/std",

substrate/frame/benchmarking/src/analysis.rs

Lines changed: 47 additions & 24 deletions
Original file line numberDiff line numberDiff line change
@@ -197,10 +197,11 @@ fn linear_regression(
197197
impl Analysis {
198198
// Useful for when there are no components, and we just need an median value of the benchmark
199199
// results. Note: We choose the median value because it is more robust to outliers.
200-
fn median_value(r: &Vec<BenchmarkResult>, selector: BenchmarkSelector) -> Option<Self> {
201-
if r.is_empty() {
202-
return None;
203-
}
200+
fn median_value(
201+
r: &Vec<BenchmarkResult>,
202+
selector: BenchmarkSelector,
203+
) -> Result<Self, anyhow::Error> {
204+
anyhow::ensure!(!r.is_empty(), "benchmark results cannot be empty");
204205

205206
let mut values: Vec<u128> = r
206207
.iter()
@@ -216,7 +217,7 @@ impl Analysis {
216217
values.sort();
217218
let mid = values.len() / 2;
218219

219-
Some(Self {
220+
Ok(Self {
220221
base: selector.scale_weight(values[mid]),
221222
slopes: Vec::new(),
222223
names: Vec::new(),
@@ -227,7 +228,12 @@ impl Analysis {
227228
})
228229
}
229230

230-
pub fn median_slopes(r: &Vec<BenchmarkResult>, selector: BenchmarkSelector) -> Option<Self> {
231+
pub fn median_slopes(
232+
r: &Vec<BenchmarkResult>,
233+
selector: BenchmarkSelector,
234+
) -> Result<Self, anyhow::Error> {
235+
anyhow::ensure!(!r.is_empty(), "benchmark results cannot be empty");
236+
231237
if r[0].components.is_empty() {
232238
return Self::median_value(r, selector);
233239
}
@@ -273,7 +279,7 @@ impl Analysis {
273279

274280
let models = results
275281
.iter()
276-
.map(|(_, _, _, ref values)| {
282+
.map(|(param_name, _, _, ref values)| {
277283
let mut slopes = vec![];
278284
for (i, &(x1, y1)) in values.iter().enumerate() {
279285
for &(x2, y2) in values.iter().skip(i + 1) {
@@ -282,6 +288,19 @@ impl Analysis {
282288
}
283289
}
284290
}
291+
if slopes.is_empty() {
292+
let unique_values = values
293+
.iter()
294+
.map(|(x, _)| x)
295+
.collect::<std::collections::BTreeSet<_>>()
296+
.len();
297+
return Err(anyhow::anyhow!(
298+
"Parameter `{param_name}` only has \
299+
{unique_values} unique value(s) but needs at least 2 to compute a slope. \
300+
This can happen when too many benchmark samples are skipped. \
301+
Try increasing the number of steps for this parameter or fix the benchmark.",
302+
));
303+
}
285304
slopes.sort_by(|a, b| a.partial_cmp(b).expect("values well defined; qed"));
286305
let slope = slopes[slopes.len() / 2];
287306

@@ -292,9 +311,9 @@ impl Analysis {
292311
offsets.sort_by(|a, b| a.partial_cmp(b).expect("values well defined; qed"));
293312
let offset = offsets[offsets.len() / 2];
294313

295-
(offset, slope)
314+
Ok((offset, slope))
296315
})
297-
.collect::<Vec<_>>();
316+
.collect::<Result<Vec<_>, anyhow::Error>>()?;
298317

299318
let models = models
300319
.iter()
@@ -316,7 +335,7 @@ impl Analysis {
316335
.map(|x| selector.scale_and_cast_weight(x.1.max(0f64), false))
317336
.collect::<Vec<_>>();
318337

319-
Some(Self {
338+
Ok(Self {
320339
base,
321340
slopes,
322341
names: results.into_iter().map(|x| x.0).collect::<Vec<_>>(),
@@ -327,7 +346,12 @@ impl Analysis {
327346
})
328347
}
329348

330-
pub fn min_squares_iqr(r: &Vec<BenchmarkResult>, selector: BenchmarkSelector) -> Option<Self> {
349+
pub fn min_squares_iqr(
350+
r: &Vec<BenchmarkResult>,
351+
selector: BenchmarkSelector,
352+
) -> Result<Self, anyhow::Error> {
353+
anyhow::ensure!(!r.is_empty(), "benchmark results cannot be empty");
354+
331355
if r[0].components.is_empty() || r.len() <= 2 {
332356
return Self::median_value(r, selector);
333357
}
@@ -379,9 +403,12 @@ impl Analysis {
379403
}
380404
}
381405

382-
let (intercept, slopes, errors) = linear_regression(xs, ys, r[0].components.len())?;
406+
let (intercept, slopes, errors) = linear_regression(xs, ys, r[0].components.len())
407+
.ok_or_else(|| {
408+
anyhow::anyhow!("linear regression failed for min_squares_iqr analysis")
409+
})?;
383410

384-
Some(Self {
411+
Ok(Self {
385412
base: selector.scale_and_cast_weight(intercept, true),
386413
slopes: slopes
387414
.into_iter()
@@ -400,16 +427,12 @@ impl Analysis {
400427
})
401428
}
402429

403-
pub fn max(r: &Vec<BenchmarkResult>, selector: BenchmarkSelector) -> Option<Self> {
404-
let median_slopes = Self::median_slopes(r, selector);
405-
let min_squares = Self::min_squares_iqr(r, selector);
406-
407-
if median_slopes.is_none() || min_squares.is_none() {
408-
return None;
409-
}
410-
411-
let median_slopes = median_slopes.unwrap();
412-
let min_squares = min_squares.unwrap();
430+
pub fn max(
431+
r: &Vec<BenchmarkResult>,
432+
selector: BenchmarkSelector,
433+
) -> Result<Self, anyhow::Error> {
434+
let median_slopes = Self::median_slopes(r, selector)?;
435+
let min_squares = Self::min_squares_iqr(r, selector)?;
413436

414437
let base = median_slopes.base.max(min_squares.base);
415438
let slopes = median_slopes
@@ -429,7 +452,7 @@ impl Analysis {
429452
let errors = min_squares.errors;
430453
let minimum = selector.get_minimum(&r);
431454

432-
Some(Self { base, slopes, names, value_dists, errors, selector, minimum })
455+
Ok(Self { base, slopes, names, value_dists, errors, selector, minimum })
433456
}
434457
}
435458

substrate/utils/frame/benchmarking-cli/Cargo.toml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,7 @@ targets = ["x86_64-unknown-linux-gnu"]
1717

1818
[dependencies]
1919
Inflector = { workspace = true }
20+
anyhow = { workspace = true, default-features = true }
2021
array-bytes = { workspace = true, default-features = true }
2122
chrono = { workspace = true }
2223
clap = { features = ["derive"], workspace = true }

substrate/utils/frame/benchmarking-cli/src/pallet/command.rs

Lines changed: 29 additions & 32 deletions
Original file line numberDiff line numberDiff line change
@@ -893,7 +893,8 @@ impl PalletCmd {
893893

894894
if !self.no_storage_info {
895895
let mut storage_per_prefix = HashMap::<Vec<u8>, Vec<BenchmarkResult>>::new();
896-
let pov_mode = pov_modes.get(&(pallet, benchmark)).cloned().unwrap_or_default();
896+
let pov_mode =
897+
pov_modes.get(&(pallet, benchmark.clone())).cloned().unwrap_or_default();
897898

898899
let comments = writer::process_storage_results(
899900
&mut storage_per_prefix,
@@ -914,49 +915,45 @@ impl PalletCmd {
914915
// Conduct analysis.
915916
if !self.no_median_slopes {
916917
println!("Median Slopes Analysis\n========");
917-
if let Some(analysis) =
918-
Analysis::median_slopes(&batch.time_results, BenchmarkSelector::ExtrinsicTime)
918+
match Analysis::median_slopes(&batch.time_results, BenchmarkSelector::ExtrinsicTime)
919919
{
920-
println!("-- Extrinsic Time --\n{}", analysis);
920+
Ok(analysis) => println!("-- Extrinsic Time --\n{}", analysis),
921+
Err(err) => println!("-- Extrinsic Time --\nError: {:?}", err),
921922
}
922-
if let Some(analysis) =
923-
Analysis::median_slopes(&batch.db_results, BenchmarkSelector::Reads)
924-
{
925-
println!("Reads = {:?}", analysis);
923+
match Analysis::median_slopes(&batch.db_results, BenchmarkSelector::Reads) {
924+
Ok(analysis) => println!("Reads = {:?}", analysis),
925+
Err(err) => println!("Reads: Error: {:?}", err),
926926
}
927-
if let Some(analysis) =
928-
Analysis::median_slopes(&batch.db_results, BenchmarkSelector::Writes)
929-
{
930-
println!("Writes = {:?}", analysis);
927+
match Analysis::median_slopes(&batch.db_results, BenchmarkSelector::Writes) {
928+
Ok(analysis) => println!("Writes = {:?}", analysis),
929+
Err(err) => println!("Writes: Error: {:?}", err),
931930
}
932-
if let Some(analysis) =
933-
Analysis::median_slopes(&batch.db_results, BenchmarkSelector::ProofSize)
934-
{
935-
println!("Recorded proof Size = {:?}", analysis);
931+
match Analysis::median_slopes(&batch.db_results, BenchmarkSelector::ProofSize) {
932+
Ok(analysis) => println!("Recorded proof Size = {:?}", analysis),
933+
Err(err) => println!("Recorded proof Size: Error: {:?}", err),
936934
}
937935
println!();
938936
}
939937
if !self.no_min_squares {
940938
println!("Min Squares Analysis\n========");
941-
if let Some(analysis) =
942-
Analysis::min_squares_iqr(&batch.time_results, BenchmarkSelector::ExtrinsicTime)
943-
{
944-
println!("-- Extrinsic Time --\n{}", analysis);
939+
match Analysis::min_squares_iqr(
940+
&batch.time_results,
941+
BenchmarkSelector::ExtrinsicTime,
942+
) {
943+
Ok(analysis) => println!("-- Extrinsic Time --\n{}", analysis),
944+
Err(err) => println!("-- Extrinsic Time --\nError: {:?}", err),
945945
}
946-
if let Some(analysis) =
947-
Analysis::min_squares_iqr(&batch.db_results, BenchmarkSelector::Reads)
948-
{
949-
println!("Reads = {:?}", analysis);
946+
match Analysis::min_squares_iqr(&batch.db_results, BenchmarkSelector::Reads) {
947+
Ok(analysis) => println!("Reads = {:?}", analysis),
948+
Err(err) => println!("Reads: Error: {:?}", err),
950949
}
951-
if let Some(analysis) =
952-
Analysis::min_squares_iqr(&batch.db_results, BenchmarkSelector::Writes)
953-
{
954-
println!("Writes = {:?}", analysis);
950+
match Analysis::min_squares_iqr(&batch.db_results, BenchmarkSelector::Writes) {
951+
Ok(analysis) => println!("Writes = {:?}", analysis),
952+
Err(err) => println!("Writes: Error: {:?}", err),
955953
}
956-
if let Some(analysis) =
957-
Analysis::min_squares_iqr(&batch.db_results, BenchmarkSelector::ProofSize)
958-
{
959-
println!("Recorded proof Size = {:?}", analysis);
954+
match Analysis::min_squares_iqr(&batch.db_results, BenchmarkSelector::ProofSize) {
955+
Ok(analysis) => println!("Recorded proof Size = {:?}", analysis),
956+
Err(err) => println!("Recorded proof Size: Error: {:?}", err),
960957
}
961958
println!();
962959
}

substrate/utils/frame/benchmarking-cli/src/pallet/writer.rs

Lines changed: 20 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -23,6 +23,7 @@ use std::{
2323
path::PathBuf,
2424
};
2525

26+
use anyhow::Context;
2627
use inflector::Inflector;
2728
use itertools::Itertools;
2829
use serde::Serialize;
@@ -142,10 +143,10 @@ fn map_results(
142143
pov_analysis_choice: &AnalysisChoice,
143144
worst_case_map_values: u32,
144145
additional_trie_layers: u8,
145-
) -> Result<HashMap<(String, String), Vec<BenchmarkData>>, std::io::Error> {
146+
) -> Result<HashMap<(String, String), Vec<BenchmarkData>>, sc_cli::Error> {
146147
// Skip if batches is empty.
147148
if batches.is_empty() {
148-
return Err(io_error("empty batches"));
149+
return Err(io_error("empty batches").into());
149150
}
150151

151152
let mut all_benchmarks = HashMap::<_, Vec<BenchmarkData>>::new();
@@ -168,7 +169,7 @@ fn map_results(
168169
pov_analysis_choice,
169170
worst_case_map_values,
170171
additional_trie_layers,
171-
);
172+
)?;
172173
let pallet_benchmarks = all_benchmarks.entry((pallet_name, instance_name)).or_default();
173174
pallet_benchmarks.push(benchmark_data);
174175
}
@@ -198,7 +199,7 @@ fn get_benchmark_data(
198199
pov_analysis_choice: &AnalysisChoice,
199200
worst_case_map_values: u32,
200201
additional_trie_layers: u8,
201-
) -> BenchmarkData {
202+
) -> Result<BenchmarkData, sc_cli::Error> {
202203
// Analyze benchmarks to get the linear regression.
203204
let analysis_function = match analysis_choice {
204205
AnalysisChoice::MinSquares => Analysis::min_squares_iqr,
@@ -214,14 +215,18 @@ fn get_benchmark_data(
214215
let benchmark = String::from_utf8(batch.benchmark.clone()).unwrap();
215216

216217
let extrinsic_time = analysis_function(&batch.time_results, BenchmarkSelector::ExtrinsicTime)
217-
.expect("analysis function should return an extrinsic time for valid inputs");
218+
.context(format!("benchmark '{pallet}::{benchmark}'"))
219+
.map_err(|e| sc_cli::Error::Application(e.into()))?;
218220
let reads = analysis_function(&batch.db_results, BenchmarkSelector::Reads)
219-
.expect("analysis function should return the number of reads for valid inputs");
221+
.context(format!("benchmark '{pallet}::{benchmark}'"))
222+
.map_err(|e| sc_cli::Error::Application(e.into()))?;
220223
let writes = analysis_function(&batch.db_results, BenchmarkSelector::Writes)
221-
.expect("analysis function should return the number of writes for valid inputs");
224+
.context(format!("benchmark '{pallet}::{benchmark}'"))
225+
.map_err(|e| sc_cli::Error::Application(e.into()))?;
222226
let recorded_proof_size =
223227
pov_analysis_function(&batch.db_results, BenchmarkSelector::ProofSize)
224-
.expect("analysis function should return proof sizes for valid inputs");
228+
.context(format!("benchmark '{pallet}::{benchmark}'"))
229+
.map_err(|e| sc_cli::Error::Application(e.into()))?;
225230

226231
// Analysis data may include components that are not used, this filters out anything whose value
227232
// is zero.
@@ -298,21 +303,22 @@ fn get_benchmark_data(
298303
additional_trie_layers,
299304
);
300305

301-
let proof_size_per_components = storage_per_prefix
306+
let proof_size_per_components: Vec<_> = storage_per_prefix
302307
.iter()
303308
.map(|(prefix, results)| {
304309
let proof_size = analysis_function(results, BenchmarkSelector::ProofSize)
305-
.expect("analysis function should return proof sizes for valid inputs");
310+
.context(format!("benchmark '{pallet}::{benchmark}'"))
311+
.map_err(|e| sc_cli::Error::Application(e.into()))?;
306312
let slope = proof_size
307313
.slopes
308314
.into_iter()
309315
.zip(proof_size.names.iter())
310316
.zip(extract_errors(&proof_size.errors))
311317
.map(|((slope, name), error)| ComponentSlope { name: name.clone(), slope, error })
312318
.collect::<Vec<_>>();
313-
(prefix.clone(), slope, proof_size.base)
319+
Ok((prefix.clone(), slope, proof_size.base))
314320
})
315-
.collect::<Vec<_>>();
321+
.collect::<Result<_, sc_cli::Error>>()?;
316322

317323
let mut base_calculated_proof_size = 0;
318324
// Sum up the proof sizes per component
@@ -357,7 +363,7 @@ fn get_benchmark_data(
357363
.map(|c| c.clone())
358364
.unwrap_or_default();
359365

360-
BenchmarkData {
366+
Ok(BenchmarkData {
361367
name: benchmark,
362368
components,
363369
base_weight: extrinsic_time.base,
@@ -373,7 +379,7 @@ fn get_benchmark_data(
373379
component_ranges,
374380
comments,
375381
min_execution_time: extrinsic_time.minimum,
376-
}
382+
})
377383
}
378384

379385
/// Create weight file from benchmark data and Handlebars template.

0 commit comments

Comments (0)