From 0b3f3b0e28d0ec9c9e3818ab304711471561a60d Mon Sep 17 00:00:00 2001 From: Josh Date: Mon, 10 Nov 2025 11:18:54 -0500 Subject: [PATCH] test-utils: surface dpd errors. At the moment, DendriteInstance::start in omicron-test-utils doesn't catch errors in dpd. We spawn a child process, wait up to the timeout interval to discover the dpd port from its logs, and fail if we can't discover the port. But if dpd exits quickly, we still wait the timeout interval and swallow any errors. This patch captures the stderr of the dpd child process, checks it for an early exit, and prints the details if dpd crashes. --- test-utils/src/dev/dendrite.rs | 65 ++++++++++++++++++++++++++-------- 1 file changed, 50 insertions(+), 15 deletions(-) diff --git a/test-utils/src/dev/dendrite.rs b/test-utils/src/dev/dendrite.rs index eaf659a4f51..e178c5ce72e 100644 --- a/test-utils/src/dev/dendrite.rs +++ b/test-utils/src/dev/dendrite.rs @@ -63,27 +63,25 @@ impl DendriteInstance { args.push(socket_addr.to_string()); } - let child = tokio::process::Command::new("dpd") + let mut child = tokio::process::Command::new("dpd") .args(&args) .stdin(Stdio::null()) .stdout(Stdio::from(redirect_file( temp_dir.path(), "dendrite_stdout", )?)) - .stderr(Stdio::from(redirect_file( - temp_dir.path(), - "dendrite_stderr", - )?)) + .stderr(Stdio::piped()) .spawn() .with_context(|| { format!("failed to spawn `dpd` (with args: {:?})", &args) })?; - - let child = Some(child); + let stderr = child.stderr.take().unwrap(); let temp_dir = temp_dir.keep(); if port == 0 { port = discover_port( + &mut child, + stderr, temp_dir.join("dendrite_stdout").display().to_string(), ) .await @@ -95,7 +93,7 @@ impl DendriteInstance { })?; } - Ok(Self { port, args, child, data_dir: Some(temp_dir) }) + Ok(Self { port, args, child: Some(child), data_dir: Some(temp_dir) }) } pub async fn cleanup(&mut self) -> Result<(), anyhow::Error> { @@ -145,20 +143,45 @@ fn redirect_file( .with_context(|| format!("open \"{}\"", out_path.display())) } -async fn discover_port(logfile: String) -> Result { +async fn discover_port( + child: &mut tokio::process::Child, + stderr: tokio::process::ChildStderr, + logfile: String, +) -> Result { let timeout = Instant::now() + DENDRITE_TIMEOUT; - tokio::time::timeout_at(timeout, find_dendrite_port_in_log(logfile)) - .await - .context("time out while discovering dendrite port number")? + tokio::time::timeout_at( + timeout, + find_dendrite_port_in_log(child, stderr, logfile), + ) + .await + .context("time out while discovering dendrite port number")? } async fn find_dendrite_port_in_log( + child: &mut tokio::process::Child, + mut stderr: tokio::process::ChildStderr, logfile: String, ) -> Result { let re = regex::Regex::new(r#""local_addr":"\[::1\]:([0-9]+)""#).unwrap(); let mut reader = BufReader::new(File::open(&logfile).await?); let mut lines = reader.lines(); loop { + // Exit early if the process has exited. + if let Some(exit_status) = child.try_wait()? { + let mut stderr_contents = String::new(); + tokio::io::AsyncReadExt::read_to_string( + &mut stderr, + &mut stderr_contents, + ) + .await?; + + anyhow::bail!( + "dpd exited with status {} before port could be discovered: {}", + exit_status, + stderr_contents + ); + } + match lines.next_line().await? { Some(line) => { if let Some(cap) = re.captures(&line) { @@ -212,10 +235,22 @@ mod tests { writeln!(file, "Another garbage line").unwrap(); file.flush().unwrap(); + let mut child = tokio::process::Command::new("yes") + .stdin(Stdio::null()) + .stdout(Stdio::null()) + .stderr(Stdio::piped()) + .spawn() + .unwrap(); + let stderr = child.stderr.take().unwrap(); + assert_eq!( - find_dendrite_port_in_log(file.path().display().to_string()) - .await - .unwrap(), + find_dendrite_port_in_log( + &mut child, + stderr, + file.path().display().to_string() + ) + .await + .unwrap(), EXPECTED_PORT ); }