seq: Buffer writes to stdout

drinkcat · drinkcat · commit 85fa12bf8d68 · 2025-03-19T09:51:42.000+01:00
Use a BufWriter to wrap stdout: this reduces the number of system calls
and improves performance drastically (2x in some cases).

Also document use cases in src/uu/seq/BENCHMARKING.md, and the
optimization we have just done here.
diff --git a/src/uu/seq/BENCHMARKING.md b/src/uu/seq/BENCHMARKING.md
@@ -19,7 +19,57 @@ Finally, you can compare the performance of the two versions of `seq`
 by running, for example,
 
 ```shell
-hyperfine "seq 1000000" "target/release/seq 1000000"
+hyperfine -L seq seq,target/release/seq "{seq} 1000000"
+```
+
+## Interesting test cases
+
+Performance characteristics may vary a lot depending on the parameters,
+and on whether custom formatting is required. In particular, it appears
+that the GNU implementation is heavily optimized for positive integer
+outputs (which is probably the most common use case for `seq`).
+
+Specifying a format or fixed width will slow down the
+execution a lot (~15-20 times on GNU `seq`):
+```shell
+hyperfine -L seq seq,target/release/seq "{seq} -f%g 1000000"
+hyperfine -L seq seq,target/release/seq "{seq} -w 1000000"
+```
+
+Floating point increments, or any negative bound, also degrade
+performance (~10-15 times on GNU `seq`):
+```shell
+hyperfine -L seq seq,./target/release/seq "{seq} 0 0.000001 1"
+hyperfine -L seq seq,./target/release/seq "{seq} -100 1 1000000"
+```
+
+## Optimizations
+
+### Buffering stdout
+
+The original `uutils` implementation of `seq` did unbuffered writes
+to stdout, causing a large number of system calls (and therefore a large amount
+of system time). Simply wrapping `stdout` in a `BufWriter` roughly doubled
+performance for a floating point increment test case, bringing it on par
+with GNU `seq`:
+```shell
+taskset -c 0 hyperfine -L seq seq,./seq-main,target/release/seq "{seq} 0 0.1 100000"
+Benchmark 1: seq 0 0.1 100000
+  Time (mean ± σ):     161.6 ms ±   0.3 ms    [User: 160.8 ms, System: 0.6 ms]
+  Range (min … max):   161.2 ms … 162.4 ms    18 runs
+
+Benchmark 2: ./seq-main 0 0.1 100000
+  Time (mean ± σ):     282.7 ms ±   5.0 ms    [User: 221.0 ms, System: 60.0 ms]
+  Range (min … max):   279.7 ms … 296.2 ms    10 runs
+
+Benchmark 3: target/release/seq 0 0.1 100000
+  Time (mean ± σ):     143.8 ms ±   0.3 ms    [User: 143.0 ms, System: 0.6 ms]
+  Range (min … max):   143.2 ms … 144.4 ms    20 runs
+
+Summary
+  target/release/seq 0 0.1 100000 ran
+    1.12 ± 0.00 times faster than seq 0 0.1 100000
+    1.97 ± 0.03 times faster than ./seq-main 0 0.1 100000
 ```
 
 [0]: https://github.com/sharkdp/hyperfine
diff --git a/src/uu/seq/src/seq.rs b/src/uu/seq/src/seq.rs
@@ -4,7 +4,7 @@
 // file that was distributed with this source code.
 // spell-checker:ignore (ToDO) bigdecimal extendedbigdecimal numberparse hexadecimalfloat
 use std::ffi::OsString;
-use std::io::{stdout, ErrorKind, Write};
+use std::io::{stdout, BufWriter, ErrorKind, Write};
 
 use clap::{Arg, ArgAction, Command};
 use num_traits::{ToPrimitive, Zero};
@@ -262,8 +262,8 @@ fn print_seq(
     padding: usize,
     format: Option<&Format<num_format::Float>>,
 ) -> std::io::Result<()> {
-    let stdout = stdout();
-    let mut stdout = stdout.lock();
+    let stdout = stdout().lock();
+    let mut stdout = BufWriter::new(stdout);
     let (first, increment, last) = range;
     let mut value = first;
     let padding = if pad {