uutils
diff --git a/‎src/uu/cmp/benches/cmp_bench.rs‎
Lines changed: 158 additions & 151 deletions b/‎src/uu/cmp/benches/cmp_bench.rs‎
Lines changed: 158 additions & 151 deletions
@@ -1,151 +1,158 @@
-#![allow(unused)]
-// This file is part of the uutils diffutils package.
-//
-// For the full copyright and license information, please view the LICENSE-*
-// files that was distributed with this source code.
-
-//! Benches for all utils in diffutils.
-//!
-//! There is a file generator included to create files of different sizes for comparison. \
-//! Set the TEMP_DIR const to keep the files. df_to_ files have small changes in them, search for '#'. \
-//! File generation up to 1 GB is really fast, Benchmarking above 100 MB takes very long.
-
-/// Generate test files with these sizes in KB.
-const FILE_SIZES_IN_KILO_BYTES: [u64; 4] = [100, 1 * MB, 10 * MB, 25 * MB];
-const NUM_DIFF: u64 = 4;
-// Empty String to use TempDir (files will be removed after test) or specify dir to keep generated files
-const TEMP_DIR: &str = "";
-// just for FILE_SIZE_KILO_BYTES
-const MB: u64 = 1_000;
-
-use std::sync::OnceLock;
-
-use divan::Bencher;
-use tempfile::TempDir;
-use uu_cmp::{params_cmp::Params, uu_app};
-// use uu_cmp::parse_params;
-// use uu_cmp::uumain;
-use uudiff::benchmark::{
-    bench_binary,
-    prepare_bench::{BenchContext, generate_test_files_bytes},
-    str_to_args,
-};
-
-// bench the time it takes to parse the command line arguments
-#[divan::bench]
-fn cmp_parser(bencher: Bencher) {
-    let cmd = "cmd file_1.txt file_2.txt -bl -n10M --ignore-initial=100KiB:1MiB";
-    let args = str_to_args(&cmd).into_iter().peekable();
-    bencher.with_inputs(|| args.clone()).bench_values(
-        // |params: std::iter::Peekable<std::vec::IntoIter<std::ffi::OsString>>| parse_params(params),
-        |params: std::iter::Peekable<std::vec::IntoIter<std::ffi::OsString>>| {
-            let matches = uudiff::clap_localization::handle_clap_result(uu_app(), params).unwrap();
-            let params: Params = matches.try_into().unwrap();
-        },
-    );
-    // );
-}
-
-// // // test the impact on the benchmark if not converting the cmd to Vec<OsString> (doubles for parse)
-// #[divan::bench]
-// fn cmp_parser_no_prepare() {
-//     let cmd = "cmd file_1.txt file_2.txt -bl n10M --ignore-initial=100KiB:1MiB";
-//     let args = str_to_args(&cmd).into_iter().peekable();
-//     let _ = parse_params(args);
-// }
-
-// bench equal, full file read
-#[divan::bench(args = FILE_SIZES_IN_KILO_BYTES)]
-fn cmp_compare_files_equal(bencher: Bencher, kb: u64) {
-    let fp = get_context().get_files_equal_kb(kb).unwrap();
-    let cmd = format!("cmp {} {}", fp.from, fp.to);
-    let args = str_to_args(&cmd).into_iter();
-
-    bencher
-        // .with_inputs(|| prepare::cmp_params_identical_testfiles(lines))
-        .with_inputs(|| args.clone())
-        .bench_refs(|params| uu_cmp::uumain(params.peekable()));
-}
-
-// bench different; cmp exits on first difference
-#[divan::bench(args = FILE_SIZES_IN_KILO_BYTES)]
-fn cmp_compare_files_different(bencher: Bencher, kb: u64) {
-    let fp = get_context().get_files_different_kb(kb).unwrap();
-    let cmd = format!("cmp -s {} {}", fp.from, fp.to);
-    let args = str_to_args(&cmd).into_iter();
-
-    bencher
-        // .with_inputs(|| prepare::cmp_params_identical_testfiles(lines))
-        .with_inputs(|| args.clone())
-        .bench_refs(|params| uu_cmp::uumain(params.peekable()));
-}
-
-// TODO use coreutils bench logic
-// bench original GNU cmp
-#[cfg(feature = "feat_run_binary_bench")]
-#[divan::bench(args = FILE_SIZES_IN_KILO_BYTES)]
-fn cmd_cmp_gnu_equal(bencher: Bencher, kb: u64) {
-    let fp = get_context().get_files_equal_kb(kb).unwrap();
-    let args_str = format!("{} {}", fp.from, fp.to);
-    bencher
-        // .with_inputs(|| prepare::cmp_params_identical_testfiles(lines))
-        .with_inputs(|| args_str.clone())
-        .bench_refs(|cmd_args| bench_binary::bench_binary("cmp", cmd_args));
-}
-
-// bench the compiled release version
-#[cfg(feature = "feat_run_binary_bench")]
-#[divan::bench(args = FILE_SIZES_IN_KILO_BYTES)]
-fn cmd_cmp_release_equal(bencher: Bencher, kb: u64) {
-    // search for src, then shorten path
-    let dir = std::env::current_dir().unwrap();
-    let path = dir.to_string_lossy();
-    let path = path.trim_end_matches("src/uu/cmp");
-    let prg = path.to_string() + "target/release/cmp";
-
-    let fp = get_context().get_files_equal_kb(kb).unwrap();
-    let args_str = format!("{} {}", fp.from, fp.to);
-
-    bencher
-        // .with_inputs(|| prepare::cmp_params_identical_testfiles(lines))
-        .with_inputs(|| args_str.clone())
-        .bench_refs(|cmd_args| bench_binary::bench_binary(&prg, cmd_args));
-}
-
-// Since each bench function is separate in Divan it is more difficult to dynamically create test data.
-// This keeps the TempDir alive until the program exits and generates the files only once.
-static SHARED_CONTEXT: OnceLock<BenchContext> = OnceLock::new();
-/// Creates the test files once and provides them to all tests.
-pub fn get_context() -> &'static BenchContext {
-    SHARED_CONTEXT.get_or_init(|| {
-        let mut ctx = BenchContext::default();
-        if TEMP_DIR.is_empty() {
-            let tmp_dir = TempDir::new().expect("Failed to create temp dir");
-            ctx.tmp_dir = Some(tmp_dir);
-        } else {
-            // uses current directory, the generated files are kept
-            let path = std::path::Path::new(TEMP_DIR);
-            if !path.exists() {
-                std::fs::create_dir_all(path).expect("Path {path} could not be created");
-            }
-            ctx.dir = TEMP_DIR.to_string();
-        };
-
-        // generate test bytes
-        for kb in FILE_SIZES_IN_KILO_BYTES {
-            let f = generate_test_files_bytes(ctx.get_path(), kb * 1000, 0, "eq")
-                .expect("generate_test_files failed");
-            ctx.files_equal.push(f);
-            let f = generate_test_files_bytes(ctx.get_path(), kb * 1000, NUM_DIFF, "df")
-                .expect("generate_test_files failed");
-            ctx.files_different.push(f);
-        }
-
-        ctx
-    })
-}
-
-fn main() {
-    // Run registered benchmarks.
-    divan::main();
-}
+#![allow(unused)]
+// This file is part of the uutils diffutils package.
+//
+// For the full copyright and license information, please view the LICENSE-*
+// files that was distributed with this source code.
+
+//! Benches for all utils in diffutils.
+//!
+//! There is a file generator included to create files of different sizes for comparison. \
+//! Set the TEMP_DIR const to keep the files. df_to_ files have small changes in them, search for '#'. \
+//! File generation up to 1 GB is really fast, Benchmarking above 100 MB takes very long.
+
+/// Generate test files with these sizes in KB.
+const FILE_SIZES_IN_KILO_BYTES: [u64; 5] = [100, 1 * MB, 10 * MB, 25 * MB, 100 * MB];
+const NUM_DIFF: u64 = 4;
+// Empty String to use TempDir (files will be removed after test) or specify dir to keep generated files
+const TEMP_DIR: &str = "";
+// just for FILE_SIZE_KILO_BYTES
+const MB: u64 = 1_000;
+
+use std::{
+    path::{Path, PathBuf},
+    sync::OnceLock,
+};
+
+use divan::Bencher;
+use tempfile::TempDir;
+use uu_cmp::{params_cmp::Params, uu_app};
+use uudiff::benchmark::{
+    bench_binary,
+    prepare_bench::{BenchContext, generate_test_files_bytes},
+    str_to_args,
+};
+
+// bench the time it takes to parse the command line arguments
+#[divan::bench]
+fn cmp_parser(bencher: Bencher) {
+    let cmd = "cmd file_1.txt file_2.txt -bl -n10M --ignore-initial=100KiB:1MiB";
+    let args = str_to_args(&cmd).into_iter().peekable();
+    bencher.with_inputs(|| args.clone()).bench_values(
+        // |params: std::iter::Peekable<std::vec::IntoIter<std::ffi::OsString>>| parse_params(params),
+        |params: std::iter::Peekable<std::vec::IntoIter<std::ffi::OsString>>| {
+            let matches = uudiff::clap_localization::handle_clap_result(uu_app(), params).unwrap();
+            let params: Params = matches.try_into().unwrap();
+        },
+    );
+    // );
+}
+
+// // // test the impact on the benchmark if not converting the cmd to Vec<OsString> (doubles for parse)
+// #[divan::bench]
+// fn cmp_parser_no_prepare() {
+//     let cmd = "cmd file_1.txt file_2.txt -bl n10M --ignore-initial=100KiB:1MiB";
+//     let args = str_to_args(&cmd).into_iter().peekable();
+//     let _ = parse_params(args);
+// }
+
+// bench equal, full file read
+#[divan::bench(args = FILE_SIZES_IN_KILO_BYTES)]
+fn cmp_compare_files_equal(bencher: Bencher, kb: u64) {
+    let fp = get_context().get_files_equal_kb(kb).unwrap();
+    let cmd = format!("cmp {} {}", fp.from, fp.to);
+    let args = str_to_args(&cmd).into_iter();
+    let matches =
+        uudiff::clap_localization::handle_clap_result_with_exit_code(uu_app(), args, 2).unwrap();
+    let params: Params = matches.try_into().unwrap();
+
+    bencher
+        // .with_inputs(|| prepare::cmp_params_identical_testfiles(lines))
+        .with_inputs(|| params.clone())
+        .bench_refs(|params| uu_cmp::cmp_compare(params));
+}
+
+// bench different; cmp exits on first difference
+#[divan::bench(args = FILE_SIZES_IN_KILO_BYTES)]
+fn cmp_compare_files_different(bencher: Bencher, kb: u64) {
+    let fp = get_context().get_files_different_kb(kb).unwrap();
+    let cmd = format!("cmp -s {} {}", fp.from, fp.to);
+    let args = str_to_args(&cmd).into_iter();
+
+    bencher
+        // .with_inputs(|| prepare::cmp_params_identical_testfiles(lines))
+        .with_inputs(|| args.clone())
+        .bench_refs(|params| uu_cmp::uumain(params.peekable()));
+}
+
+// TODO use coreutils bench logic
+// bench original GNU cmp
+#[cfg(feature = "feat_run_binary_bench")]
+#[divan::bench(args = FILE_SIZES_IN_KILO_BYTES)]
+fn cmd_cmp_gnu_equal(bencher: Bencher, kb: u64) {
+    let fp = get_context().get_files_equal_kb(kb).unwrap();
+    let args_str = format!("{} {}", fp.from, fp.to);
+    bencher
+        // .with_inputs(|| prepare::cmp_params_identical_testfiles(lines))
+        .with_inputs(|| args_str.clone())
+        .bench_refs(|cmd_args| bench_binary::bench_binary(&PathBuf::from("cmp"), cmd_args));
+}
+
+// bench the compiled release version
+#[cfg(feature = "feat_run_binary_bench")]
+#[divan::bench(args = FILE_SIZES_IN_KILO_BYTES)]
+fn cmd_cmp_release_equal(bencher: Bencher, kb: u64) {
+    let mut dir = std::env::current_dir().unwrap();
+    let suffix = Path::new("src").join("uu").join("cmp");
+    if dir.ends_with(suffix) {
+        dir.pop();
+        dir.pop();
+        dir.pop();
+    }
+    let prg = dir.join("target").join("release").join("cmp");
+
+    let fp = get_context().get_files_equal_kb(kb).unwrap();
+    let args_str = format!("{} {}", fp.from, fp.to);
+
+    bencher
+        // .with_inputs(|| prepare::cmp_params_identical_testfiles(lines))
+        .with_inputs(|| args_str.clone())
+        .bench_refs(|cmd_args| bench_binary::bench_binary(&prg, cmd_args));
+}
+
+// Since each bench function is separate in Divan it is more difficult to dynamically create test data.
+// This keeps the TempDir alive until the program exits and generates the files only once.
+static SHARED_CONTEXT: OnceLock<BenchContext> = OnceLock::new();
+/// Creates the test files once and provides them to all tests.
+pub fn get_context() -> &'static BenchContext {
+    SHARED_CONTEXT.get_or_init(|| {
+        let mut ctx = BenchContext::default();
+        if TEMP_DIR.is_empty() {
+            let tmp_dir = TempDir::new().expect("Failed to create temp dir");
+            ctx.tmp_dir = Some(tmp_dir);
+        } else {
+            // uses current directory, the generated files are kept
+            let path = std::path::Path::new(TEMP_DIR);
+            if !path.exists() {
+                std::fs::create_dir_all(path).expect("Path {path} could not be created");
+            }
+            ctx.dir = TEMP_DIR.to_string();
+        };
+
+        // generate test bytes
+        for kb in FILE_SIZES_IN_KILO_BYTES {
+            let f = generate_test_files_bytes(ctx.get_path(), kb * 1000, 0, "eq")
+                .expect("generate_test_files failed");
+            ctx.files_equal.push(f);
+            let f = generate_test_files_bytes(ctx.get_path(), kb * 1000, NUM_DIFF, "df")
+                .expect("generate_test_files failed");
+            ctx.files_different.push(f);
+        }
+
+        ctx
+    })
+}
+
+fn main() {
+    // Run registered benchmarks.
+    divan::main();
+}