rustcoreutils
diff --git a/‎Cargo.lock‎
Lines changed: 291 additions & 3 deletions b/‎Cargo.lock‎
Lines changed: 291 additions & 3 deletions
diff --git a/‎Cargo.toml‎
Lines changed: 3 additions & 1 deletion b/‎Cargo.toml‎
Lines changed: 3 additions & 1 deletion
diff --git a/‎datetime/tests/time/mod.rs‎
Lines changed: 1 addition & 1 deletion b/‎datetime/tests/time/mod.rs‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎m4/Cargo.toml‎
Lines changed: 27 additions & 0 deletions b/‎m4/Cargo.toml‎
Lines changed: 27 additions & 0 deletions
diff --git a/‎m4/README.md‎
Lines changed: 15 additions & 0 deletions b/‎m4/README.md‎
Lines changed: 15 additions & 0 deletions
diff --git a/‎m4/build.rs‎
Lines changed: 327 additions & 0 deletions b/‎m4/build.rs‎
Lines changed: 327 additions & 0 deletions
@@ -8,6 +8,8 @@ members = [
 	"display",
 	"file",
 	"fs",
+	"m4",
+	"m4/test-manager",
 	"gettext-rs",
 	"misc",
 	"pathnames",
@@ -24,7 +26,7 @@ members = [
 
 [workspace.dependencies]
 atty = "0.2"
-clap = { version = "4", default-features = false, features = ["std", "derive", "help", "usage"] }
+clap = { version = "4", default-features = false, features = ["std", "derive", "help", "usage", "error-context", "cargo"] }
 chrono = { version = "0.4", default-features = false, features = ["clock"] }
 libc = "0.2"
 regex = "1.10"
 
@@ -89,5 +89,5 @@ fn parse_error_test() {
 
 #[test]
 fn command_error_test() {
-    run_test_time(&["-s", "ls", "-l"], "", "unexpected argument found", 0);
+    run_test_time(&["-s", "ls", "-l"], "", "unexpected argument '-s' found", 0);
 }
@@ -0,0 +1,27 @@
+[package]
+name = "m4"
+version = "0.1.0"
+edition = "2021"
+
+# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html
+
+[dependencies]
+clap.workspace = true
+env_logger = "0.11"
+errno = "0.3"
+libc.workspace = true
+log = "0.4"
+nom = "7.1"
+once_cell = "1.19"
+thiserror = "1.0"
+
+[dev-dependencies]
+env_logger = "0.11"
+m4-test-manager = { path = "./test-manager" }
+regex-lite = "0.1"
+similar-asserts = "1.5"
+test-log = { version = "0.2", default-features=false, features=["log"]}
+
+[build-dependencies]
+m4-test-manager = { path = "./test-manager" }
+
@@ -0,0 +1,15 @@
+# `m4`
+
+Implementation of `m4` according to the specification <https://pubs.opengroup.org/onlinepubs/9699919799/utilities/m4.html>.
+
+
+## Other Implementations
+
+Other known implementations of `m4`:
+
+* [illumos m4](https://github.com/illumos/illumos-gate/blob/master/usr/src/cmd/sgs/m4/common/m4.c)
+* BSD
+  * [FreeBSD m4](https://github.com/freebsd/freebsd-src/tree/main/usr.bin/m4)
+  * [OpenBSD m4](https://github.com/openbsd/src/tree/master/usr.bin/m4)
+  * Portable BSD m4 - [here](https://github.com/ibara/m4) and [here](https://github.com/chimera-linux/bsdm4)
+* [GNU m4](https://www.gnu.org/software/m4/)
@@ -0,0 +1,327 @@
+use std::{
+    collections::BTreeMap,
+    fs::read_dir,
+    os::unix::ffi::OsStrExt,
+    path::{Path, PathBuf},
+};
+
+use m4_test_manager::TestSnapshot;
+
+/// A candidate for an integration test [`Test`]; it can be converted into one once both
+/// [`TestCandidate::input`] and [`TestCandidate::output`] are `Some`. Candidates are created while
+/// analyzing the available integration test files, so that the input and the output belonging to
+/// the same test can be paired up.
+#[derive(Default)]
+struct TestCandidate {
+    /// The name of the test.
+    name: String,
+    /// Input `.m4` or `.args` file. Will be `None` if it has not yet been found.
+    input: Option<PathBuf>,
+    /// Output `.out` file. Will be `None` if it has not yet been found.
+    output: Option<PathBuf>,
+    /// See [`TestSnapshot::ignore`].
+    ignore: bool,
+    /// See [`TestSnapshot::expect_error`].
+    expect_error: bool,
+    /// See [`TestSnapshot::stdout_regex`].
+    stdout_regex: Option<String>,
+}
+
+/// Promotes a fully paired [`TestCandidate`] into a [`Test`].
+///
+/// The conversion fails with a static message when the input or the output file is missing, or
+/// when either path cannot be represented as a `str`. The input is validated before the output.
+impl TryFrom<TestCandidate> for Test {
+    type Error = &'static str;
+
+    fn try_from(value: TestCandidate) -> Result<Self, Self::Error> {
+        let TestCandidate {
+            name,
+            input,
+            output,
+            ignore,
+            expect_error,
+            stdout_regex,
+        } = value;
+
+        // Input first, then output: the first problem encountered is the one reported.
+        let input_path = input.ok_or("No input provided")?;
+        let input = input_path
+            .to_str()
+            .ok_or("Error converting input path to string")?
+            .to_owned();
+
+        let output_path = output
+            .ok_or("No output file provided, please run m4-test-manager update-snapshots")?;
+        let output = output_path
+            .to_str()
+            .ok_or("Error converting output path to string")?
+            .to_owned();
+
+        Ok(Test {
+            name,
+            input,
+            output,
+            ignore,
+            expect_error,
+            stdout_regex,
+        })
+    }
+}
+
+/// A fully resolved integration test: both the input and the output file are known and their
+/// paths have been converted to strings. Rendered as Rust source by [`Test::as_code`].
+struct Test {
+    /// The name of the test.
+    name: String,
+    /// Path of the input `.m4` or `.args` file.
+    input: String,
+    /// Path of the output `.out` file.
+    output: String,
+    /// See [`TestSnapshot::ignore`].
+    ignore: bool,
+    /// See [`TestSnapshot::expect_error`].
+    expect_error: bool,
+    /// See [`TestSnapshot::stdout_regex`].
+    stdout_regex: Option<String>,
+}
+impl Test {
+    /// Renders this test as the Rust source of a single `#[test]` function named `test_{name}`.
+    ///
+    /// The generated function calls `init`, `run_command` and `read_test`, which must be in scope
+    /// wherever the returned code is placed. It compares the exit status, stdout and stderr of the
+    /// command against the snapshot read from [`Test::output`]:
+    ///
+    /// * the status must always equal the snapshot's status;
+    /// * stdout must equal the snapshot's stdout, or match [`Test::stdout_regex`] when one is set;
+    /// * stderr must equal the snapshot's stderr, unless [`Test::expect_error`] is set, in which
+    ///   case it only has to be non-empty whenever the snapshot's stderr is non-empty.
+    ///
+    /// When [`Test::ignore`] is set the function is additionally marked `#[ignore]`.
+    ///
+    /// The paths and the regex are embedded using `{:?}`, which emits an escaped Rust string
+    /// literal. Splicing the raw text between quotes would generate code that does not compile as
+    /// soon as the value contains a backslash (e.g. a `\d` in the regex) or a double quote.
+    fn as_code(&self) -> String {
+        let Self {
+            name,
+            input,
+            output,
+            ignore,
+            expect_error,
+            stdout_regex,
+        } = self;
+        let mut s = String::new();
+
+        if *ignore {
+            s.push_str("#[ignore]");
+        }
+
+        s.push_str(&format!(
+            r##"#[test]
+fn test_{name}() {{
+    init();
+    let output = run_command(&Path::new({input:?}));
+
+    let test: TestSnapshot = read_test({output:?});
+    assert_eq!(output.status, std::process::ExitStatus::from_raw(test.status), "status (\x1b[31mcurrent\x1b[0m|\x1b[32mexpected\x1b[0m)");
+    
+"##
+        ));
+
+        if let Some(stdout_regex) = stdout_regex {
+            // Both occurrences are escaped literals: one compiles the regex, the other is only
+            // used to show the pattern in the failure message.
+            s.push_str(&format!(
+                r##"
+    let r = regex_lite::Regex::new({stdout_regex:?}).unwrap();
+    assert!(r.is_match(&String::from_utf8(output.stdout).unwrap()), "stdout doesn't match regex: r\"{{}}\"", {stdout_regex:?});
+            "##
+            ));
+        } else {
+            s.push_str(r##"
+    assert_eq!(String::from_utf8(output.stdout).unwrap(), test.stdout, "stdout (\x1b[31mcurrent\x1b[0m|\x1b[32mexpected\x1b[0m)");
+            "##);
+        }
+
+        if *expect_error {
+            // The exact error text is not compared, only whether something was reported.
+            s.push_str(
+                r##"
+    if !test.stderr.is_empty() {
+        assert!(!output.stderr.is_empty());
+    }"##,
+            );
+        } else {
+            s.push_str(r##"
+    assert_eq!(String::from_utf8(output.stderr).unwrap(), test.stderr, "stderr (\x1b[31mcurrent\x1b[0m|\x1b[32mexpected\x1b[0m)");"##);
+        }
+
+        s.push('}');
+
+        s
+    }
+}
+
+/// Returns the part of `path`'s file name that precedes the first `.`.
+///
+/// Yields `None` when the path has no file name or the file name cannot be represented as a
+/// `str`.
+fn name_from_path(path: &Path) -> Option<String> {
+    path.file_name()
+        .and_then(|file_name| file_name.to_str())
+        .and_then(|file_name| file_name.split('.').next())
+        .map(str::to_owned)
+}
+
+/// Build script entry point: generates `tests/integration_test.rs` from the fixture files in
+/// `fixtures/integration_tests`.
+///
+/// Every `.m4`/`.args` file is treated as a test input and every `.out` file as the matching
+/// snapshot; the two are paired by the file name up to its first `.`. One `#[test]` function is
+/// emitted per pair (see [`Test::as_code`]) after a fixed preamble with the shared helpers, and
+/// the resulting file is formatted with `cargo fmt`.
+///
+/// # Panics
+///
+/// Panics when the fixtures directory or one of its entries cannot be read, when a fixture name
+/// cannot be derived, when a candidate is missing its input or output file, when the generated
+/// file cannot be written, or when `cargo fmt` cannot be run or exits unsuccessfully.
+fn main() {
+    println!("cargo::rerun-if-changed=fixtures/");
+    // Keyed by test name; a `BTreeMap` so the tests are generated in sorted name order.
+    let mut test_candidates: BTreeMap<String, TestCandidate> = BTreeMap::new();
+    let fixtures_directory = Path::new("fixtures/integration_tests");
+    for entry in read_dir(fixtures_directory).unwrap() {
+        let entry = entry.unwrap();
+        let path = entry.path();
+
+        match path.extension().map(|e| e.as_bytes()) {
+            Some(b"m4") | Some(b"args") => {
+                let name = name_from_path(&path).unwrap();
+                let snapshot_file_name = format!("{name}.out");
+                let snapshot_file = fixtures_directory.join(snapshot_file_name);
+                // The per-test flags live in the snapshot; without a snapshot fall back to the
+                // defaults (the missing output is reported later, when the candidate is converted).
+                let (ignore, expect_error, stdout_regex) = if snapshot_file.exists() {
+                    let mut f = std::fs::OpenOptions::new()
+                        .read(true)
+                        .open(&snapshot_file)
+                        .unwrap();
+                    let snapshot = TestSnapshot::deserialize(&mut f);
+                    (
+                        snapshot.ignore,
+                        snapshot.expect_error,
+                        snapshot.stdout_regex,
+                    )
+                } else {
+                    (false, false, None)
+                };
+                let candidate = test_candidates
+                    .entry(name.clone())
+                    .or_insert(TestCandidate {
+                        name,
+                        ignore,
+                        expect_error,
+                        stdout_regex: stdout_regex.clone(),
+                        ..TestCandidate::default()
+                    });
+                // Assigned unconditionally so that a candidate already inserted by the `.out`
+                // branch (directory order is not controlled here) receives the same values.
+                candidate.input = Some(path);
+                candidate.ignore = ignore;
+                candidate.expect_error = expect_error;
+                candidate.stdout_regex = stdout_regex;
+            }
+            Some(b"out") => {
+                let name = name_from_path(&path).unwrap();
+                let candidate = test_candidates
+                    .entry(name.clone())
+                    .or_insert(TestCandidate {
+                        name,
+                        ..TestCandidate::default()
+                    });
+                candidate.output = Some(path);
+            }
+            _ => eprintln!("Ignoring file {path:?}"),
+        }
+    }
+    // Fixed preamble of the generated file: imports plus the `init`, `read_test` and
+    // `run_command` helpers that every generated test calls.
+    let mut integration_test: String =
+        r#"//! NOTE: This file has been auto generated using build.rs, don't edit by hand!
+//! You can regenerate the tests (which are based on the fixtures in `fixtures/integration_tests/`)
+//! using the following command:
+//! `cargo run -p m4-test-manager update-snapshots`
+use similar_asserts::assert_eq;
+use std::process::ExitStatus;
+use std::os::unix::ffi::OsStrExt;
+use std::os::unix::process::ExitStatusExt;
+use std::fs::read_to_string;
+use std::path::Path;
+use m4::error::GetExitCode;
+use m4_test_manager::TestSnapshot;
+
+fn init() {
+    let _ = env_logger::builder()
+        .is_test(true)
+        // No timestamp to make it easier to diff output
+        .format_timestamp(None)
+        .try_init();
+}
+
+fn read_test(path: impl AsRef<std::path::Path>) -> TestSnapshot {
+    let mut f = std::fs::File::open(path).unwrap();
+    let snapshot = TestSnapshot::deserialize(&mut f);
+    log::info!(
+        "Expecting stdout:\n\x1b[34m{}\x1b[0m",
+        snapshot.stdout,
+    );
+    log::info!(
+        "Expecting stderr:\n\x1b[34m{}\x1b[0m",
+        snapshot.stderr,
+    );
+    log::info!(
+        "Expecting status:\n\x1b[34m{}\x1b[0m",
+        snapshot.status,
+    );
+    snapshot
+}
+
+fn run_command(input: &Path) -> std::process::Output {
+    let input_string = read_to_string(input).unwrap();
+    log::info!(
+        "Running command with input {input:?}:\n\x1b[34m{}\x1b[0m",
+        input_string,
+    );
+    #[derive(Default, Clone)]
+    struct StdoutRef(std::rc::Rc<std::cell::RefCell<Vec<u8>>>);
+    impl std::io::Write for StdoutRef {
+        fn write(&mut self, buf: &[u8]) -> std::io::Result<usize> {
+            self.0.borrow_mut().write(buf)
+        }
+
+        fn flush(&mut self) -> std::io::Result<()> {
+            self.0.borrow_mut().flush()
+        }
+    }
+    impl StdoutRef {
+        fn into_inner(self) -> Vec<u8> {
+            std::rc::Rc::into_inner(self.0).unwrap().into_inner()
+        }
+    }
+    let (stdout, stderr, status) = match input
+        .extension()
+        .expect("Input file should have extension")
+        .as_bytes()
+    {
+        b"m4" => {
+            // The reason why we run the command using this as a library is so we can run with it built in
+            // test configuration, with all the associated conditionally compiled test log instrumentation.
+
+            let stdout = StdoutRef::default();
+            let mut stderr: Vec<u8> = Vec::new();
+            let args = m4::Args {
+                files: vec![input.into()],
+                ..m4::Args::default()
+            };
+            let result = m4::run(stdout.clone(), &mut stderr, args);
+            let status = ExitStatus::from_raw(result.get_exit_code() as i32);
+            (stdout.into_inner(), stderr, status)
+        }
+        b"args" => {
+            let args = input_string;
+            let _cargo_build_output = std::process::Command::new("cargo")
+                .arg("build")
+                .output()
+                .unwrap();
+
+            log::info!("RUST_LOG is ignored for this test because it interferes with output");
+            let output = std::process::Command::new("sh")
+                .env("RUST_LOG", "") // Disable rust log output because it interferes with the test.
+                .arg("-c")
+                .arg(format!("../target/debug/m4 {args}"))
+                .output()
+                .unwrap();
+
+            (output.stdout, output.stderr, output.status)
+        }
+        _ => panic!("Unsupported input extension {input:?}"),
+    };
+
+    log::info!("Received status: {status}");
+    log::info!(
+        "Received stdout:\n\x1b[34m{}\x1b[0m",
+        String::from_utf8_lossy(&stdout)
+    );
+    log::info!(
+        "Received stderr:\n\x1b[34m{}\x1b[0m",
+        String::from_utf8_lossy(&stderr)
+    );
+    std::process::Output {
+        stdout,
+        stderr,
+        status,
+    }
+}
+"#
+        .to_owned();
+    // Append one generated test per candidate; an unpaired input or output aborts the build.
+    for (name, candidate) in test_candidates {
+        let test: Test = candidate.try_into().unwrap_or_else(|error| {
+            panic!("Error creating test from candidate for {name}: {error}")
+        });
+
+        integration_test.push('\n');
+        integration_test.push_str(&test.as_code());
+        integration_test.push('\n');
+    }
+
+    std::fs::write("tests/integration_test.rs", integration_test).unwrap();
+    // Format only the generated file.
+    let output = std::process::Command::new("cargo")
+        .arg("fmt")
+        .arg("--")
+        .arg("tests/integration_test.rs")
+        .output()
+        .unwrap();
+    if !output.status.success() {
+        panic!(
+            "Error executing cargo fmt: {}",
+            String::from_utf8_lossy(&output.stderr)
+        );
+    }
+}
Original file line number	Diff line number	Diff line change
`@@ -89,5 +89,5 @@ fn parse_error_test() {`
`89`	`89`
`90`	`90`	`#[test]`
`91`	`91`	`fn command_error_test() {`
`92`		`- run_test_time(&["-s", "ls", "-l"], "", "unexpected argument found", 0);`
	`92`	`+ run_test_time(&["-s", "ls", "-l"], "", "unexpected argument '-s' found", 0);`
`93`	`93`	`}`