diff --git a/awk/Cargo.toml b/awk/Cargo.toml
index 3b1bb2ebb..0f47cc06f 100644
--- a/awk/Cargo.toml
+++ b/awk/Cargo.toml
@@ -13,6 +13,7 @@ libc.workspace = true
 pest = "2.7"
 pest_derive = "2.7"
 lexical = { version = "6.1", features = ["format"] }
+plib = { path = "../plib" }
 rand = { version = "0.8", default-features = false, features = ["small_rng"] }
 
 [dev-dependencies]
diff --git a/awk/regex.rs b/awk/regex.rs
index ada1074f0..612c171c7 100644
--- a/awk/regex.rs
+++ b/awk/regex.rs
@@ -7,36 +7,14 @@
 // SPDX-License-Identifier: MIT
 //
 
+use plib::regex::{Match, Regex as PlibRegex, RegexFlags};
 use std::ffi::CString;
-use std::ptr;
-
-fn regex_compilation_result(
-    status_integer: libc::c_int,
-    regex: &libc::regex_t,
-) -> Result<(), String> {
-    if status_integer != 0 {
-        let mut error_buffer = vec![b'\0'; 128];
-        unsafe {
-            libc::regerror(
-                status_integer,
-                ptr::from_ref(regex),
-                error_buffer.as_mut_ptr() as *mut libc::c_char,
-                128,
-            )
-        };
-        let error = CString::from_vec_with_nul(error_buffer)
-            .expect("error message returned from `libc::regerror` is an invalid CString");
-        Err(error
-            .into_string()
-            .expect("error message from `libc::regerror' contains invalid utf-8"))
-    } else {
-        Ok(())
-    }
-}
 
+/// A regex wrapper that provides CString-compatible API for AWK.
+/// Internally uses plib::regex for POSIX ERE support.
 pub struct Regex {
-    raw_regex: libc::regex_t,
-    regex_string: CString,
+    inner: PlibRegex,
+    pattern_string: String,
 }
 
 #[cfg_attr(test, derive(Debug))]
@@ -46,8 +24,20 @@ pub struct RegexMatch {
     pub end: usize,
 }
 
+impl From<Match> for RegexMatch {
+    fn from(m: Match) -> Self {
+        RegexMatch {
+            start: m.start,
+            end: m.end,
+        }
+    }
+}
+
+/// Iterator over regex matches in a string.
+/// Owns the input CString to preserve lifetimes.
 pub struct MatchIter<'re> {
-    string: CString,
+    // Store the string as owned String to avoid lifetime issues
+    string: String,
     next_start: usize,
     regex: &'re Regex,
 }
@@ -55,86 +45,74 @@ pub struct MatchIter<'re> {
 impl Iterator for MatchIter<'_> {
     type Item = RegexMatch;
     fn next(&mut self) -> Option<Self::Item> {
-        if self.next_start >= self.string.as_bytes().len() {
-            return None;
-        }
-        let mut match_range = libc::regmatch_t {
-            rm_so: -1,
-            rm_eo: -1,
-        };
-        let exec_status = unsafe {
-            libc::regexec(
-                ptr::from_ref(&self.regex.raw_regex),
-                self.string.as_ptr().add(self.next_start),
-                1,
-                ptr::from_mut(&mut match_range),
-                0,
-            )
-        };
-        if exec_status == libc::REG_NOMATCH {
+        if self.next_start >= self.string.len() {
             return None;
         }
+
+        // Find match starting from current offset
+        let substring = &self.string[self.next_start..];
+        let m = self.regex.inner.find(substring)?;
+
         let result = RegexMatch {
-            start: self.next_start + match_range.rm_so as usize,
-            end: self.next_start + match_range.rm_eo as usize,
+            start: self.next_start + m.start,
+            end: self.next_start + m.end,
         };
-        self.next_start += match_range.rm_eo as usize;
+
+        // Move past this match for next iteration
+        // Ensure we make progress even on zero-width matches
+        self.next_start = if m.end > 0 {
+            self.next_start + m.end
+        } else {
+            self.next_start + 1
+        };
+
         Some(result)
     }
 }
 
 impl Regex {
     pub fn new(regex: CString) -> Result<Self, String> {
-        let mut raw = unsafe { std::mem::zeroed::<libc::regex_t>() };
-        let compilation_status =
-            unsafe { libc::regcomp(ptr::from_mut(&mut raw), regex.as_ptr(), libc::REG_EXTENDED) };
-        regex_compilation_result(compilation_status, &raw)?;
+        let pattern = regex.to_str().map_err(|e| e.to_string())?;
+        let inner = PlibRegex::new(pattern, RegexFlags::ere()).map_err(|e| e.to_string())?;
         Ok(Self {
-            raw_regex: raw,
-            regex_string: regex,
+            inner,
+            pattern_string: pattern.to_string(),
         })
     }
 
+    /// Returns an iterator over all match locations in the string.
+    /// Takes ownership of the CString.
     pub fn match_locations(&self, string: CString) -> MatchIter {
+        let s = string.into_string().unwrap_or_default();
         MatchIter {
             next_start: 0,
             regex: self,
-            string,
+            string: s,
         }
     }
 
     pub fn matches(&self, string: &CString) -> bool {
-        let exec_status = unsafe {
-            libc::regexec(
-                ptr::from_ref(&self.raw_regex),
-                string.as_ptr(),
-                0,
-                ptr::null_mut(),
-                0,
-            )
-        };
-        exec_status != libc::REG_NOMATCH
+        let s = string.to_str().unwrap_or("");
+        self.inner.is_match(s)
     }
 }
 
 impl Drop for Regex {
     fn drop(&mut self) {
-        unsafe {
-            libc::regfree(ptr::from_mut(&mut self.raw_regex));
-        }
+        // plib::regex handles cleanup internally
     }
 }
 
 #[cfg(test)]
 impl core::fmt::Debug for Regex {
     fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
-        writeln!(f, "/{}/", self.regex_string.to_str().unwrap())
+        writeln!(f, "/{}/", self.pattern_string)
     }
 }
 
 impl PartialEq for Regex {
     fn eq(&self, other: &Self) -> bool {
-        self.regex_string == other.regex_string
+        self.pattern_string == other.pattern_string
     }
 }
 
diff --git a/display/Cargo.toml b/display/Cargo.toml
index a5acb137d..9d75cd8da 100644
--- a/display/Cargo.toml
+++ b/display/Cargo.toml
@@ -12,6 +12,7 @@ clap.workspace = true
 clap.features = ["env"]
 gettext-rs.workspace = true
 libc.workspace = true
+plib = { path = "../plib" }
 termion = "4.0"
 thiserror = "1.0"
 
diff --git a/display/more.rs b/display/more.rs
index ff6b606ac..da3239b71 100644
--- a/display/more.rs
+++ b/display/more.rs
@@ -9,18 +9,15 @@
 
 use clap::Parser;
 use gettextrs::{bind_textdomain_codeset, gettext, setlocale, textdomain, LocaleCategory};
-use libc::{
-    getegid, getgid, getuid, regcomp, regex_t, regexec, setgid, setuid, REG_ICASE, REG_NOMATCH,
-};
+use libc::{getegid, getgid, getuid, setgid, setuid};
+use plib::regex::{Regex, RegexFlags};
 use std::collections::HashMap;
-use std::ffi::CString;
 use std::fs::File;
 use std::io::{stdout, BufRead, BufReader, Cursor, Read, Seek, SeekFrom, Write};
 use std::ops::{Not, Range};
 use std::os::fd::AsRawFd;
 use std::path::PathBuf;
 use std::process::{exit, ExitStatus};
-use std::ptr;
 use std::str::FromStr;
 use std::sync::mpsc::{channel, Receiver, TryRecvError};
 use std::sync::Mutex;
@@ -942,8 +939,8 @@ struct SourceContext {
     /// Current search pattern
     current_pattern: String,
     /// Last search settings
-    last_search: Option<(regex_t, bool, Direction)>,
-    /// Storage for marks that were set durring current [`Source`] processing
+    last_search: Option<(Regex, bool, Direction)>,
+    /// Storage for marks that were set during current [`Source`] processing
     marked_positions: HashMap<char, usize>,
     /// Flag that [`true`] if input files count is more that 1
     is_many_files: bool,
@@ -1206,7 +1203,7 @@ impl SourceContext {
     pub fn search(
         &mut self,
         count: Option<usize>,
-        pattern: regex_t,
+        pattern: Regex,
         is_not: bool,
         direction: Direction,
     ) -> Result<(), MoreError> {
@@ -1222,21 +1219,10 @@ impl SourceContext {
                     Direction::Backward => haystack + &last_string,
                 };
             }
-            let c_input = CString::new(haystack)
-                .map_err(|_| MoreError::StringParse(self.current_source.name()))?;
-            let has_match = unsafe {
-                regexec(
-                    &pattern as *const regex_t,
-                    c_input.as_ptr(),
-                    0,
-                    ptr::null_mut(),
-                    0,
-                )
-            };
             let has_match = if is_not {
-                has_match == REG_NOMATCH
+                !pattern.is_match(&haystack)
             } else {
-                has_match != REG_NOMATCH
+                pattern.is_match(&haystack)
             };
             if has_match {
                 let Some((rows, _)) = self.terminal_size else {
@@ -1291,7 +1277,7 @@ impl SourceContext {
             } else {
                 direction.clone()
             };
-            self.search(count, *pattern, *is_not, direction)
+            self.search(count, pattern.clone(), *is_not, direction)
         } else {
             Err(MoreError::SourceContext(
                 SourceContextError::MissingLastSearch,
@@ -1647,39 +1633,19 @@ impl Prompt {
     }
 }
 
-/// Compiles [`pattern`] as [`regex_t`]
-fn compile_regex(pattern: String, ignore_case: bool) -> Result<regex_t, MoreError> {
-    #[cfg(target_os = "macos")]
-    let mut pattern = pattern.replace("\\\\", "\\");
-    #[cfg(all(unix, not(target_os = "macos")))]
+/// Compiles [`pattern`] as a POSIX BRE regex
+fn compile_regex(pattern: String, ignore_case: bool) -> Result<Regex, MoreError> {
+    // Normalize backslash escapes
     let pattern = pattern.replace("\\\\", "\\");
-    let mut cflags = 0;
-    if ignore_case {
-        cflags |= REG_ICASE;
-    }
 
-    // macOS version of [regcomp](regcomp) from `libc` provides additional check
-    // for empty regex. In this case, an error
-    // [REG_EMPTY](https://developer.apple.com/library/archive/documentation/System/Conceptual/ManPages_iPhoneOS/man3/regcomp.3.html)
-    // will be returned. Therefore, an empty pattern is replaced with ".*".
-    #[cfg(target_os = "macos")]
-    {
-        pattern = if pattern == "" {
-            String::from(".*")
-        } else {
-            pattern
-        };
-    }
-
-    let c_pattern =
-        CString::new(pattern.clone()).map_err(|_| MoreError::StringParse(pattern.clone()))?;
-    let mut regex = unsafe { std::mem::zeroed::<regex_t>() };
-
-    if unsafe { regcomp(&mut regex, c_pattern.as_ptr(), cflags) } == 0 {
-        Ok(regex)
+    let flags = if ignore_case {
+        RegexFlags::bre().ignore_case()
     } else {
-        Err(MoreError::StringParse(pattern))
-    }
+        RegexFlags::bre()
+    };
+
+    // plib::regex handles macOS empty pattern workaround internally
+    Regex::new(&pattern, flags).map_err(|_| MoreError::StringParse(pattern))
 }
 
 /// More state
diff --git a/pax/subst.rs b/pax/subst.rs
index 92773db55..32b874bd4 100644
--- a/pax/subst.rs
+++ b/pax/subst.rs
@@ -19,19 +19,16 @@
 //! - `g` flag: global replacement (all occurrences)
 //! - `p` flag: print successful substitutions to stderr
 //!
-//! This implementation uses POSIX regcomp/regexec for BRE support.
+//! This implementation uses plib::regex for POSIX BRE support.
 
 use crate::error::{PaxError, PaxResult};
-use std::ffi::{CStr, CString};
-
-/// Maximum number of subexpression matches (POSIX requires at least 9)
-const MAX_MATCHES: usize = 10;
+use plib::regex::{Match, Regex, RegexFlags, MAX_CAPTURES};
 
 /// A compiled substitution expression from -s option
 #[derive(Debug)]
 pub struct Substitution {
     /// Compiled POSIX regex
-    regex: PosixRegex,
+    regex: Regex,
     /// Replacement template string (with & and \n references)
     replacement: String,
     /// Replace all occurrences (g flag)
@@ -53,8 +50,6 @@ pub enum SubstResult {
 
 impl Clone for Substitution {
     fn clone(&self) -> Self {
-        // Re-parse the pattern to create a new compiled regex
-        // This is safe because we already validated it
         Substitution {
             regex: self.regex.clone(),
             replacement: self.replacement.clone(),
@@ -112,7 +107,8 @@ impl Substitution {
         }
 
         // Compile the POSIX BRE regex
-        let regex = PosixRegex::compile(&old_pattern)?;
+        let regex = Regex::new(&old_pattern, RegexFlags::bre())
+            .map_err(|e| PaxError::PatternError(e.to_string()))?;
 
         Ok(Substitution {
             regex,
@@ -130,8 +126,7 @@ impl Substitution {
 
         loop {
             // Try to match at or after current position
-            let search_str = &result[pos..];
-            let matches = match self.regex.exec(search_str) {
+            let matches = match self.regex.captures_at(&result, pos) {
                 Some(m) => m,
                 None => break,
             };
@@ -139,11 +134,11 @@ impl Substitution {
             any_match = true;
 
             // Build the replacement string
-            let replacement = build_replacement(&self.replacement, search_str, &matches);
+            let replacement = build_replacement(&self.replacement, &result, &matches);
 
             // Get the absolute positions in result
-            let match_start = pos + matches[0].0;
-            let match_end = pos + matches[0].1;
+            let match_start = matches[0].start;
+            let match_end = matches[0].end;
 
             // Replace the matched portion
             let new_result = format!(
@@ -192,27 +187,26 @@ impl Substitution {
 }
 
 /// Build the replacement string from template and match groups
-fn build_replacement(
-    template: &str,
-    input: &str,
-    matches: &[(usize, usize); MAX_MATCHES],
-) -> String {
+fn build_replacement(template: &str, input: &str, matches: &[Match]) -> String {
     let mut result = String::new();
     let mut chars = template.chars().peekable();
 
     while let Some(c) = chars.next() {
         if c == '&' {
             // & is replaced by entire match
-            if matches[0].1 > matches[0].0 {
-                result.push_str(&input[matches[0].0..matches[0].1]);
+            if !matches.is_empty() && matches[0].end > matches[0].start {
+                result.push_str(&input[matches[0].start..matches[0].end]);
             }
         } else if c == '\\' {
             if let Some(&next) = chars.peek() {
                 if next.is_ascii_digit() && next != '0' {
                     // \1 through \9 - backreference
                     let idx = (next as usize) - ('0' as usize);
-                    if idx < MAX_MATCHES && matches[idx].1 > matches[idx].0 {
-                        result.push_str(&input[matches[idx].0..matches[idx].1]);
+                    if idx < matches.len()
+                        && idx < MAX_CAPTURES
+                        && matches[idx].end > matches[idx].start
+                    {
+                        result.push_str(&input[matches[idx].start..matches[idx].end]);
                     }
                     chars.next();
                 } else if next == '\\' {
@@ -292,142 +286,6 @@ pub fn apply_substitutions(substitutions: &[Substitution], path: &str) -> SubstR
     SubstResult::Unchanged
 }
 
-/// Wrapper around POSIX regex functions
-#[derive(Debug)]
-struct PosixRegex {
-    /// The original pattern string (for cloning)
-    pattern: String,
-    /// Compiled regex_t
-    #[cfg(unix)]
-    compiled: *mut libc::regex_t,
-    #[cfg(not(unix))]
-    compiled: (),
-}
-
-impl Clone for PosixRegex {
-    fn clone(&self) -> Self {
-        // Re-compile the pattern
-        PosixRegex::compile(&self.pattern).expect("failed to clone already-valid regex")
-    }
-}
-
-impl PosixRegex {
-    /// Compile a POSIX Basic Regular Expression
-    #[cfg(unix)]
-    fn compile(pattern: &str) -> PaxResult<Self> {
-        let c_pattern = CString::new(pattern)
-            .map_err(|_| PaxError::PatternError("pattern contains null byte".to_string()))?;
-
-        unsafe {
-            let regex_ptr =
-                libc::malloc(std::mem::size_of::<libc::regex_t>()) as *mut libc::regex_t;
-            if regex_ptr.is_null() {
-                return Err(PaxError::PatternError(
-                    "failed to allocate regex".to_string(),
-                ));
-            }
-
-            // REG_NEWLINE is not used - we want . to NOT match newline by default
-            let flags = 0; // BRE with no special flags
-
-            let result = libc::regcomp(regex_ptr, c_pattern.as_ptr(), flags);
-            if result != 0 {
-                // Get error message
-                let mut errbuf = [0u8; 256];
-                libc::regerror(
-                    result,
-                    regex_ptr,
-                    errbuf.as_mut_ptr() as *mut libc::c_char,
-                    errbuf.len(),
-                );
-                libc::regfree(regex_ptr);
-                libc::free(regex_ptr as *mut libc::c_void);
-
-                let err_msg = CStr::from_ptr(errbuf.as_ptr() as *const libc::c_char)
-                    .to_string_lossy()
-                    .to_string();
-                return Err(PaxError::PatternError(format!(
-                    "invalid regex '{}': {}",
-                    pattern, err_msg
-                )));
-            }
-
-            Ok(PosixRegex {
-                pattern: pattern.to_string(),
-                compiled: regex_ptr,
-            })
-        }
-    }
-
-    #[cfg(not(unix))]
-    fn compile(pattern: &str) -> PaxResult<Self> {
-        // Fallback for non-Unix - just store the pattern
-        // This won't actually work for matching
-        Ok(PosixRegex {
-            pattern: pattern.to_string(),
-            compiled: (),
-        })
-    }
-
-    /// Execute the regex against a string
-    /// Returns array of (start, end) for each match group, or None if no match
-    #[cfg(unix)]
-    fn exec(&self, input: &str) -> Option<[(usize, usize); MAX_MATCHES]> {
-        let c_input = match CString::new(input) {
-            Ok(s) => s,
-            Err(_) => return None,
-        };
-
-        unsafe {
-            let mut matches: [libc::regmatch_t; MAX_MATCHES] = std::mem::zeroed();
-
-            let result = libc::regexec(
-                self.compiled,
-                c_input.as_ptr(),
-                MAX_MATCHES,
-                matches.as_mut_ptr(),
-                0,
-            );
-
-            if result != 0 {
-                return None;
-            }
-
-            // Convert regmatch_t to (usize, usize) pairs
-            let mut result_matches = [(0usize, 0usize); MAX_MATCHES];
-            for (i, m) in matches.iter().enumerate() {
-                if m.rm_so >= 0 && m.rm_eo >= 0 {
-                    result_matches[i] = (m.rm_so as usize, m.rm_eo as usize);
-                }
-            }
-
-            Some(result_matches)
-        }
-    }
-
-    #[cfg(not(unix))]
-    fn exec(&self, _input: &str) -> Option<[(usize, usize); MAX_MATCHES]> {
-        // Fallback for non-Unix - no matching capability
-        None
-    }
-}
-
-#[cfg(unix)]
-impl Drop for PosixRegex {
-    fn drop(&mut self) {
-        unsafe {
-            if !self.compiled.is_null() {
-                libc::regfree(self.compiled);
-                libc::free(self.compiled as *mut libc::c_void);
-            }
-        }
-    }
-}
-
-// SAFETY: The compiled regex is not shared between threads
-unsafe impl Send for PosixRegex {}
-unsafe impl Sync for PosixRegex {}
-
 #[cfg(test)]
 mod tests {
     use super::*;
@@ -479,7 +337,7 @@ mod tests {
         // But our parser handles delimiter escaping in the -s expression itself
         let s = Substitution::parse("/foo\\/bar/baz/").unwrap();
         // The pattern should be "foo/bar" (with literal /)
-        assert_eq!(s.regex.pattern, "foo/bar");
+        assert_eq!(s.regex.as_str(), "foo/bar");
     }
 
     #[test]
diff --git a/plib/src/lib.rs b/plib/src/lib.rs
index de06edd6c..12929a31a 100644
--- a/plib/src/lib.rs
+++ b/plib/src/lib.rs
@@ -14,6 +14,7 @@ pub mod lzw;
 pub mod modestr;
 pub mod platform;
 pub mod priority;
+pub mod regex;
 pub mod sccsfile;
 pub mod testing;
 pub mod utmpx;
diff --git a/plib/src/regex.rs b/plib/src/regex.rs
new file mode 100644
index 000000000..aaa138f3f
--- /dev/null
+++ b/plib/src/regex.rs
@@ -0,0 +1,628 @@
+//
+// Copyright (c) 2024 Jeff Garzik
+//
+// This file is part of the posixutils-rs project covered under
+// the MIT License.  For the full license text, please see the LICENSE
+// file in the root directory of this project.
+// SPDX-License-Identifier: MIT
+//
+
+//! POSIX Regular Expression support using libc regcomp/regexec.
+//!
+//! This module provides a safe Rust wrapper around POSIX regex functions,
+//! supporting both Basic Regular Expressions (BRE) and Extended Regular
+//! Expressions (ERE).
+//!
+//! # Example
+//!
+//! ```ignore
+//! use plib::regex::{Regex, RegexFlags};
+//!
+//! // Simple BRE matching
+//! let re = Regex::new("hello", RegexFlags::default())?;
+//! assert!(re.is_match("hello world"));
+//!
+//! // ERE with case-insensitive matching
+//! let re = Regex::new("hello+", RegexFlags::ere().ignore_case())?;
+//! assert!(re.is_match("HELLOOO"));
+//! ```
+
+use libc::{regcomp, regex_t, regexec, regfree, regmatch_t, REG_EXTENDED, REG_ICASE, REG_NOMATCH};
+use std::ffi::CString;
+use std::io::{Error, ErrorKind};
+use std::ptr;
+
+/// Maximum number of capture groups supported
+pub const MAX_CAPTURES: usize = 10;
+
+/// Flags controlling regex compilation behavior.
+#[derive(Debug, Clone, Copy, Default)]
+pub struct RegexFlags {
+    /// Use Extended Regular Expressions (ERE) instead of Basic (BRE)
+    pub extended: bool,
+    /// Perform case-insensitive matching
+    pub ignore_case: bool,
+}
+
+impl RegexFlags {
+    /// Create flags for Basic Regular Expression (BRE) mode.
+    /// This is the default.
+    pub fn bre() -> Self {
+        Self::default()
+    }
+
+    /// Create flags for Extended Regular Expression (ERE) mode.
+    pub fn ere() -> Self {
+        Self {
+            extended: true,
+            ignore_case: false,
+        }
+    }
+
+    /// Enable case-insensitive matching.
+    pub fn ignore_case(mut self) -> Self {
+        self.ignore_case = true;
+        self
+    }
+
+    /// Convert to libc cflags
+    fn to_cflags(self) -> libc::c_int {
+        let mut cflags = 0;
+        if self.extended {
+            cflags |= REG_EXTENDED;
+        }
+        if self.ignore_case {
+            cflags |= REG_ICASE;
+        }
+        cflags
+    }
+}
+
+/// A match location within the input string.
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Default)]
+pub struct Match {
+    /// Start byte offset of the match
+    pub start: usize,
+    /// End byte offset of the match (exclusive)
+    pub end: usize,
+}
+
+impl Match {
+    /// Returns true if this is an empty/invalid match.
+    pub fn is_empty(&self) -> bool {
+        self.start == self.end
+    }
+
+    /// Extract the matched substring from the original input.
+    pub fn as_str<'a>(&self, input: &'a str) -> &'a str {
+        &input[self.start..self.end]
+    }
+}
+
+/// A compiled POSIX regular expression.
+pub struct Regex {
+    raw: regex_t,
+    /// Original pattern string, kept for Clone and Debug
+    pattern: String,
+    /// Flags used for compilation, kept for Clone
+    flags: RegexFlags,
+}
+
+// SAFETY: regex_t is thread-safe for matching (regexec is reentrant)
+unsafe impl Send for Regex {}
+unsafe impl Sync for Regex {}
+
+impl Regex {
+    /// Compile a new regular expression with the given flags.
+    ///
+    /// # Arguments
+    ///
+    /// * `pattern` - The regex pattern string
+    /// * `flags` - Compilation flags (BRE vs ERE, case sensitivity)
+    ///
+    /// # Errors
+    ///
+    /// Returns an error if the pattern is invalid.
+    pub fn new(pattern: &str, flags: RegexFlags) -> std::io::Result<Self> {
+        // Handle macOS quirk: empty pattern causes REG_EMPTY error
+        #[cfg(target_os = "macos")]
+        let pattern = if pattern.is_empty() { ".*" } else { pattern };
+
+        let c_pattern =
+            CString::new(pattern).map_err(|e| Error::new(ErrorKind::InvalidInput, e))?;
+
+        let mut raw = unsafe { std::mem::zeroed::<regex_t>() };
+        let cflags = flags.to_cflags();
+
+        let result = unsafe { regcomp(&mut raw, c_pattern.as_ptr(), cflags) };
+
+        if result != 0 {
+            // Get the error message using regerror
+            let err_msg = Self::get_error_message(result, &raw);
+            unsafe { regfree(&mut raw) };
+            return Err(Error::new(
+                ErrorKind::InvalidInput,
+                format!("invalid regex '{}': {}", pattern, err_msg),
+            ));
+        }
+
+        Ok(Regex {
+            raw,
+            pattern: pattern.to_string(),
+            flags,
+        })
+    }
+
+    /// Compile a Basic Regular Expression (BRE).
+    ///
+    /// Convenience method equivalent to `Regex::new(pattern, RegexFlags::bre())`.
+    pub fn bre(pattern: &str) -> std::io::Result<Self> {
+        Self::new(pattern, RegexFlags::bre())
+    }
+
+    /// Compile an Extended Regular Expression (ERE).
+    ///
+    /// Convenience method equivalent to `Regex::new(pattern, RegexFlags::ere())`.
+    pub fn ere(pattern: &str) -> std::io::Result<Self> {
+        Self::new(pattern, RegexFlags::ere())
+    }
+
+    /// Get error message from regcomp failure using regerror.
+    fn get_error_message(errcode: libc::c_int, regex: &regex_t) -> String {
+        let mut errbuf = [0u8; 256];
+        unsafe {
+            libc::regerror(
+                errcode,
+                regex as *const regex_t,
+                errbuf.as_mut_ptr() as *mut libc::c_char,
+                errbuf.len(),
+            );
+        }
+
+        // Find null terminator and convert to string
+        let len = errbuf.iter().position(|&b| b == 0).unwrap_or(errbuf.len());
+        String::from_utf8_lossy(&errbuf[..len]).to_string()
+    }
+
+    /// Returns true if the pattern matches anywhere in the input string.
+    ///
+    /// # Arguments
+    ///
+    /// * `text` - The string to search
+    ///
+    /// # Returns
+    ///
+    /// `true` if the pattern matches, `false` otherwise.
+    pub fn is_match(&self, text: &str) -> bool {
+        let Ok(c_text) = CString::new(text) else {
+            return false;
+        };
+
+        let result = unsafe { regexec(&self.raw, c_text.as_ptr(), 0, ptr::null_mut(), 0) };
+
+        result != REG_NOMATCH
+    }
+
+    /// Find the first match in the input string.
+    ///
+    /// # Arguments
+    ///
+    /// * `text` - The string to search
+    ///
+    /// # Returns
+    ///
+    /// `Some(Match)` with the location of the first match, or `None` if no match.
+    pub fn find(&self, text: &str) -> Option<Match> {
+        let c_text = CString::new(text).ok()?;
+
+        let mut pmatch = regmatch_t {
+            rm_so: -1,
+            rm_eo: -1,
+        };
+
+        let result = unsafe {
+            regexec(
+                &self.raw,
+                c_text.as_ptr(),
+                1,
+                &mut pmatch as *mut regmatch_t,
+                0,
+            )
+        };
+
+        if result == REG_NOMATCH || pmatch.rm_so < 0 {
+            return None;
+        }
+
+        Some(Match {
+            start: pmatch.rm_so as usize,
+            end: pmatch.rm_eo as usize,
+        })
+    }
+
+    /// Find all capture groups in the input string.
+    ///
+    /// Group 0 is always the entire match. Groups 1-9 are the parenthesized
+    /// subexpressions (in BRE: `\(...\)`, in ERE: `(...)`).
+    ///
+    /// # Arguments
+    ///
+    /// * `text` - The string to search
+    ///
+    /// # Returns
+    ///
+    /// `Some(Vec<Match>)` with all capture groups, or `None` if no match.
+    /// Empty/unused groups have `start == end == 0`.
+    pub fn captures(&self, text: &str) -> Option<Vec<Match>> {
+        let c_text = CString::new(text).ok()?;
+
+        let mut pmatch: [regmatch_t; MAX_CAPTURES] = unsafe { std::mem::zeroed() };
+
+        let result = unsafe {
+            regexec(
+                &self.raw,
+                c_text.as_ptr(),
+                MAX_CAPTURES,
+                pmatch.as_mut_ptr(),
+                0,
+            )
+        };
+
+        if result == REG_NOMATCH {
+            return None;
+        }
+
+        let matches: Vec<Match> = pmatch
+            .iter()
+            .map(|m| {
+                if m.rm_so >= 0 && m.rm_eo >= 0 {
+                    Match {
+                        start: m.rm_so as usize,
+                        end: m.rm_eo as usize,
+                    }
+                } else {
+                    Match::default()
+                }
+            })
+            .collect();
+
+        Some(matches)
+    }
+
+    /// Execute regex and return captures, continuing from a given offset.
+    ///
+    /// This is useful for finding multiple matches in a string.
+    ///
+    /// # Arguments
+    ///
+    /// * `text` - The string to search (full string, not a slice)
+    /// * `offset` - Byte offset to start searching from
+    ///
+    /// # Returns
+    ///
+    /// `Some(Vec<Match>)` with captures (positions relative to start of `text`),
+    /// or `None` if no match found at or after offset.
+    pub fn captures_at(&self, text: &str, offset: usize) -> Option<Vec<Match>> {
+        if offset > text.len() {
+            return None;
+        }
+
+        let substring = &text[offset..];
+        let c_text = CString::new(substring).ok()?;
+
+        let mut pmatch: [regmatch_t; MAX_CAPTURES] = unsafe { std::mem::zeroed() };
+
+        let result = unsafe {
+            regexec(
+                &self.raw,
+                c_text.as_ptr(),
+                MAX_CAPTURES,
+                pmatch.as_mut_ptr(),
+                0,
+            )
+        };
+
+        if result == REG_NOMATCH {
+            return None;
+        }
+
+        // Adjust positions to be relative to original string start
+        let matches: Vec<Match> = pmatch
+            .iter()
+            .map(|m| {
+                if m.rm_so >= 0 && m.rm_eo >= 0 {
+                    Match {
+                        start: offset + m.rm_so as usize,
+                        end: offset + m.rm_eo as usize,
+                    }
+                } else {
+                    Match::default()
+                }
+            })
+            .collect();
+
+        Some(matches)
+    }
+
+    /// Returns an iterator over all non-overlapping matches in the input.
+    pub fn find_iter<'r, 't>(&'r self, text: &'t str) -> MatchIter<'r, 't> {
+        MatchIter {
+            regex: self,
+            text,
+            offset: 0,
+        }
+    }
+
+    /// Returns the original pattern string.
+    pub fn as_str(&self) -> &str {
+        &self.pattern
+    }
+}
+
+impl Clone for Regex {
+    fn clone(&self) -> Self {
+        // Re-compile the pattern (regex_t cannot be safely copied)
+        Regex::new(&self.pattern, self.flags).expect("failed to clone already-valid regex")
+    }
+}
+
+impl Drop for Regex {
+    fn drop(&mut self) {
+        unsafe { regfree(&mut self.raw) }
+    }
+}
+
+impl std::fmt::Debug for Regex {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        f.debug_struct("Regex")
+            .field("pattern", &self.pattern)
+            .field("flags", &self.flags)
+            .finish()
+    }
+}
+
+impl PartialEq for Regex {
+    fn eq(&self, other: &Self) -> bool {
+        self.pattern == other.pattern
+            && self.flags.extended == other.flags.extended
+            && self.flags.ignore_case == other.flags.ignore_case
+    }
+}
+
+impl Eq for Regex {}
+
+/// Iterator over all non-overlapping matches in a string.
+pub struct MatchIter<'r, 't> {
+    regex: &'r Regex,
+    text: &'t str,
+    offset: usize,
+}
+
+impl<'r, 't> Iterator for MatchIter<'r, 't> {
+    type Item = Match;
+
+    fn next(&mut self) -> Option<Self::Item> {
+        if self.offset > self.text.len() {
+            return None;
+        }
+
+        let substring = &self.text[self.offset..];
+        let c_text = CString::new(substring).ok()?;
+
+        let mut pmatch = regmatch_t {
+            rm_so: -1,
+            rm_eo: -1,
+        };
+
+        let result = unsafe {
+            regexec(
+                &self.regex.raw,
+                c_text.as_ptr(),
+                1,
+                &mut pmatch as *mut regmatch_t,
+                0,
+            )
+        };
+
+        if result == REG_NOMATCH || pmatch.rm_so < 0 {
+            self.offset = self.text.len(); // Stop iteration
+            return None;
+        }
+
+        let m = Match {
+            start: self.offset + pmatch.rm_so as usize,
+            end: self.offset + pmatch.rm_eo as usize,
+        };
+
+        // Move past this match for next iteration
+        // Ensure we make progress even on zero-width matches
+        self.offset = if pmatch.rm_eo as usize > 0 {
+            self.offset + pmatch.rm_eo as usize
+        } else {
+            self.offset + 1
+        };
+
+        Some(m)
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn test_bre_simple_match() {
+        let re = Regex::bre("hello").unwrap();
+        assert!(re.is_match("hello world"));
+        assert!(re.is_match("say hello"));
+        assert!(!re.is_match("HELLO"));
+        assert!(!re.is_match("hi"));
+    }
+
+    #[test]
+    fn test_ere_simple_match() {
+        let re = Regex::ere("hello+").unwrap();
+        assert!(re.is_match("hellooooo"));
+        assert!(re.is_match("hello"));
+        assert!(!re.is_match("hell"));
+    }
+
+    #[test]
+    fn test_case_insensitive() {
+        let re = Regex::new("hello", RegexFlags::bre().ignore_case()).unwrap();
+        assert!(re.is_match("HELLO"));
+        assert!(re.is_match("Hello"));
+        assert!(re.is_match("hello"));
+    }
+
+    #[test]
+    fn test_ere_case_insensitive() {
+        let re = Regex::new("hello+", RegexFlags::ere().ignore_case()).unwrap();
+        assert!(re.is_match("HELLOOO"));
+        assert!(re.is_match("Hello"));
+    }
+
+    #[test]
+    fn test_find() {
+        let re = Regex::bre("world").unwrap();
+        let m = re.find("hello world").unwrap();
+        assert_eq!(m.start, 6);
+        assert_eq!(m.end, 11);
+        assert_eq!(m.as_str("hello world"), "world");
+    }
+
+    #[test]
+    fn test_find_no_match() {
+        let re = Regex::bre("xyz").unwrap();
+        assert!(re.find("hello world").is_none());
+    }
+
+    #[test]
+    fn test_find_iter() {
+        let re = Regex::bre("a").unwrap();
+        let matches: Vec<Match> = re.find_iter("abracadabra").collect();
+        assert_eq!(matches.len(), 5);
+        assert_eq!(matches[0], Match { start: 0, end: 1 });
+        assert_eq!(matches[1], Match { start: 3, end: 4 });
+        assert_eq!(matches[2], Match { start: 5, end: 6 });
+        assert_eq!(matches[3], Match { start: 7, end: 8 });
+        assert_eq!(matches[4], Match { start: 10, end: 11 });
+    }
+
+    #[test]
+    fn test_captures_bre() {
+        // BRE uses \( \) for groups
+        let re = Regex::bre(r"^\(.*\)$").unwrap();
+        let caps = re.captures("hello").unwrap();
+        assert_eq!(caps[0], Match { start: 0, end: 5 }); // Full match
+        assert_eq!(caps[1], Match { start: 0, end: 5 }); // Group 1
+    }
+
+    #[test]
+    fn test_captures_ere() {
+        // ERE uses ( ) for groups
+        let re = Regex::ere(r"^(.*)$").unwrap();
+        let caps = re.captures("hello").unwrap();
+        assert_eq!(caps[0], Match { start: 0, end: 5 }); // Full match
+        assert_eq!(caps[1], Match { start: 0, end: 5 }); // Group 1
+    }
+
+    #[test]
+    fn test_invalid_pattern() {
+        let result = Regex::bre("[invalid");
+        assert!(result.is_err());
+        let err = result.unwrap_err();
+        assert!(err.to_string().contains("invalid regex"));
+    }
+
+    #[test]
+    fn test_clone() {
+        let re1 = Regex::bre("hello").unwrap();
+        let re2 = re1.clone();
+        assert!(re2.is_match("hello"));
+        assert_eq!(re1.as_str(), re2.as_str());
+    }
+
+    #[test]
+    fn test_empty_pattern() {
+        // Should work on all platforms (macOS workaround)
+        let re = Regex::bre("").unwrap();
+        assert!(re.is_match("anything"));
+    }
+
+    #[test]
+    fn test_anchors() {
+        let re = Regex::bre("^hello$").unwrap();
+        assert!(re.is_match("hello"));
+        assert!(!re.is_match("hello world"));
+        assert!(!re.is_match("say hello"));
+    }
+
+    #[test]
+    fn test_special_bre_chars() {
+        // In BRE, ( is literal, \( is grouping
+        let re = Regex::bre("main(").unwrap();
+        assert!(re.is_match("int main() {"));
+    }
+
+    #[test]
+    fn test_special_ere_chars() {
+        // In ERE, ( is grouping, \( is literal
+        let re = Regex::ere(r"main\(").unwrap();
+        assert!(re.is_match("int main() {"));
+    }
+
+    #[test]
+    fn test_captures_at_empty_string() {
+        // Regression test: captures_at must use `offset > text.len()` not `offset >= text.len()`
+        // to allow patterns like ^$ to match empty strings
+        let re = Regex::bre("^$").unwrap();
+
+        // Pattern ^$ should match an empty string
+        let caps = re.captures("");
+        assert!(caps.is_some(), "^$ should match empty string");
+
+        // captures_at with offset 0 on empty string should also match
+        let caps = re.captures_at("", 0);
+        assert!(
+            caps.is_some(),
+            "captures_at(\"\", 0) should match ^$ pattern"
+        );
+
+        // The match should be at position 0..0 (zero-length match)
+        let caps = caps.unwrap();
+        assert_eq!(caps[0].start, 0);
+        assert_eq!(caps[0].end, 0);
+
+        // captures_at with offset past end should return None
+        let caps = re.captures_at("", 1);
+        assert!(caps.is_none(), "captures_at(\"\", 1) should return None");
+    }
+
+    #[test]
+    fn test_find_iter_empty_string() {
+        // Regression test: find_iter must handle empty strings correctly
+        let re = Regex::bre("^$").unwrap();
+
+        // find_iter on empty string should yield exactly one match
+        let matches: Vec<Match> = re.find_iter("").collect();
+        assert_eq!(matches.len(), 1, "^$ should match empty string once");
+        assert_eq!(matches[0], Match { start: 0, end: 0 });
+    }
+
+    #[test]
+    fn test_captures_at_end_of_string() {
+        // Test that $ anchor works at end of non-empty string
+        let re = Regex::bre("$").unwrap();
+
+        // $ should match at the end of "hello" (position 5)
+        let caps = re.captures_at("hello", 5);
+        assert!(
+            caps.is_some(),
+            "$ should match at end of string (offset == len)"
+        );
+        let caps = caps.unwrap();
+        assert_eq!(caps[0].start, 5);
+        assert_eq!(caps[0].end, 5);
+    }
+}
diff --git a/sh/Cargo.toml b/sh/Cargo.toml
index 3bec4e81b..f36f6d76c 100644
--- a/sh/Cargo.toml
+++ b/sh/Cargo.toml
@@ -6,6 +6,7 @@ edition = "2021"
 [dependencies]
 gettext-rs.workspace = true
 libc.workspace = true
+plib = { path = "../plib" }
 
 [dev-dependencies]
 plib = { path = "../plib" }
diff --git a/sh/pattern/regex.rs b/sh/pattern/regex.rs
index 3ffd7a7b0..a0ad36b9b 100644
--- a/sh/pattern/regex.rs
+++ b/sh/pattern/regex.rs
@@ -9,40 +9,15 @@
 
 use crate::pattern::parse::{BracketExpression, BracketItem, PatternItem, RangeEndpoint};
 use core::fmt;
-use std::ffi::{CStr, CString};
+use plib::regex::{Match, Regex as PlibRegex, RegexFlags};
+use std::ffi::CStr;
 use std::fmt::{Formatter, Write};
-use std::ptr;
-
-fn regex_compilation_result(
-    status_integer: libc::c_int,
-    regex: &libc::regex_t,
-) -> Result<(), String> {
-    if status_integer != 0 {
-        let mut error_buffer = vec![b'\0'; 128];
-        unsafe {
-            libc::regerror(
-                status_integer,
-                ptr::from_ref(regex),
-                error_buffer.as_mut_ptr() as *mut libc::c_char,
-                128,
-            )
-        };
-        let error = CStr::from_bytes_until_nul(&error_buffer)
-            .expect("error message returned from `libc::regerror` is an invalid CString");
-        Err(error.to_string_lossy().into_owned())
-    } else {
-        Ok(())
-    }
-}
 
-// TODO: the implementation is copied from awk, maybe we should consider putting it in a shared crate
+/// A regex wrapper that provides CStr-compatible API for shell pattern matching.
+/// Internally uses plib::regex for POSIX BRE support.
 pub struct Regex {
-    /// if the regex was initialized with an empty string,
-    /// `raw_regex` will be empty. This is to allow
-    /// empty string regexes on MacOS, which otherwise
-    /// would return a REG_EMPTY on compilation.
-    raw_regex: Option<libc::regex_t>,
-    regex_string: CString,
+    inner: PlibRegex,
+    pattern_string: String,
 }
 
 #[derive(Copy, Clone, Debug, Default, PartialEq, Eq)]
@@ -51,95 +26,58 @@ pub struct RegexMatch {
     pub end: usize,
 }
 
+impl From<Match> for RegexMatch {
+    fn from(m: Match) -> Self {
+        RegexMatch {
+            start: m.start,
+            end: m.end,
+        }
+    }
+}
+
 pub struct MatchIter<'a> {
-    string: &'a CStr,
-    next_start: usize,
-    regex: &'a Regex,
+    inner: plib::regex::MatchIter<'a, 'a>,
 }
 
 impl Iterator for MatchIter<'_> {
     type Item = RegexMatch;
     fn next(&mut self) -> Option<Self::Item> {
-        self.regex.raw_regex?;
-        if self.next_start >= self.string.to_bytes().len() {
-            return None;
-        }
-        let mut match_range = libc::regmatch_t {
-            rm_so: -1,
-            rm_eo: -1,
-        };
-        let exec_status = unsafe {
-            libc::regexec(
-                ptr::from_ref(&self.regex.raw_regex.unwrap()),
-                self.string.as_ptr().add(self.next_start),
-                1,
-                ptr::from_mut(&mut match_range),
-                0,
-            )
-        };
-        if exec_status == libc::REG_NOMATCH {
-            return None;
-        }
-        let result = RegexMatch {
-            start: self.next_start + match_range.rm_so as usize,
-            end: self.next_start + match_range.rm_eo as usize,
-        };
-        self.next_start += match_range.rm_eo as usize;
-        Some(result)
+        self.inner.next().map(RegexMatch::from)
     }
 }
 
 impl Regex {
-    pub fn new(regex: CString) -> Result<Self, String> {
-        if regex.is_empty() {
-            return Ok(Self {
-                raw_regex: None,
-                regex_string: regex,
-            });
-        }
-        let mut raw = unsafe { std::mem::zeroed::<libc::regex_t>() };
-        // difference from awk implementation: use 0 instead of REG_EXTENDED
-        let compilation_status =
-            unsafe { libc::regcomp(ptr::from_mut(&mut raw), regex.as_ptr(), 0) };
-        regex_compilation_result(compilation_status, &raw)?;
+    pub fn new(pattern: &str) -> Result<Self, String> {
+        let inner = PlibRegex::new(pattern, RegexFlags::bre()).map_err(|e| e.to_string())?;
         Ok(Self {
-            raw_regex: Some(raw),
-            regex_string: regex,
+            inner,
+            pattern_string: pattern.to_string(),
         })
     }
 
     pub fn match_locations<'a>(&'a self, string: &'a CStr) -> MatchIter<'a> {
+        // Convert CStr to &str - shell strings should always be valid UTF-8
+        let s = string.to_str().unwrap_or("");
         MatchIter {
-            next_start: 0,
-            regex: self,
-            string,
+            inner: self.inner.find_iter(s),
         }
     }
 
     pub fn matches(&self, string: &CStr) -> bool {
-        self.match_locations(string).next().is_some()
-    }
-}
-
-impl Drop for Regex {
-    fn drop(&mut self) {
-        if let Some(regex) = &mut self.raw_regex {
-            unsafe {
-                libc::regfree(ptr::from_mut(regex));
-            }
-        }
+        let s = string.to_str().unwrap_or("");
+        self.inner.is_match(s)
     }
 }
 
 impl fmt::Display for Regex {
     fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
-        write!(f, "{}", self.regex_string.to_str().unwrap())
+        write!(f, "{}", self.pattern_string)
     }
 }
 
 impl PartialEq for Regex {
     fn eq(&self, other: &Self) -> bool {
-        self.regex_string == other.regex_string
+        self.pattern_string == other.pattern_string
     }
 }
 
@@ -216,8 +154,7 @@ pub fn parsed_pattern_to_regex(parsed_pattern: &[PatternItem]) -> Result<Regex,
             PatternItem::BracketExpression(expr) => push_bracket_expression(expr, &mut regex_str),
         }
     }
-    let regex_cstr = CString::new(regex_str).expect("pattern cannot contain null characters");
-    Regex::new(regex_cstr)
+    Regex::new(&regex_str)
 }
 
 #[cfg(test)]
diff --git a/text/asa.rs b/text/asa.rs
index 4d6c21d25..e94e63990 100644
--- a/text/asa.rs
+++ b/text/asa.rs
@@ -23,7 +23,7 @@ struct Args {
 }
 
 fn asa_file(pathname: &PathBuf) -> io::Result<()> {
-    let mut reader = input_reader(pathname, false)?;
+    let mut reader = input_reader(pathname, true)?;
     let mut first_line = true;
     let mut had_output = false;
 
@@ -40,14 +40,15 @@ fn asa_file(pathname: &PathBuf) -> io::Result<()> {
             None => continue, // empty line shouldn't happen, but handle gracefully
         };
 
-        // Extract line content: skip first char, exclude trailing newline
+        // Extract line content: skip first char (may be multi-byte), exclude trailing newline
+        let first_char_len = ch.len_utf8();
         let line_end = if raw_line.ends_with('\n') {
             raw_line.len() - 1
         } else {
             raw_line.len()
         };
-        let line = if line_end > 1 {
-            &raw_line[1..line_end]
+        let line = if line_end > first_char_len {
+            &raw_line[first_char_len..line_end]
         } else {
             "" // control char only, no content
         };
@@ -112,9 +113,9 @@ fn main() -> Result<(), Box<dyn std::error::Error>> {
 
     let mut args = Args::parse();
 
-    // if no files, read from stdin
+    // if no files, read from stdin (use "-" to indicate stdin)
     if args.files.is_empty() {
-        args.files.push(PathBuf::new());
+        args.files.push(PathBuf::from("-"));
     }
 
     let mut exit_code = 0;
diff --git a/text/comm.rs b/text/comm.rs
index 0312acb36..a0ff2cb40 100644
--- a/text/comm.rs
+++ b/text/comm.rs
@@ -9,8 +9,8 @@
 
 use clap::Parser;
 use gettextrs::{bind_textdomain_codeset, setlocale, textdomain, LocaleCategory};
-use std::fs;
-use std::io::{self, BufRead, Write};
+use plib::io::input_reader;
+use std::io::{self, BufRead, BufReader, Read, Write};
 use std::path::PathBuf;
 
 const NO1: u32 = 1 << 0;
@@ -72,8 +72,8 @@ fn line_out(lead_dup: &'static str, outmask: u32, curtype: u32, s: &str) -> io::
     Ok(())
 }
 
-fn open_file(pathname: &PathBuf) -> io::Result<io::BufReader<fs::File>> {
-    Ok(io::BufReader::new(fs::File::open(pathname)?))
+fn open_file(pathname: &PathBuf) -> io::Result<BufReader<Box<dyn Read>>> {
+    input_reader(pathname, true)
 }
 
 fn comm_file(
@@ -106,10 +106,7 @@ fn comm_file(
         if buf1.is_empty() {
             line_out(lead_dup, mask, NO2, &buf2)?;
             buf2.clear();
-        } else if buf2.is_empty() {
-            line_out(lead_dup, mask, NO1, &buf1)?;
-            buf1.clear();
-        } else if buf1 < buf2 {
+        } else if buf2.is_empty() || buf1 < buf2 {
             line_out(lead_dup, mask, NO1, &buf1)?;
             buf1.clear();
         } else if buf2 < buf1 {
diff --git a/text/csplit.rs b/text/csplit.rs
index c4e12b377..fe6886712 100644
--- a/text/csplit.rs
+++ b/text/csplit.rs
@@ -6,13 +6,10 @@
 // file in the root directory of this project.
 // SPDX-License-Identifier: MIT
 //
-// TODO:
-// - err on line num == 0
-//
 
 use clap::Parser;
 use gettextrs::{bind_textdomain_codeset, setlocale, textdomain, LocaleCategory};
-use regex::Regex;
+use plib::regex::Regex;
 use std::fs::{self, File, OpenOptions};
 use std::io::{self, BufRead, Error, ErrorKind, Read, Write};
 use std::path::PathBuf;
@@ -388,7 +385,7 @@ fn process_lines(
     state.outf.as_mut().unwrap().write_all(lines.as_bytes())?;
     new_files.push(file_name);
     if !suppress {
-        println!("{}\n", lines.len());
+        println!("{}", lines.len());
     }
 
     state.close_output();
@@ -451,11 +448,7 @@ fn parse_op_rx(opstr: &str, delim: char) -> io::Result<Operand> {
     // parse string sandwiched between two delimiter chars
     let end_pos = res.unwrap();
     let re_str = &opstr[1..end_pos];
-    let res = Regex::new(re_str);
-    if res.is_err() {
-        return Err(Error::new(ErrorKind::Other, "invalid regex"));
-    }
-    let re = res.unwrap();
+    let re = Regex::bre(re_str)?;
 
     // reference offset string
     let mut offset_str = &opstr[end_pos + 1..];
@@ -497,32 +490,39 @@ fn parse_op_rx(opstr: &str, delim: char) -> io::Result<Operand> {
 /// problem parsing the operand.
 ///
 fn parse_op_repeat(opstr: &str) -> io::Result<Operand> {
-    // a regex fully describes what must be parsed
-    let re = Regex::new(r"^\{(\d*|[*])}$").unwrap();
-
-    // grab and parse capture #1, if matched
-    match re.captures(opstr) {
-        None => {}
-        Some(caps) => {
-            let numstr = caps.get(1).unwrap().as_str();
-            if numstr == "*" {
-                return Ok(Operand::Repeat(usize::MAX));
-            }
-            match numstr.parse::<usize>() {
-                Ok(n) => return Ok(Operand::Repeat(n)),
-                Err(_e) => {}
-            }
+    // Must match pattern: {num} or {*}
+    if !opstr.starts_with('{') || !opstr.ends_with('}') {
+        return Err(Error::new(
+            ErrorKind::Other,
+            "invalid repeat operand: expected {num} or {*}",
+        ));
+    }
+
+    let inner = &opstr[1..opstr.len() - 1];
+
+    if inner == "*" {
+        return Ok(Operand::Repeat(usize::MAX));
+    }
+
+    // Parse as number (must be all digits)
+    if inner.chars().all(|c| c.is_ascii_digit()) && !inner.is_empty() {
+        match inner.parse::<usize>() {
+            Ok(n) => return Ok(Operand::Repeat(n)),
+            Err(_) => {}
         }
     }
 
-    // error cases fall through to here
-    Err(Error::new(ErrorKind::Other, "invalid repeating operand"))
+    Err(Error::new(
+        ErrorKind::Other,
+        "invalid repeat operand: expected {num} or {*}",
+    ))
 }
 
 /// Parses a line number operand from a string.
 ///
 /// This function parses a line number operand from the input string. The line number operand
 /// specifies a simple positive integer indicating the line number at which to perform a split.
+/// POSIX specifies lines are numbered starting at 1.
 ///
 /// # Arguments
 ///
@@ -535,12 +535,16 @@ fn parse_op_repeat(opstr: &str) -> io::Result<Operand> {
 ///
 /// # Errors
 ///
-/// Returns an error if the input string cannot be parsed as a positive integer or if there is
-/// a problem parsing the operand.
+/// Returns an error if the input string cannot be parsed as a positive integer, is zero, or
+/// if there is a problem parsing the operand.
 ///
 fn parse_op_linenum(opstr: &str) -> io::Result<Operand> {
     // parse simple positive integer
     match opstr.parse::<usize>() {
+        Ok(0) => Err(Error::new(
+            ErrorKind::Other,
+            "line number must be greater than zero",
+        )),
         Ok(n) => Ok(Operand::LineNum(n)),
         Err(e) => {
             let msg = format!("{}", e);
@@ -580,7 +584,7 @@ fn parse_operands(args: &Args) -> io::Result<SplitOps> {
                 '/' => parse_op_rx(opstr, '/')?,
                 '%' => parse_op_rx(opstr, '%')?,
                 '{' => parse_op_repeat(opstr)?,
-                '1'..='9' => parse_op_linenum(opstr)?,
+                '0'..='9' => parse_op_linenum(opstr)?,
                 _ => return Err(Error::new(ErrorKind::Other, "invalid operand")),
             }
         };
@@ -591,6 +595,28 @@ fn parse_operands(args: &Args) -> io::Result<SplitOps> {
     Ok(SplitOps { ops })
 }
 
+/// Validates that the prefix + suffix won't exceed NAME_MAX
+fn validate_prefix(prefix: &str, suffix_len: u8) -> io::Result<()> {
+    // POSIX NAME_MAX is typically 255 on most systems (macOS, Linux, BSDs)
+    // Using a constant avoids platform-specific libc differences
+    const NAME_MAX: usize = 255;
+
+    // Maximum filename length is prefix + suffix digits
+    let max_filename_len = prefix.len() + suffix_len as usize;
+
+    if max_filename_len > NAME_MAX {
+        return Err(Error::new(
+            ErrorKind::InvalidInput,
+            format!(
+                "prefix too long: '{}' with {} digit suffix exceeds NAME_MAX ({})",
+                prefix, suffix_len, NAME_MAX
+            ),
+        ));
+    }
+
+    Ok(())
+}
+
 fn main() -> Result<(), Box<dyn std::error::Error>> {
     setlocale(LocaleCategory::LcAll, "");
     textdomain("posixutils-rs")?;
@@ -598,6 +624,9 @@ fn main() -> Result<(), Box<dyn std::error::Error>> {
 
     let args = Args::parse();
 
+    // Validate prefix won't exceed NAME_MAX
+    validate_prefix(&args.prefix, args.num)?;
+
     let ctx = parse_operands(&args)?;
 
     let mut exit_code = 0;
@@ -755,7 +784,7 @@ mod tests {
         match parse_op_repeat(opstr) {
             Err(e) => {
                 assert_eq!(e.kind(), ErrorKind::Other);
-                assert_eq!(e.to_string(), "invalid repeating operand");
+                assert!(e.to_string().starts_with("invalid repeat operand"));
             }
             _ => panic!("Expected Err"),
         }
@@ -767,7 +796,7 @@ mod tests {
         match parse_op_repeat(opstr) {
             Err(e) => {
                 assert_eq!(e.kind(), ErrorKind::Other);
-                assert_eq!(e.to_string(), "invalid repeating operand");
+                assert!(e.to_string().starts_with("invalid repeat operand"));
             }
             _ => panic!("Expected Err"),
         }
@@ -894,6 +923,7 @@ mod tests {
     #[test]
     fn test_split_c_file_1() {
         // Test valid operands
+        // In BRE, ( is literal, \( starts grouping - so use "main(" not "main\("
         let args = Args {
             prefix: String::from("c_file"),
             keep: false,
@@ -901,7 +931,7 @@ mod tests {
             suppress: false,
             filename: PathBuf::from("tests/assets/test_file_c"),
             operands: vec![
-                String::from(r"%main\(%"),
+                String::from("%main(%"),
                 String::from("/^}/+1"),
                 String::from("{3}"),
             ],
@@ -958,7 +988,7 @@ mod tests {
             suppress: false,
             filename: PathBuf::from("tests/assets/test_file_c"),
             operands: vec![
-                String::from(r"%main\(%+1"),
+                String::from("%main(%+1"),
                 String::from("/^}/+1"),
                 String::from("{3}"),
             ],
@@ -1014,7 +1044,7 @@ mod tests {
             suppress: false,
             filename: PathBuf::from("tests/assets/test_file_c"),
             operands: vec![
-                String::from(r"%main\(%-1"),
+                String::from("%main(%-1"),
                 String::from("/^}/+1"),
                 String::from("{3}"),
             ],
@@ -1071,7 +1101,7 @@ mod tests {
             suppress: false,
             filename: PathBuf::from("tests/assets/test_file_c"),
             operands: vec![
-                String::from(r"%main\(%"),
+                String::from("%main(%"),
                 String::from("/^}/"),
                 String::from("{3}"),
             ],
@@ -1128,7 +1158,7 @@ mod tests {
             suppress: false,
             filename: PathBuf::from("tests/assets/test_file_c"),
             operands: vec![
-                String::from(r"%main\(%"),
+                String::from("%main(%"),
                 String::from("/^}/-1"),
                 String::from("{3}"),
             ],
diff --git a/text/grep.rs b/text/grep.rs
index 5ee38227d..7807a0675 100644
--- a/text/grep.rs
+++ b/text/grep.rs
@@ -9,13 +9,11 @@
 
 use clap::Parser;
 use gettextrs::{bind_textdomain_codeset, setlocale, textdomain, LocaleCategory};
-use libc::{regcomp, regex_t, regexec, regfree, REG_EXTENDED, REG_ICASE, REG_NOMATCH};
+use plib::regex::{Regex, RegexFlags};
 use std::{
-    ffi::CString,
     fs::File,
     io::{self, BufRead, BufReader},
     path::{Path, PathBuf},
-    ptr,
 };
 
 /// grep - search a file for a pattern.
@@ -201,10 +199,10 @@ impl Args {
     }
 }
 
-/// Newtype over `Vec[libc::regex_t]`. Provides functionality for matching input data.
+/// Holds patterns for matching input data - either fixed strings or compiled regexes.
 enum Patterns {
     Fixed(Vec<String>, bool, bool),
-    Regex(Vec<regex_t>),
+    Regex(Vec<Regex>),
 }
 
 impl Patterns {
@@ -244,44 +242,25 @@ impl Patterns {
         } else {
             let mut ps = vec![];
 
-            let mut cflags = 0;
-            if extended_regexp {
-                cflags |= REG_EXTENDED;
-            }
+            // Build flags for regex compilation
+            let mut flags = if extended_regexp {
+                RegexFlags::ere()
+            } else {
+                RegexFlags::bre()
+            };
             if ignore_case {
-                cflags |= REG_ICASE;
+                flags = flags.ignore_case();
             }
-            for mut pattern in patterns {
-                // macOS version of [regcomp](regcomp) from `libc`
-                // provides additional check for empty regex. In this case,
-                // an error [REG_EMPTY](https://developer.apple.com/library/archive/documentation/System/Conceptual/ManPages_iPhoneOS/man3/regcomp.3.html)
-                // will be returned.
-
-                // Therefore, an empty pattern is replaced with ".*".
-                #[cfg(target_os = "macos")]
-                {
-                    pattern = if pattern.is_empty() {
-                        String::from(".*")
-                    } else {
-                        pattern
-                    };
-                }
-                pattern = if line_regexp {
+
+            for pattern in patterns {
+                // For -x option, anchor the pattern to match entire line
+                let pattern = if line_regexp {
                     format!("^{pattern}$")
                 } else {
                     pattern
                 };
 
-                let c_pattern = CString::new(pattern).map_err(|err| err.to_string())?;
-                let mut regex = unsafe { std::mem::zeroed::<regex_t>() };
-
-                let result = unsafe { regcomp(&mut regex, c_pattern.as_ptr(), cflags) };
-                if result != 0 {
-                    return Err(format!(
-                        "Error compiling regex '{}'",
-                        c_pattern.to_string_lossy()
-                    ));
-                }
+                let regex = Regex::new(&pattern, flags).map_err(|e| e.to_string())?;
                 ps.push(regex);
             }
             Ok(Self::Regex(ps))
@@ -314,25 +293,7 @@ impl Patterns {
                     }
                 })
             }
-            Patterns::Regex(patterns) => {
-                let c_input = CString::new(input).unwrap();
-                patterns.iter().any(|p| unsafe {
-                    regexec(p, c_input.as_ptr(), 0, ptr::null_mut(), 0) != REG_NOMATCH
-                })
-            }
-        }
-    }
-}
-
-impl Drop for Patterns {
-    fn drop(&mut self) {
-        match &self {
-            Patterns::Fixed(_, _, _) => {}
-            Patterns::Regex(regexes) => {
-                for regex in regexes {
-                    unsafe { regfree(regex as *const regex_t as *mut regex_t) }
-                }
-            }
+            Patterns::Regex(patterns) => patterns.iter().any(|re| re.is_match(input)),
         }
     }
 }
diff --git a/text/join.rs b/text/join.rs
index 63e1a9ffc..b39eb9598 100644
--- a/text/join.rs
+++ b/text/join.rs
@@ -129,10 +129,8 @@ fn process_files2(
                     if v == 0 {
                         println!("{}", res.join(" "));
                     }
-                } else {
-                    if v == 0 {
-                        println!("{} {}", fields1.join(" "), fields2[1..].join(" "));
-                    }
+                } else if v == 0 {
+                    println!("{} {}", fields1.join(" "), fields2[1..].join(" "));
                 }
             }
         }
diff --git a/text/sed.rs b/text/sed.rs
index 0d3feef16..5b2df7c67 100644
--- a/text/sed.rs
+++ b/text/sed.rs
@@ -9,18 +9,14 @@
 
 use clap::{command, Parser};
 use gettextrs::{bind_textdomain_codeset, gettext, setlocale, textdomain, LocaleCategory};
-use libc::{
-    ioctl, regcomp, regex_t, regexec, regmatch_t, winsize, REG_EXTENDED, STDERR_FILENO,
-    STDIN_FILENO, STDOUT_FILENO, TIOCGWINSZ,
-};
+use libc::{ioctl, winsize, STDERR_FILENO, STDIN_FILENO, STDOUT_FILENO, TIOCGWINSZ};
+use plib::regex::{Regex as PlibRegex, RegexFlags};
 use std::sync::Mutex;
 use std::{
     collections::{HashMap, HashSet},
-    ffi::CString,
     fmt::{self, Debug},
     fs::File,
     io::{BufRead, BufReader, Error, ErrorKind, Write},
-    mem::MaybeUninit,
     ops::Range,
     path::PathBuf,
 };
@@ -167,7 +163,7 @@ enum AddressToken {
     Last,
     /// Context related line number that
     /// calculated from this BRE match
-    Pattern(regex_t, String),
+    Pattern(PlibRegex, String),
     /// Used for handling char related exceptions, when parsing [`AddressRange`]
     Delimiter,
 }
@@ -267,13 +263,13 @@ enum ReplaceFlag {
     AppendToIfReplace(PathBuf), // w
 }
 
-/// Newtype for implementing [`Debug`] trait for regex_t
+/// Newtype for implementing [`Debug`] trait for Regex
 #[derive(Clone)]
-struct Regex(regex_t);
+struct Regex(PlibRegex);
 
 impl Debug for Regex {
     fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
-        f.debug_tuple("Regex").finish()
+        f.debug_tuple("Regex").field(&self.0.as_str()).finish()
     }
 }
 
@@ -444,7 +440,7 @@ impl Command {
                 reached_now.push(match token {
                     AddressToken::Number(position) => *position == line_number + 1,
                     AddressToken::Pattern(re, pattern) => {
-                        !(match_pattern(*re, pattern.clone(), line, line_number + 1)?.is_empty())
+                        !(match_pattern(re, pattern, line, line_number + 1)?.is_empty())
                     }
                     AddressToken::Last => match i {
                         0 => last_line,
@@ -480,7 +476,7 @@ impl Command {
     }
 }
 
-/// Function [`regexec`] can return from 1 to 9 range that can be nested.
+/// The regex can return from 1 to 9 range that can be nested.
 /// [`delete_nested_ranges`] function deletes ranges that contain another ranges.
 fn delete_nested_ranges(mut ranges: Vec<(usize, Range<usize>)>) -> Vec<(usize, Range<usize>)> {
     let mut result: Vec<(usize, Range<usize>)> = Vec::new();
@@ -496,8 +492,8 @@ fn delete_nested_ranges(mut ranges: Vec<(usize, Range<usize>)>) -> Vec<(usize, R
     result
 }
 
-/// Function [`regexec`] can return from 1 to 9 range. Some
-/// of them cam be invalid for usage. So this function filter
+/// The regex can return from 1 to 9 range. Some
+/// of them can be invalid for usage. So this function filters
 /// invalid ranges.
 fn filter_groups(groups: &mut Vec<(usize, Range<usize>)>, pattern: &str, haystack: &str) {
     groups.retain(|(_, m)| {
@@ -599,54 +595,62 @@ fn sort_groups(match_subranges: &mut [HashMap<usize, Range<usize>>]) {
 /// [`re`] - pattern for search in haystack
 /// [`line_number`] - current line number in input file, used in error message
 fn match_pattern(
-    re: regex_t,
-    pattern: String,
+    re: &PlibRegex,
+    pattern: &str,
     haystack: &str,
-    line_number: usize,
+    _line_number: usize,
 ) -> Result<Vec<HashMap<usize, std::ops::Range<usize>>>, SedError> {
-    let match_t: regmatch_t = unsafe { MaybeUninit::zeroed().assume_init() };
     let mut match_subranges = vec![];
-    let mut i = 0;
-    let mut last_offset = 0;
-    let c_input = CString::new(haystack).map_err(|err| {
-        SedError::ScriptParse(
-            format!(
-                "line {} contains nul byte in {} position",
-                line_number,
-                err.nul_position()
-            ),
-            None,
-        )
-    })?;
-    let mut c_input = c_input.as_ptr();
-    while i <= haystack.len() {
-        let mut pmatch = vec![match_t; 9];
-        unsafe {
-            c_input = c_input.add(last_offset);
-            let _ = regexec(&re as *const regex_t, c_input, 9, pmatch.as_mut_ptr(), 0);
-        }
+    let mut offset = 0;
+
+    while offset <= haystack.len() {
+        let Some(matches) = re.captures_at(haystack, offset) else {
+            break;
+        };
 
-        let mut groups = pmatch
-            .to_vec()
+        // The whole match is always in matches[0]
+        let whole_match = &matches[0];
+
+        // Convert plib::regex matches to (group_number, Range) format
+        // In sed, group numbers are 1-9 (not 0-indexed)
+        // A capture group is "used" if it's not at position 0,0 OR if it matches the whole match position
+        let mut groups: Vec<(usize, Range<usize>)> = matches
             .iter()
             .enumerate()
-            .filter(|(_, m)| !((m.rm_so < 0) && (m.rm_eo < 0)))
-            .map(|(j, m)| (j + 1, ((m.rm_so as usize) + i)..((m.rm_eo as usize) + i)))
-            .collect::<Vec<_>>();
+            .skip(1) // Skip group 0 (whole match)
+            .filter(|(_, m)| {
+                // Filter out unused capture groups
+                // An unused group in plib::regex is Match::default() = {0, 0}
+                // A used group will either:
+                // - Have non-zero start/end, OR
+                // - Be at the same position as the whole match (for zero-length matches)
+                (m.start != 0 || m.end != 0)
+                    || (m.start == whole_match.start && m.end == whole_match.end)
+            })
+            .map(|(j, m)| (j, m.start..m.end))
+            .collect();
 
-        filter_groups(&mut groups, &pattern, haystack);
-        last_offset = groups
-            .iter()
-            .map(|(_, r)| r.end - r.start)
-            .max()
-            .unwrap_or(0);
-        if last_offset == 0 {
-            last_offset = 1;
+        // For simple patterns without capture groups, use the whole match as group 1
+        // This handles patterns like "foo", "^", "$", ".*", etc.
+        if groups.is_empty() {
+            groups.push((1, whole_match.start..whole_match.end));
         }
-        i += last_offset;
+
+        filter_groups(&mut groups, pattern, haystack);
+
+        // Advance past this match
+        // Use the whole match end position, ensuring we always move forward
+        let next_offset = if whole_match.end > offset {
+            whole_match.end
+        } else {
+            offset + 1
+        };
+
+        offset = next_offset;
         match_subranges.push(groups);
     }
-    filter_groups_when_line_size_check_in_pattern(&mut match_subranges, &pattern);
+
+    filter_groups_when_line_size_check_in_pattern(&mut match_subranges, pattern);
     let mut match_subranges = delete_groups_duplicates(match_subranges);
     sort_groups(&mut match_subranges);
 
@@ -1246,51 +1250,23 @@ fn parse_replace_flags(chars: &[char], i: &mut usize) -> Result<Vec<ReplaceFlag>
     Ok(flags)
 }
 
-/// Compiles [`pattern`] as [`regex_t`]
-fn compile_regex(pattern: String) -> Result<regex_t, SedError> {
-    #[cfg(target_os = "macos")]
-    let mut pattern = pattern.replace("\\\\", "\\");
-    #[cfg(all(unix, not(target_os = "macos")))]
+/// Compiles [`pattern`] as a POSIX regex (BRE or ERE based on ERE flag)
+fn compile_regex(pattern: String) -> Result<PlibRegex, SedError> {
+    // Normalize backslash escapes
     let pattern = pattern.replace("\\\\", "\\");
-    let mut cflags = 0;
-    let ere = ERE.lock().unwrap();
-    if *ere {
-        cflags |= REG_EXTENDED;
-    }
-
-    // macOS version of [regcomp](regcomp) from `libc` provides additional check
-    // for empty regex. In this case, an error
-    // [REG_EMPTY](https://developer.apple.com/library/archive/documentation/System/Conceptual/ManPages_iPhoneOS/man3/regcomp.3.html)
-    // will be returned. Therefore, an empty pattern is replaced with ".*".
-    #[cfg(target_os = "macos")]
-    {
-        pattern = if pattern == "" {
-            String::from(".*")
-        } else {
-            pattern
-        };
-    }
 
-    let c_pattern = CString::new(pattern.clone()).map_err(|err| {
-        SedError::ScriptParse(
-            format!(
-                "pattern '{}' contains nul byte in {} position",
-                pattern,
-                err.nul_position()
-            ),
-            None,
-        )
-    })?;
-    let mut regex = unsafe { std::mem::zeroed::<regex_t>() };
-
-    if unsafe { regcomp(&mut regex, c_pattern.as_ptr(), cflags) } == 0 {
-        Ok(regex)
+    // Check ERE flag to determine regex mode
+    let ere = ERE.lock().unwrap();
+    let flags = if *ere {
+        RegexFlags::ere()
     } else {
-        Err(SedError::ScriptParse(
-            format!("can't compile pattern '{}'", pattern),
-            None,
-        ))
-    }
+        RegexFlags::bre()
+    };
+
+    // plib::regex handles macOS empty pattern workaround internally
+    PlibRegex::new(&pattern, flags).map_err(|e| {
+        SedError::ScriptParse(format!("can't compile pattern '{}': {}", pattern, e), None)
+    })
 }
 
 fn screen_width() -> Option<usize> {
@@ -1794,7 +1770,7 @@ fn execute_replace(
     let Command::Replace(_, re, pattern, replacement, flags) = command else {
         unreachable!();
     };
-    let match_subranges = match_pattern(re.0, pattern, pattern_space, line_number)?;
+    let match_subranges = match_pattern(&re.0, &pattern, pattern_space, line_number)?;
     let is_replace_n = |f: &ReplaceFlag| {
         let ReplaceFlag::ReplaceNth(_) = f.clone() else {
             return false;
@@ -1906,7 +1882,7 @@ struct Sed {
     /// [`true`] if since last t at least one replacement [`Command`]
     /// was performed in cycle limits
     has_replacements_since_t: bool,
-    /// Last regex_t in applied [`Command`]  
+    /// Last regex pattern in applied [`Command`]
     last_regex: Option<Regex>,
     /// Next line for processing
     next_line: String,
diff --git a/text/tests/asa/mod.rs b/text/tests/asa/mod.rs
index e73c9ce14..8513d8d83 100644
--- a/text/tests/asa/mod.rs
+++ b/text/tests/asa/mod.rs
@@ -162,3 +162,27 @@ fn asa_fortran_style_report() {
     let expected = "\x0cREPORT TITLE\n\nDATA LINE 1\nDATA LINE 2\n\nSECTION 2\nDATA LINE 3\n";
     asa_test(input, expected);
 }
+
+// Test multi-byte UTF-8 content (control char is ASCII, content is UTF-8)
+#[test]
+fn asa_utf8_content() {
+    asa_test(" héllo wörld\n", "héllo wörld\n");
+}
+
+#[test]
+fn asa_cjk_content() {
+    asa_test(" 日本語テスト\n", "日本語テスト\n");
+}
+
+// Test multi-byte UTF-8 as control character (non-standard, treated as space per POSIX)
+#[test]
+fn asa_multibyte_control_char() {
+    // Multi-byte char as control: treated as unknown, like space
+    asa_test("éhello\n", "hello\n");
+}
+
+#[test]
+fn asa_cjk_control_char() {
+    // 3-byte CJK char as control: treated as unknown, like space
+    asa_test("日test\n", "test\n");
+}
diff --git a/text/tests/comm/comm.12 b/text/tests/comm/comm.12
new file mode 100644
index 000000000..e494b5f62
--- /dev/null
+++ b/text/tests/comm/comm.12
@@ -0,0 +1,2 @@
+banana
+carrot
diff --git a/text/tests/comm/comm.123 b/text/tests/comm/comm.123
new file mode 100644
index 000000000..e69de29bb
diff --git a/text/tests/comm/comm.13 b/text/tests/comm/comm.13
new file mode 100644
index 000000000..60fffd18f
--- /dev/null
+++ b/text/tests/comm/comm.13
@@ -0,0 +1 @@
+date
diff --git a/text/tests/comm/comm.23 b/text/tests/comm/comm.23
new file mode 100644
index 000000000..4c479deff
--- /dev/null
+++ b/text/tests/comm/comm.23
@@ -0,0 +1 @@
+apple
diff --git a/text/tests/comm/comm.empty b/text/tests/comm/comm.empty
new file mode 100644
index 000000000..e69de29bb
diff --git a/text/tests/comm/comm.empty_both b/text/tests/comm/comm.empty_both
new file mode 100644
index 000000000..e69de29bb
diff --git a/text/tests/comm/comm.empty_file1 b/text/tests/comm/comm.empty_file1
new file mode 100644
index 000000000..c9329061e
--- /dev/null
+++ b/text/tests/comm/comm.empty_file1
@@ -0,0 +1,3 @@
+	banana
+	carrot
+	date
diff --git a/text/tests/comm/comm.empty_file2 b/text/tests/comm/comm.empty_file2
new file mode 100644
index 000000000..53c7efe10
--- /dev/null
+++ b/text/tests/comm/comm.empty_file2
@@ -0,0 +1,3 @@
+apple
+banana
+carrot
diff --git a/text/tests/comm/mod.rs b/text/tests/comm/mod.rs
index b32773824..6028743d2 100644
--- a/text/tests/comm/mod.rs
+++ b/text/tests/comm/mod.rs
@@ -7,7 +7,7 @@
 // SPDX-License-Identifier: MIT
 //
 
-use plib::testing::{run_test, TestPlan};
+use plib::testing::{run_test, run_test_with_checker, TestPlan};
 use std::fs;
 use std::path::PathBuf;
 
@@ -65,3 +65,137 @@ fn comm_suppress_third_column() {
         "comm.3",
     );
 }
+
+#[test]
+fn comm_suppress_columns_12() {
+    run_comm_test(
+        vec!["-12", "tests/comm/comm.file1", "tests/comm/comm.file2"],
+        "comm.12",
+    );
+}
+
+#[test]
+fn comm_suppress_columns_13() {
+    run_comm_test(
+        vec!["-13", "tests/comm/comm.file1", "tests/comm/comm.file2"],
+        "comm.13",
+    );
+}
+
+#[test]
+fn comm_suppress_columns_23() {
+    run_comm_test(
+        vec!["-23", "tests/comm/comm.file1", "tests/comm/comm.file2"],
+        "comm.23",
+    );
+}
+
+#[test]
+fn comm_suppress_columns_123() {
+    run_comm_test(
+        vec!["-123", "tests/comm/comm.file1", "tests/comm/comm.file2"],
+        "comm.123",
+    );
+}
+
+#[test]
+fn comm_suppress_columns_separate_flags() {
+    // Test that -1 -2 -3 works the same as -123
+    run_comm_test(
+        vec![
+            "-1",
+            "-2",
+            "-3",
+            "tests/comm/comm.file1",
+            "tests/comm/comm.file2",
+        ],
+        "comm.123",
+    );
+}
+
+#[test]
+fn comm_empty_both_files() {
+    run_comm_test(
+        vec!["tests/comm/comm.empty", "tests/comm/comm.empty"],
+        "comm.empty_both",
+    );
+}
+
+#[test]
+fn comm_empty_file1() {
+    run_comm_test(
+        vec!["tests/comm/comm.empty", "tests/comm/comm.file2"],
+        "comm.empty_file1",
+    );
+}
+
+#[test]
+fn comm_empty_file2() {
+    run_comm_test(
+        vec!["tests/comm/comm.file1", "tests/comm/comm.empty"],
+        "comm.empty_file2",
+    );
+}
+
+#[test]
+fn comm_stdin_file1() {
+    // Test using "-" for file1 (stdin)
+    let expected_output =
+        fs::read_to_string(get_test_file_path("comm.0")).expect("Failed to read expected output");
+    let file1_content =
+        fs::read_to_string(get_test_file_path("comm.file1")).expect("Failed to read file1");
+
+    run_test(TestPlan {
+        cmd: String::from("comm"),
+        args: vec![String::from("-"), String::from("tests/comm/comm.file2")],
+        expected_out: expected_output,
+        expected_err: String::new(),
+        stdin_data: file1_content,
+        expected_exit_code: 0,
+    });
+}
+
+#[test]
+fn comm_stdin_file2() {
+    // Test using "-" for file2 (stdin)
+    let expected_output =
+        fs::read_to_string(get_test_file_path("comm.0")).expect("Failed to read expected output");
+    let file2_content =
+        fs::read_to_string(get_test_file_path("comm.file2")).expect("Failed to read file2");
+
+    run_test(TestPlan {
+        cmd: String::from("comm"),
+        args: vec![String::from("tests/comm/comm.file1"), String::from("-")],
+        expected_out: expected_output,
+        expected_err: String::new(),
+        stdin_data: file2_content,
+        expected_exit_code: 0,
+    });
+}
+
+#[test]
+fn comm_missing_file_error() {
+    // Test error handling for missing file
+    // Note: error message text varies by OS, so we only check that stderr is non-empty
+    run_test_with_checker(
+        TestPlan {
+            cmd: String::from("comm"),
+            args: vec![
+                String::from("tests/comm/nonexistent_file"),
+                String::from("tests/comm/comm.file2"),
+            ],
+            expected_out: String::new(),
+            expected_err: String::new(), // Not used by checker
+            stdin_data: String::new(),
+            expected_exit_code: 1,
+        },
+        |_plan, output| {
+            assert!(output.stdout.is_empty(), "stdout should be empty");
+            assert!(
+                !output.stderr.is_empty(),
+                "stderr should contain error message"
+            );
+            assert_eq!(output.status.code(), Some(1), "exit code should be 1");
+        },
+    );
+}
diff --git a/text/tests/csplit/mod.rs b/text/tests/csplit/mod.rs
index 6c557907c..3b22eb9fe 100644
--- a/text/tests/csplit/mod.rs
+++ b/text/tests/csplit/mod.rs
@@ -8,7 +8,7 @@
 // SPDX-License-Identifier: MIT
 //
 
-use plib::testing::{run_test, TestPlan};
+use plib::testing::{run_test, run_test_with_checker, TestPlan};
 
 fn csplit_test(args: &[&str], test_data: &str, expected_output: &str) {
     let str_args: Vec<String> = args.iter().map(|s| String::from(*s)).collect();
@@ -44,7 +44,7 @@ fn test_csplit_text_by_lines() {
 15
 16
 17",
-        "43\n\n57\n\n31\n\n14\n\n",
+        "43\n57\n31\n14\n",
     );
     std::fs::remove_file("text00").unwrap();
     std::fs::remove_file("text01").unwrap();
@@ -57,7 +57,7 @@ fn test_csplit_text_by_lines_from_file() {
     csplit_test(
         &["-f", "text_f", "tests/assets/test_file.txt", "5", "{3}"],
         "",
-        "43\n\n57\n\n31\n\n14\n\n",
+        "43\n57\n31\n14\n",
     );
     std::fs::remove_file("text_f00").unwrap();
     std::fs::remove_file("text_f01").unwrap();
@@ -65,6 +65,8 @@ fn test_csplit_text_by_lines_from_file() {
     std::fs::remove_file("text_f03").unwrap();
 }
 
+// Note: In BRE, ( is a literal character, \( starts a grouping
+// So to match "main(" we use "main(" not "main\("
 #[test]
 fn test_csplit_c_code_by_regex() {
     csplit_test(
@@ -72,12 +74,12 @@ fn test_csplit_c_code_by_regex() {
             "-f",
             "code_c",
             "tests/assets/test_file_c",
-            r"%main\(%",
+            "%main(%",
             "/^}/+1",
             "{3}",
         ],
         "",
-        "59\n\n53\n\n53\n\n54\n\n",
+        "59\n53\n53\n54\n",
     );
     std::fs::remove_file("code_c00").unwrap();
     std::fs::remove_file("code_c01").unwrap();
@@ -92,12 +94,12 @@ fn test_csplit_c_code_by_regex_negative_offset() {
             "-f",
             "code_c_neg",
             "tests/assets/test_file_c",
-            r"%main\(%",
+            "%main(%",
             "/^}/-2",
             "{3}",
         ],
         "",
-        "12\n\n46\n\n52\n\n107\n\n",
+        "12\n46\n52\n107\n",
     );
     std::fs::remove_file("code_c_neg00").unwrap();
     std::fs::remove_file("code_c_neg01").unwrap();
@@ -113,7 +115,7 @@ fn test_csplit_c_code_by_regex_suppress() {
             "-f",
             "code_c_s",
             "tests/assets/test_file_c",
-            r"%main\(%",
+            "%main(%",
             "/^}/+1",
             "{3}",
         ],
@@ -135,12 +137,12 @@ fn test_csplit_c_code_by_regex_with_number() {
             "-n",
             "3",
             "tests/assets/test_file_c",
-            r"%main\(%",
+            "%main(%",
             "/^}/+1",
             "{3}",
         ],
         "",
-        "59\n\n53\n\n53\n\n54\n\n",
+        "59\n53\n53\n54\n",
     );
     std::fs::remove_file("code_c_n000").unwrap();
     std::fs::remove_file("code_c_n001").unwrap();
@@ -153,7 +155,7 @@ fn test_csplit_regex_by_empty_lines() {
     csplit_test(
         &["-f", "empty_lines", "tests/assets/empty_line.txt", "/^$/"],
         "",
-        "6\n\n7\n\n",
+        "6\n7\n",
     );
     std::fs::remove_file("empty_lines00").unwrap();
     std::fs::remove_file("empty_lines01").unwrap();
@@ -170,7 +172,7 @@ fn test_csplit_regex_would_infloop() {
             "{*}",
         ],
         "",
-        "2\n\n",
+        "2\n",
     );
     std::fs::remove_file("would_infloop00").unwrap();
 }
@@ -180,7 +182,7 @@ fn test_csplit_regex_in_uniq() {
     csplit_test(
         &["-f", "in_uniq", "tests/assets/in_uniq", "/^$/", "{*}"],
         "",
-        "6\n\n10\n\n8\n\n9\n\n",
+        "6\n10\n8\n9\n",
     );
     std::fs::remove_file("in_uniq00").unwrap();
     std::fs::remove_file("in_uniq01").unwrap();
@@ -193,7 +195,7 @@ fn test_csplit_regex_in_uniq_2() {
     csplit_test(
         &["-f", "in_uniq_2_", "tests/assets/in_uniq", "/^$/-1", "{*}"],
         "",
-        "3\n\n10\n\n8\n\n12\n\n",
+        "3\n10\n8\n12\n",
     );
     std::fs::remove_file("in_uniq_2_00").unwrap();
     std::fs::remove_file("in_uniq_2_01").unwrap();
@@ -206,7 +208,7 @@ fn test_csplit_regex_in_uniq_3() {
     csplit_test(
         &["-f", "in_uniq_3_", "tests/assets/in_uniq", "/^$/1", "{*}"],
         "",
-        "7\n\n10\n\n8\n\n8\n\n",
+        "7\n10\n8\n8\n",
     );
     std::fs::remove_file("in_uniq_3_00").unwrap();
     std::fs::remove_file("in_uniq_3_01").unwrap();
@@ -219,10 +221,102 @@ fn test_csplit_regex_in_seq() {
     csplit_test(
         &["-f", "in_seq", "tests/assets/in_seq", "/2/", "/4/", "/6/"],
         "",
-        "1\n\n3\n\n3\n\n1\n\n",
+        "1\n3\n3\n1\n",
     );
     std::fs::remove_file("in_seq00").unwrap();
     std::fs::remove_file("in_seq01").unwrap();
     std::fs::remove_file("in_seq02").unwrap();
     std::fs::remove_file("in_seq03").unwrap();
 }
+
+// Test that line number 0 is rejected (POSIX: lines numbered starting at 1)
+#[test]
+fn test_csplit_error_line_zero() {
+    let str_args: Vec<String> = vec!["-f", "err_zero", "-", "0"]
+        .iter()
+        .map(|s| String::from(*s))
+        .collect();
+
+    run_test(TestPlan {
+        cmd: String::from("csplit"),
+        args: str_args,
+        stdin_data: String::from("line1\nline2\n"),
+        expected_out: String::from(""),
+        expected_err: String::from(
+            "Error: Custom { kind: Other, error: \"line number must be greater than zero\" }\n",
+        ),
+        expected_exit_code: 1,
+    });
+}
+
+// Test invalid BRE pattern error
+#[test]
+fn test_csplit_error_invalid_bre() {
+    let str_args: Vec<String> = vec!["-f", "err_bre", "-", "/[invalid/"]
+        .iter()
+        .map(|s| String::from(*s))
+        .collect();
+
+    // Use checker to only verify error prefix - detailed message may vary by platform
+    run_test_with_checker(
+        TestPlan {
+            cmd: String::from("csplit"),
+            args: str_args,
+            stdin_data: String::from("line1\nline2\n"),
+            expected_out: String::from(""),
+            expected_err: String::new(), // checked manually below
+            expected_exit_code: 1,
+        },
+        |_plan, output| {
+            assert_eq!(output.stdout, b"");
+            let stderr = String::from_utf8_lossy(&output.stderr);
+            assert!(
+                stderr.contains("invalid regex"),
+                "Expected error containing 'invalid regex', got: {}",
+                stderr
+            );
+            assert_eq!(output.status.code(), Some(1));
+        },
+    );
+}
+
+// Test -k option: files should be kept on error
+#[test]
+fn test_csplit_keep_files_on_error() {
+    // This test creates some files then encounters an error (line 999 doesn't exist)
+    // With -k, the files should be kept
+    let str_args: Vec<String> = vec!["-k", "-f", "keep_err", "-", "3", "999"]
+        .iter()
+        .map(|s| String::from(*s))
+        .collect();
+
+    run_test(TestPlan {
+        cmd: String::from("csplit"),
+        args: str_args,
+        stdin_data: String::from("line1\nline2\nline3\nline4\n"),
+        expected_out: String::from("11\n12\n"),
+        expected_err: String::from(""),
+        expected_exit_code: 0,
+    });
+
+    // With -k, all created files should exist
+    assert!(std::path::Path::new("keep_err00").exists());
+    assert!(std::path::Path::new("keep_err01").exists());
+    std::fs::remove_file("keep_err00").unwrap();
+    std::fs::remove_file("keep_err01").unwrap();
+}
+
+// Test BRE-specific patterns work correctly
+#[test]
+fn test_csplit_bre_patterns() {
+    // In BRE: \+ means literal +, not "one or more"
+    // In BRE: ( is literal, \( is grouping
+    // First file: "header" (6 bytes), second file: "line1\nline2\n" (12 bytes)
+    csplit_test(
+        &["-f", "bre_test", "-", "/^line/"],
+        "header\nline1\nline2\n",
+        "6\n12\n",
+    );
+    std::fs::remove_file("bre_test00").unwrap();
+    std::fs::remove_file("bre_test01").unwrap();
+}
diff --git a/text/tests/grep/mod.rs b/text/tests/grep/mod.rs
index 49ef06f6d..88a87e416 100644
--- a/text/tests/grep/mod.rs
+++ b/text/tests/grep/mod.rs
@@ -8,7 +8,7 @@
 // SPDX-License-Identifier: MIT
 //
 
-use plib::testing::{run_test, TestPlan};
+use plib::testing::{run_test, run_test_with_checker, TestPlan};
 
 const LINES_INPUT: &str =
     "line_{1}\np_line_{2}_s\n  line_{3}  \nLINE_{4}\np_LINE_{5}_s\nl_{6}\nline_{70}\n";
@@ -50,6 +50,33 @@ fn grep_test(
     });
 }
 
+/// Helper for tests that check regex error messages.
+/// Only verifies the error contains "invalid regex" - detailed message may vary by platform.
+fn grep_test_regex_error(args: &[&str], test_data: &str, expected_exit_code: i32) {
+    let str_args: Vec<String> = args.iter().map(|s| String::from(*s)).collect();
+
+    run_test_with_checker(
+        TestPlan {
+            cmd: String::from("grep"),
+            args: str_args,
+            stdin_data: String::from(test_data),
+            expected_out: String::new(),
+            expected_err: String::new(), // checked manually below
+            expected_exit_code,
+        },
+        |_plan, output| {
+            assert_eq!(output.stdout, b"");
+            let stderr = String::from_utf8_lossy(&output.stderr);
+            assert!(
+                stderr.contains("invalid regex"),
+                "Expected error containing 'invalid regex', got: {}",
+                stderr
+            );
+            assert_eq!(output.status.code(), Some(expected_exit_code));
+        },
+    );
+}
+
 #[test]
 fn test_incompatible_options() {
     grep_test(
@@ -99,13 +126,8 @@ fn test_inexisting_file_pattern() {
 
 #[test]
 fn test_regexp_compiling_error() {
-    grep_test(
-        &[INVALID_BRE],
-        "",
-        "",
-        "Error compiling regex '\\{1,3\\}'\n",
-        2,
-    );
+    // Error message comes from regerror() - detailed message may vary by platform
+    grep_test_regex_error(&[INVALID_BRE], "", 2);
 }
 
 #[test]
@@ -263,13 +285,8 @@ fn test_basic_regexp_no_messages_with_error_02() {
 
 #[test]
 fn test_basic_regexp_no_messages_with_error_03() {
-    grep_test(
-        &["-s", INVALID_BRE, "-", BAD_INPUT_FILE],
-        LINES_INPUT,
-        "",
-        "Error compiling regex '\\{1,3\\}'\n",
-        2,
-    );
+    // Error message comes from regerror() - detailed message may vary by platform
+    grep_test_regex_error(&["-s", INVALID_BRE, "-", BAD_INPUT_FILE], LINES_INPUT, 2);
 }
 
 #[test]
@@ -498,11 +515,10 @@ fn test_extended_regexp_no_messages_with_error_02() {
 
 #[test]
 fn test_extended_regexp_no_messages_with_error_03() {
-    grep_test(
+    // Error message comes from regerror() - detailed message may vary by platform
+    grep_test_regex_error(
         &["-E", "-s", INVALID_ERE, "-", BAD_INPUT_FILE],
         LINES_INPUT,
-        "",
-        "Error compiling regex '{1,3}'\n",
         2,
     );
 }
diff --git a/text/tests/sed/mod.rs b/text/tests/sed/mod.rs
index c0aff379b..a95bc66a8 100644
--- a/text/tests/sed/mod.rs
+++ b/text/tests/sed/mod.rs
@@ -7,7 +7,7 @@
 // SPDX-License-Identifier: MIT
 //
 
-use plib::testing::{run_test, TestPlan};
+use plib::testing::{run_test, run_test_with_checker, TestPlan};
 
 fn sed_test(
     args: &[&str],
@@ -28,6 +28,37 @@ fn sed_test(
     });
 }
 
+/// Helper for tests that check regex error messages.
+/// Only verifies the error starts with the expected prefix - detailed message may vary by platform.
+fn sed_test_regex_error(
+    args: &[&str],
+    test_data: &str,
+    expected_err_prefix: &str,
+    expected_exit_code: i32,
+) {
+    let str_args: Vec<String> = args.iter().map(|s| String::from(*s)).collect();
+
+    run_test_with_checker(
+        TestPlan {
+            cmd: String::from("sed"),
+            args: str_args,
+            stdin_data: String::from(test_data),
+            expected_out: String::new(),
+            expected_err: String::new(),
+            expected_exit_code,
+        },
+        |_, output| {
+            let stderr = String::from_utf8_lossy(&output.stderr);
+            assert!(
+                stderr.starts_with(expected_err_prefix),
+                "Expected stderr to start with '{}', got: '{}'",
+                expected_err_prefix,
+                stderr
+            );
+        },
+    );
+}
+
 const ABC_INPUT: &str = "abc\n";
 const SCRIPT_A: &str = "s/a/ab/g";
 const SCRIPT_B: &str = "s/b/bc/g";
@@ -1559,12 +1590,6 @@ mod tests {
                 "",
                 "sed: commands must be delimited with ';' (line: 0, col: 6)\n",
             ),
-            (
-                "s/\\(\\(x\\)/\\1\\2/",
-                "abc\nbbb\nbcb\nrbt\n@#$",
-                "",
-                "sed: can't compile pattern '\\(\\(x\\)'\n",
-            ),
             (
                 "s\na\nb\n",
                 "abc\nbbb\nbcb\nrbt\n@#$",
@@ -1576,6 +1601,14 @@ mod tests {
         for (script, input, output, err) in test_data {
             sed_test(&["-e", script], input, output, err, !err.is_empty() as i32);
         }
+
+        // Test regex compilation error separately - detailed error message varies by platform
+        sed_test_regex_error(
+            &["-e", "s/\\(\\(x\\)/\\1\\2/"],
+            "abc\nbbb\nbcb\nrbt\n@#$",
+            "sed: can't compile pattern '\\(\\(x\\)'",
+            1,
+        );
     }
 
     #[test]
@@ -2239,9 +2272,11 @@ mod tests {
                 "sed: unterminated `s' command (line: 0, col: 3)\n",
             ),
             (
+                // Pattern ^[*][[:space:]] only matches lines starting with "* "
+                // "---------------* product" does NOT start with *, so it's unchanged
                 r#"s/\(^[*][[:space:]]\)/   \1/;\/List of products:/a\ ---------------"#,
                 "List of products:\n---------------* product\n* product1",
-                "List of products:\n ---------------\n---------------   * product\n   * product1",
+                "List of products:\n ---------------\n---------------* product\n   * product1",
                 "",
             ),
         ];