feat: implement utils.rs and state.rs

utils.rs: natural sort, file fingerprinting, library ID computation, pretty title formatting, path helpers, clamp, truthy (38 tests) state.rs: atomic JSON persistence with backup rotation and fallback loading (8 tests)
2026-02-19 01:47:37 +02:00
parent 40d7ce4291
commit 6ecbeb9a9b
3 changed files with 947 additions and 0 deletions
@@ -1,3 +1,6 @@
 pub mod state;
 pub mod utils;
 #[cfg_attr(mobile, tauri::mobile_entry_point)]
 pub fn run() {
    tauri::Builder::default()
@@ -0,0 +1,247 @@
 use serde_json::Value;
 use std::fs;
 use std::path::Path;
 /// Default number of rolling backups to keep.
 pub const BACKUP_COUNT: usize = 8;
 /// Write JSON data to a file atomically with backup rotation.
 ///
 /// Creates rolling backups (.bak1 through .bakN) and a .lastgood copy
 /// for crash recovery.
 ///
 /// For a file `foo.json`, backups are `foo.json.bak1`, `foo.json.tmp`, etc.
 pub fn atomic_write_json(path: &Path, data: &Value, backup_count: usize) {
    // Create parent directories if needed
    if let Some(parent) = path.parent() {
        fs::create_dir_all(parent).ok();
    }
    let path_str = path.as_os_str().to_string_lossy();
    let tmp = Path::new(&*format!("{}.tmp", path_str)).to_path_buf();
    let payload = serde_json::to_string_pretty(data).expect("failed to serialize JSON");
    if path.exists() {
        // Rotate existing backups: move .bakN -> .bak(N+1), down to .bak1 -> .bak2
        for i in (1..=backup_count).rev() {
            let src = Path::new(&*format!("{}.bak{}", path_str, i)).to_path_buf();
            let dst = Path::new(&*format!("{}.bak{}", path_str, i + 1)).to_path_buf();
            if src.exists() {
                // Remove dst if it exists, then rename src -> dst
                fs::remove_file(&dst).ok();
                fs::rename(&src, &dst).ok();
            }
        }
        // Move current file to .bak1
        let bak1 = Path::new(&*format!("{}.bak1", path_str)).to_path_buf();
        fs::remove_file(&bak1).ok();
        fs::rename(path, &bak1).ok();
    }
    // Write atomically via tmp file
    fs::write(&tmp, &payload).expect("failed to write tmp file");
    fs::rename(&tmp, path).expect("failed to rename tmp to primary");
    // Keep a .lastgood copy for recovery
    let lastgood = Path::new(&*format!("{}.lastgood", path_str)).to_path_buf();
    fs::write(&lastgood, &payload).ok();
 }
 /// Load JSON from path, falling back to backups if the primary is corrupted.
 ///
 /// Tries: path -> .lastgood -> .bak1 -> .bak2 -> ... -> .bak{backup_count+2}
 /// Returns `None` if all candidates fail.
 pub fn load_json_with_fallbacks(path: &Path, backup_count: usize) -> Option<Value> {
    let path_str = path.as_os_str().to_string_lossy();
    // Build candidate list: primary, lastgood, bak1..bak{backup_count+2}
    let mut candidates: Vec<std::path::PathBuf> = Vec::new();
    candidates.push(path.to_path_buf());
    candidates.push(Path::new(&*format!("{}.lastgood", path_str)).to_path_buf());
    for i in 1..=(backup_count + 2) {
        candidates.push(Path::new(&*format!("{}.bak{}", path_str, i)).to_path_buf());
    }
    for p in &candidates {
        if p.exists() {
            if let Ok(text) = fs::read_to_string(p) {
                if let Ok(val) = serde_json::from_str::<Value>(&text) {
                    return Some(val);
                }
            }
        }
    }
    None
 }
 #[cfg(test)]
 mod tests {
    use super::*;
    use serde_json::json;
    use tempfile::TempDir;
    /// Helper: path to a JSON file inside a temp dir.
    fn json_path(dir: &TempDir) -> std::path::PathBuf {
        dir.path().join("data.json")
    }
    #[test]
    fn test_write_and_read_round_trip() {
        let dir = TempDir::new().unwrap();
        let path = json_path(&dir);
        let data = json!({"key": "value", "num": 42});
        atomic_write_json(&path, &data, BACKUP_COUNT);
        let loaded = load_json_with_fallbacks(&path, BACKUP_COUNT);
        assert_eq!(loaded, Some(data));
    }
    #[test]
    fn test_fallback_to_lastgood_when_primary_corrupted() {
        let dir = TempDir::new().unwrap();
        let path = json_path(&dir);
        let data = json!({"status": "good"});
        // Write valid data (creates primary + lastgood)
        atomic_write_json(&path, &data, BACKUP_COUNT);
        // Corrupt the primary file
        fs::write(&path, "NOT VALID JSON!!!").unwrap();
        let loaded = load_json_with_fallbacks(&path, BACKUP_COUNT);
        assert_eq!(loaded, Some(data));
    }
    #[test]
    fn test_fallback_to_bak1_when_primary_and_lastgood_corrupted() {
        let dir = TempDir::new().unwrap();
        let path = json_path(&dir);
        let path_str = path.as_os_str().to_string_lossy().to_string();
        let first = json!({"version": 1});
        let second = json!({"version": 2});
        // First write — creates primary + lastgood
        atomic_write_json(&path, &first, BACKUP_COUNT);
        // Second write — rotates first to .bak1, writes second as primary + lastgood
        atomic_write_json(&path, &second, BACKUP_COUNT);
        // Corrupt primary and lastgood
        fs::write(&path, "CORRUPT").unwrap();
        let lastgood = format!("{}.lastgood", path_str);
        fs::write(&lastgood, "ALSO CORRUPT").unwrap();
        // Should fall back to .bak1 which has first version
        let loaded = load_json_with_fallbacks(&path, BACKUP_COUNT);
        assert_eq!(loaded, Some(first));
    }
    #[test]
    fn test_backup_rotation_after_multiple_writes() {
        let dir = TempDir::new().unwrap();
        let path = json_path(&dir);
        let path_str = path.as_os_str().to_string_lossy().to_string();
        // Write 5 times with distinct values
        for i in 1..=5 {
            let data = json!({"write": i});
            atomic_write_json(&path, &data, BACKUP_COUNT);
        }
        // Primary should be the latest (write 5)
        let primary: Value =
            serde_json::from_str(&fs::read_to_string(&path).unwrap()).unwrap();
        assert_eq!(primary, json!({"write": 5}));
        // .bak1 should be the second-to-last (write 4)
        let bak1_path = format!("{}.bak1", path_str);
        let bak1: Value =
            serde_json::from_str(&fs::read_to_string(&bak1_path).unwrap()).unwrap();
        assert_eq!(bak1, json!({"write": 4}));
        // .bak2 should be write 3
        let bak2_path = format!("{}.bak2", path_str);
        let bak2: Value =
            serde_json::from_str(&fs::read_to_string(&bak2_path).unwrap()).unwrap();
        assert_eq!(bak2, json!({"write": 3}));
        // .bak3 should be write 2
        let bak3_path = format!("{}.bak3", path_str);
        let bak3: Value =
            serde_json::from_str(&fs::read_to_string(&bak3_path).unwrap()).unwrap();
        assert_eq!(bak3, json!({"write": 2}));
        // .bak4 should be write 1
        let bak4_path = format!("{}.bak4", path_str);
        let bak4: Value =
            serde_json::from_str(&fs::read_to_string(&bak4_path).unwrap()).unwrap();
        assert_eq!(bak4, json!({"write": 1}));
    }
    #[test]
    fn test_load_nonexistent_returns_none() {
        let dir = TempDir::new().unwrap();
        let path = dir.path().join("does_not_exist.json");
        let loaded = load_json_with_fallbacks(&path, BACKUP_COUNT);
        assert_eq!(loaded, None);
    }
    #[test]
    fn test_parent_directories_created() {
        let dir = TempDir::new().unwrap();
        let path = dir.path().join("sub").join("dir").join("nested.json");
        let data = json!({"nested": true});
        atomic_write_json(&path, &data, BACKUP_COUNT);
        let loaded = load_json_with_fallbacks(&path, BACKUP_COUNT);
        assert_eq!(loaded, Some(data));
    }
    #[test]
    fn test_lastgood_written() {
        let dir = TempDir::new().unwrap();
        let path = json_path(&dir);
        let path_str = path.as_os_str().to_string_lossy().to_string();
        let data = json!({"lg": true});
        atomic_write_json(&path, &data, BACKUP_COUNT);
        let lastgood_path = format!("{}.lastgood", path_str);
        let lg: Value =
            serde_json::from_str(&fs::read_to_string(&lastgood_path).unwrap()).unwrap();
        assert_eq!(lg, data);
    }
    #[test]
    fn test_backup_count_respected() {
        let dir = TempDir::new().unwrap();
        let path = json_path(&dir);
        let path_str = path.as_os_str().to_string_lossy().to_string();
        let small_count = 2;
        // Write 5 times with a backup_count of 2
        for i in 1..=5 {
            let data = json!({"write": i});
            atomic_write_json(&path, &data, small_count);
        }
        // With backup_count=2, rotation only goes up to .bak2 -> .bak3
        // After 5 writes: primary=5, bak1=4, bak2=3, bak3=2 (pushed from bak2)
        // .bak1 should exist
        let bak1_path = format!("{}.bak1", path_str);
        assert!(Path::new(&bak1_path).exists());
        // .bak2 should exist
        let bak2_path = format!("{}.bak2", path_str);
        assert!(Path::new(&bak2_path).exists());
        // .bak3 should exist (rotated from bak2)
        let bak3_path = format!("{}.bak3", path_str);
        assert!(Path::new(&bak3_path).exists());
    }
 }
@@ -0,0 +1,697 @@
 use once_cell::sync::Lazy;
 use regex::Regex;
 use sha2::{Digest, Sha256};
 use std::cmp::Ordering;
 use std::fs;
 use std::io::{Read, Seek, SeekFrom};
 use std::path::Path;
 // ---------------------------------------------------------------------------
 // 1. clamp
 // ---------------------------------------------------------------------------
 /// Clamp value `v` to the range `[a, b]`.
 pub fn clamp(v: f64, a: f64, b: f64) -> f64 {
    a.max(b.min(v))
 }
 // ---------------------------------------------------------------------------
 // 2. is_within_root
 // ---------------------------------------------------------------------------
 /// Check if `target` path is within (or equal to) the `root` directory.
 /// Prevents path-traversal attacks.
 pub fn is_within_root(root: &Path, target: &Path) -> bool {
    match (root.canonicalize(), target.canonicalize()) {
        (Ok(r), Ok(t)) => {
            t == r || t.starts_with(&r)
        }
        _ => false,
    }
 }
 // ---------------------------------------------------------------------------
 // 3. truthy
 // ---------------------------------------------------------------------------
 /// Convert a `serde_json::Value` to bool.
 ///
 /// Handles bool, number (nonzero == true), and string ("1","true","yes","y","on").
 pub fn truthy(v: &serde_json::Value) -> bool {
    match v {
        serde_json::Value::Bool(b) => *b,
        serde_json::Value::Number(n) => {
            if let Some(i) = n.as_i64() {
                i != 0
            } else if let Some(f) = n.as_f64() {
                f != 0.0
            } else {
                false
            }
        }
        serde_json::Value::String(s) => {
            matches!(s.trim().to_lowercase().as_str(), "1" | "true" | "yes" | "y" | "on")
        }
        _ => false,
    }
 }
 // ---------------------------------------------------------------------------
 // 4. folder_display_name
 // ---------------------------------------------------------------------------
 /// Get a display-friendly name for a folder path (last component).
 pub fn folder_display_name(path_str: &str) -> String {
    let p = Path::new(path_str);
    match p.file_name() {
        Some(name) => name.to_string_lossy().to_string(),
        None => path_str.to_string(),
    }
 }
 // ---------------------------------------------------------------------------
 // 5. deduplicate_list
 // ---------------------------------------------------------------------------
 /// Remove duplicates from a list while preserving order.
 /// Skips empty / whitespace-only strings. Items are trimmed.
 pub fn deduplicate_list(items: &[String]) -> Vec<String> {
    let mut seen = std::collections::HashSet::new();
    let mut result = Vec::new();
    for item in items {
        let s = item.trim().to_string();
        if !s.is_empty() && seen.insert(s.clone()) {
            result.push(s);
        }
    }
    result
 }
 // ---------------------------------------------------------------------------
 // 6. natural_key
 // ---------------------------------------------------------------------------
 /// One part of a natural sort key: either a number or a lowercased text fragment.
 #[derive(Debug, Clone, PartialEq, Eq)]
 pub enum NaturalKeyPart {
    Num(u64),
    Text(String),
 }
 impl PartialOrd for NaturalKeyPart {
    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
        Some(self.cmp(other))
    }
 }
 impl Ord for NaturalKeyPart {
    fn cmp(&self, other: &Self) -> Ordering {
        match (self, other) {
            (NaturalKeyPart::Num(a), NaturalKeyPart::Num(b)) => a.cmp(b),
            (NaturalKeyPart::Text(a), NaturalKeyPart::Text(b)) => a.cmp(b),
            // Numbers sort before text (matches Python behaviour where int < str
            // is not directly defined, but in practice natural_key is only compared
            // against keys of the same structure).
            (NaturalKeyPart::Num(_), NaturalKeyPart::Text(_)) => Ordering::Less,
            (NaturalKeyPart::Text(_), NaturalKeyPart::Num(_)) => Ordering::Greater,
        }
    }
 }
 static NUM_SPLIT_RE: Lazy<Regex> = Lazy::new(|| Regex::new(r"(\d+)").unwrap());
 /// Generate a sort key for natural sorting (e.g., "2" sorts before "10").
 ///
 /// Splits the string on digit runs; numeric parts become `Num`, the rest become
 /// lower-cased `Text`.
 pub fn natural_key(s: &str) -> Vec<NaturalKeyPart> {
    let mut parts = Vec::new();
    let mut last_end = 0;
    for m in NUM_SPLIT_RE.find_iter(s) {
        // Text before this match
        if m.start() > last_end {
            parts.push(NaturalKeyPart::Text(
                s[last_end..m.start()].to_lowercase(),
            ));
        }
        // The numeric match
        let num: u64 = m.as_str().parse().unwrap_or(u64::MAX);
        parts.push(NaturalKeyPart::Num(num));
        last_end = m.end();
    }
    // Trailing text after the last match (or the entire string if no digits)
    if last_end < s.len() {
        parts.push(NaturalKeyPart::Text(s[last_end..].to_lowercase()));
    }
    // If the input was empty, return a single empty Text part so comparisons
    // never deal with an empty vec.
    if parts.is_empty() {
        parts.push(NaturalKeyPart::Text(String::new()));
    }
    parts
 }
 // ---------------------------------------------------------------------------
 // 7. smart_title_case
 // ---------------------------------------------------------------------------
 /// Words that should remain lowercase in title case (except at start).
 const SMALL_WORDS: &[&str] = &[
    "a", "an", "the", "and", "or", "but", "for", "nor", "as", "at", "by", "in", "of", "on",
    "per", "to", "vs", "via", "with", "into", "from",
 ];
 static WHITESPACE_SPLIT_RE: Lazy<Regex> = Lazy::new(|| Regex::new(r"(\s+)").unwrap());
 /// Convert text to title case, keeping small words lowercase (except at start).
 /// Words containing digits or all-uppercase words (acronyms) are preserved as-is.
 pub fn smart_title_case(text: &str) -> String {
    let trimmed = text.trim();
    if trimmed.is_empty() {
        return String::new();
    }
    // Split while keeping whitespace tokens (odd indices are whitespace).
    let tokens: Vec<&str> = WHITESPACE_SPLIT_RE.split(trimmed).collect();
    let spaces: Vec<&str> = WHITESPACE_SPLIT_RE
        .find_iter(trimmed)
        .map(|m| m.as_str())
        .collect();
    let mut out = String::new();
    let mut word_index = 0usize; // count of actual words seen so far (0-based)
    for (i, token) in tokens.iter().enumerate() {
        if i > 0 {
            // Insert whitespace separator that was between tokens[i-1] and tokens[i]
            if let Some(sp) = spaces.get(i - 1) {
                out.push_str(sp);
            }
        }
        let w = *token;
        // Preserve words with digits
        if w.chars().any(|c| c.is_ascii_digit()) {
            out.push_str(w);
            word_index += 1;
            continue;
        }
        // Preserve all-caps acronyms
        if w.chars().all(|c| c.is_uppercase() || !c.is_alphabetic()) && w.chars().any(|c| c.is_uppercase()) {
            out.push_str(w);
            word_index += 1;
            continue;
        }
        let lw = w.to_lowercase();
        if word_index != 0 && SMALL_WORDS.contains(&lw.as_str()) {
            out.push_str(&lw);
        } else {
            // Capitalize first character, lowercase the rest
            let mut chars = lw.chars();
            if let Some(first) = chars.next() {
                for c in first.to_uppercase() {
                    out.push(c);
                }
                out.extend(chars);
            }
        }
        word_index += 1;
    }
    out.trim().to_string()
 }
 // ---------------------------------------------------------------------------
 // 8. pretty_title_from_filename
 // ---------------------------------------------------------------------------
 static LEADING_INDEX_RE: Lazy<Regex> = Lazy::new(|| {
    Regex::new(r"^\s*(?:\(?\s*)?(?P<num>\d+)(?:\s*[.\-_]\s*\d+)*(?:\s*[.)\]\-]\s*|\s+)").unwrap()
 });
 static UNDERSCORE_RE: Lazy<Regex> = Lazy::new(|| Regex::new(r"[_]+").unwrap());
 static MULTI_SPACE_RE: Lazy<Regex> = Lazy::new(|| Regex::new(r"\s+").unwrap());
 static LEADING_PUNCT_RE: Lazy<Regex> =
    Lazy::new(|| Regex::new(r"^\s*[-\u{2013}\u{2014}:.)\]]\s*").unwrap());
 /// Convert a filename to a human-readable title.
 ///
 /// Removes extension, leading indices, underscores, and applies smart title case.
 pub fn pretty_title_from_filename(filename: &str) -> String {
    let stem = Path::new(filename)
        .file_stem()
        .map(|s| s.to_string_lossy().to_string())
        .unwrap_or_else(|| filename.to_string());
    // Replace underscores with spaces
    let base = UNDERSCORE_RE.replace_all(&stem, " ");
    let base = MULTI_SPACE_RE.replace_all(&base, " ");
    let mut base = base.trim().to_string();
    // Remove leading index numbers
    if let Some(m) = LEADING_INDEX_RE.find(&base) {
        base = base[m.end()..].trim().to_string();
    }
    // Remove leading punctuation
    let cleaned = LEADING_PUNCT_RE.replace(&base, "");
    let cleaned = MULTI_SPACE_RE.replace_all(&cleaned, " ");
    let mut base = cleaned.trim().to_string();
    // Fall back to original stem if nothing left
    if base.is_empty() {
        base = Path::new(filename)
            .file_stem()
            .map(|s| s.to_string_lossy().to_string())
            .unwrap_or_else(|| filename.to_string());
    }
    smart_title_case(&base)
 }
 // ---------------------------------------------------------------------------
 // 9. file_fingerprint
 // ---------------------------------------------------------------------------
 const FP_CHUNK_SIZE: u64 = 256 * 1024; // 256 KB
 /// Generate a content-based fingerprint (SHA-256 based) that survives renames/moves.
 ///
 /// Hash input: `b"VIDFIDv1\0"` + ascii(size) + `b"\0"` + first 256 KB + last 256 KB.
 /// Returns the first 20 hex chars of the digest.
 pub fn file_fingerprint(path: &Path) -> String {
    let size: u64 = fs::metadata(path).map(|m| m.len()).unwrap_or(0);
    let mut hasher = Sha256::new();
    hasher.update(b"VIDFIDv1\0");
    hasher.update(size.to_string().as_bytes());
    hasher.update(b"\0");
    if let Ok(mut f) = fs::File::open(path) {
        // Read head
        let head_len = std::cmp::min(size, FP_CHUNK_SIZE) as usize;
        let mut head = vec![0u8; head_len];
        if f.read_exact(&mut head).is_ok() {
            hasher.update(&head);
        }
        // Read tail if file is large enough
        if size > FP_CHUNK_SIZE {
            let tail_offset = size.saturating_sub(FP_CHUNK_SIZE);
            if f.seek(SeekFrom::Start(tail_offset)).is_ok() {
                let tail_len = (size - tail_offset) as usize;
                let mut tail = vec![0u8; tail_len];
                if f.read_exact(&mut tail).is_ok() {
                    hasher.update(&tail);
                }
            }
        }
    }
    let digest = hasher.finalize();
    format!("{:x}", digest)
        .chars()
        .take(20)
        .collect()
 }
 // ---------------------------------------------------------------------------
 // 10. compute_library_id
 // ---------------------------------------------------------------------------
 /// Compute a stable library ID from a list of file fingerprints.
 ///
 /// Hash input: `b"LIBFIDv2\0"` + each fid (sorted) joined by `b"\n"`.
 /// Returns the first 16 hex chars of the digest.
 pub fn compute_library_id(fids: &[String]) -> String {
    let mut valid_fids: Vec<&str> = fids
        .iter()
        .map(|s| s.as_str())
        .filter(|s| !s.is_empty())
        .collect();
    valid_fids.sort();
    let mut hasher = Sha256::new();
    hasher.update(b"LIBFIDv2\0");
    for fid in &valid_fids {
        hasher.update(fid.as_bytes());
        hasher.update(b"\n");
    }
    let digest = hasher.finalize();
    format!("{:x}", digest)
        .chars()
        .take(16)
        .collect()
 }
 // ===========================================================================
 // Tests
 // ===========================================================================
 #[cfg(test)]
 mod tests {
    use super::*;
    use std::io::Write;
    // -- clamp ---------------------------------------------------------------
    #[test]
    fn test_clamp_within_range() {
        assert_eq!(clamp(5.0, 0.0, 10.0), 5.0);
    }
    #[test]
    fn test_clamp_below() {
        assert_eq!(clamp(-1.0, 0.0, 10.0), 0.0);
    }
    #[test]
    fn test_clamp_above() {
        assert_eq!(clamp(15.0, 0.0, 10.0), 10.0);
    }
    #[test]
    fn test_clamp_at_boundary() {
        assert_eq!(clamp(0.0, 0.0, 10.0), 0.0);
        assert_eq!(clamp(10.0, 0.0, 10.0), 10.0);
    }
    // -- is_within_root ------------------------------------------------------
    #[test]
    fn test_is_within_root_same_dir() {
        let dir = tempfile::tempdir().unwrap();
        assert!(is_within_root(dir.path(), dir.path()));
    }
    #[test]
    fn test_is_within_root_child() {
        let dir = tempfile::tempdir().unwrap();
        let child = dir.path().join("child");
        fs::create_dir(&child).unwrap();
        assert!(is_within_root(dir.path(), &child));
    }
    #[test]
    fn test_is_within_root_outside() {
        let dir1 = tempfile::tempdir().unwrap();
        let dir2 = tempfile::tempdir().unwrap();
        assert!(!is_within_root(dir1.path(), dir2.path()));
    }
    #[test]
    fn test_is_within_root_nonexistent() {
        let dir = tempfile::tempdir().unwrap();
        let fake = dir.path().join("no_such_dir");
        assert!(!is_within_root(dir.path(), &fake));
    }
    // -- truthy --------------------------------------------------------------
    #[test]
    fn test_truthy_bool() {
        assert!(truthy(&serde_json::json!(true)));
        assert!(!truthy(&serde_json::json!(false)));
    }
    #[test]
    fn test_truthy_number() {
        assert!(truthy(&serde_json::json!(1)));
        assert!(truthy(&serde_json::json!(-1)));
        assert!(!truthy(&serde_json::json!(0)));
        assert!(truthy(&serde_json::json!(0.5)));
        assert!(!truthy(&serde_json::json!(0.0)));
    }
    #[test]
    fn test_truthy_string() {
        for s in &["1", "true", "yes", "y", "on", "TRUE", "Yes", " on "] {
            assert!(truthy(&serde_json::json!(s)), "expected truthy for {:?}", s);
        }
        for s in &["0", "false", "no", "off", "", "random"] {
            assert!(!truthy(&serde_json::json!(s)), "expected falsy for {:?}", s);
        }
    }
    #[test]
    fn test_truthy_null_and_array() {
        assert!(!truthy(&serde_json::json!(null)));
        assert!(!truthy(&serde_json::json!([])));
        assert!(!truthy(&serde_json::json!({})));
    }
    // -- folder_display_name -------------------------------------------------
    #[test]
    fn test_folder_display_name_normal() {
        assert_eq!(folder_display_name("/home/user/videos"), "videos");
    }
    #[test]
    fn test_folder_display_name_root() {
        // On unix "/" has no file_name component
        assert_eq!(folder_display_name("/"), "/");
    }
    #[test]
    fn test_folder_display_name_windows() {
        assert_eq!(folder_display_name(r"C:\Users\foo\bar"), "bar");
    }
    // -- deduplicate_list ----------------------------------------------------
    #[test]
    fn test_deduplicate_preserves_order() {
        let input: Vec<String> = vec!["a", "b", "c", "a", "b"]
            .into_iter()
            .map(String::from)
            .collect();
        assert_eq!(deduplicate_list(&input), vec!["a", "b", "c"]);
    }
    #[test]
    fn test_deduplicate_skips_empty_and_whitespace() {
        let input: Vec<String> = vec!["a", "", "  ", "b", " a "]
            .into_iter()
            .map(String::from)
            .collect();
        assert_eq!(deduplicate_list(&input), vec!["a", "b"]);
    }
    // -- natural_key ---------------------------------------------------------
    #[test]
    fn test_natural_key_basic() {
        let key = natural_key("file10name");
        assert_eq!(
            key,
            vec![
                NaturalKeyPart::Text("file".to_string()),
                NaturalKeyPart::Num(10),
                NaturalKeyPart::Text("name".to_string()),
            ]
        );
    }
    #[test]
    fn test_natural_sort_order() {
        let mut items = vec!["file10", "file2", "file1", "file20"];
        items.sort_by(|a, b| natural_key(a).cmp(&natural_key(b)));
        assert_eq!(items, vec!["file1", "file2", "file10", "file20"]);
    }
    #[test]
    fn test_natural_key_case_insensitive() {
        let k1 = natural_key("ABC");
        let k2 = natural_key("abc");
        assert_eq!(k1, k2);
    }
    #[test]
    fn test_natural_key_empty() {
        let key = natural_key("");
        assert_eq!(key, vec![NaturalKeyPart::Text(String::new())]);
    }
    // -- smart_title_case ----------------------------------------------------
    #[test]
    fn test_smart_title_case_basic() {
        assert_eq!(smart_title_case("hello world"), "Hello World");
    }
    #[test]
    fn test_smart_title_case_small_words() {
        assert_eq!(
            smart_title_case("the art of war"),
            "The Art of War"
        );
    }
    #[test]
    fn test_smart_title_case_preserves_acronyms() {
        assert_eq!(smart_title_case("learn SQL today"), "Learn SQL Today");
    }
    #[test]
    fn test_smart_title_case_preserves_digits() {
        assert_eq!(smart_title_case("lesson 3b overview"), "Lesson 3b Overview");
    }
    #[test]
    fn test_smart_title_case_empty() {
        assert_eq!(smart_title_case(""), "");
    }
    // -- pretty_title_from_filename ------------------------------------------
    #[test]
    fn test_pretty_title_basic() {
        assert_eq!(
            pretty_title_from_filename("01_introduction_to_python.mp4"),
            "Introduction to Python"
        );
    }
    #[test]
    fn test_pretty_title_with_parens_index() {
        assert_eq!(
            pretty_title_from_filename("(2) my_file.mp4"),
            "My File"
        );
    }
    #[test]
    fn test_pretty_title_no_extension() {
        assert_eq!(
            pretty_title_from_filename("hello_world"),
            "Hello World"
        );
    }
    #[test]
    fn test_pretty_title_only_numbers() {
        // When stripping removes everything, falls back to stem
        let result = pretty_title_from_filename("123.mp4");
        assert!(!result.is_empty());
    }
    // -- file_fingerprint ----------------------------------------------------
    #[test]
    fn test_file_fingerprint_small_file() {
        let dir = tempfile::tempdir().unwrap();
        let fpath = dir.path().join("test.bin");
        {
            let mut f = fs::File::create(&fpath).unwrap();
            f.write_all(b"hello world").unwrap();
        }
        let fp = file_fingerprint(&fpath);
        assert_eq!(fp.len(), 20);
        // Should be deterministic
        assert_eq!(fp, file_fingerprint(&fpath));
    }
    #[test]
    fn test_file_fingerprint_large_file() {
        let dir = tempfile::tempdir().unwrap();
        let fpath = dir.path().join("big.bin");
        {
            let mut f = fs::File::create(&fpath).unwrap();
            // Write 512 KB + 1 byte to ensure head/tail branches are hit
            let data = vec![0xABu8; 256 * 1024 + 1];
            f.write_all(&data).unwrap();
            f.write_all(&vec![0xCDu8; 256 * 1024]).unwrap();
        }
        let fp = file_fingerprint(&fpath);
        assert_eq!(fp.len(), 20);
    }
    #[test]
    fn test_file_fingerprint_nonexistent() {
        let fp = file_fingerprint(Path::new("/no/such/file/ever.bin"));
        assert_eq!(fp.len(), 20);
    }
    #[test]
    fn test_file_fingerprint_matches_python() {
        // Verify against a known value produced by the Python code.
        // Python: file_fingerprint on a file containing b"hello world" (11 bytes).
        //   h = sha256()
        //   h.update(b"VIDFIDv1\0")
        //   h.update(b"11")       # str(size)
        //   h.update(b"\0")
        //   h.update(b"hello world")  # head (< CHUNK_SIZE, no tail)
        //   digest[:20]
        //
        // We precompute this in Rust to assert compatibility.
        let mut h = Sha256::new();
        h.update(b"VIDFIDv1\0");
        h.update(b"11");
        h.update(b"\0");
        h.update(b"hello world");
        let expected: String = format!("{:x}", h.finalize()).chars().take(20).collect();
        let dir = tempfile::tempdir().unwrap();
        let fpath = dir.path().join("compat.bin");
        fs::write(&fpath, b"hello world").unwrap();
        assert_eq!(file_fingerprint(&fpath), expected);
    }
    // -- compute_library_id --------------------------------------------------
    #[test]
    fn test_compute_library_id_basic() {
        let fids = vec!["abc".to_string(), "def".to_string()];
        let id = compute_library_id(&fids);
        assert_eq!(id.len(), 16);
    }
    #[test]
    fn test_compute_library_id_order_independent() {
        let fids1 = vec!["abc".to_string(), "def".to_string()];
        let fids2 = vec!["def".to_string(), "abc".to_string()];
        assert_eq!(compute_library_id(&fids1), compute_library_id(&fids2));
    }
    #[test]
    fn test_compute_library_id_skips_empty() {
        let with_empty = vec!["abc".to_string(), "".to_string(), "def".to_string()];
        let without_empty = vec!["abc".to_string(), "def".to_string()];
        assert_eq!(
            compute_library_id(&with_empty),
            compute_library_id(&without_empty)
        );
    }
    #[test]
    fn test_compute_library_id_matches_python() {
        // Python: compute_library_id_from_fids(["abc", "def"])
        //   sorted valid = ["abc", "def"]
        //   h = sha256()
        //   h.update(b"LIBFIDv2\0")
        //   h.update(b"abc"); h.update(b"\n")
        //   h.update(b"def"); h.update(b"\n")
        //   hexdigest()[:16]
        let mut h = Sha256::new();
        h.update(b"LIBFIDv2\0");
        h.update(b"abc");
        h.update(b"\n");
        h.update(b"def");
        h.update(b"\n");
        let expected: String = format!("{:x}", h.finalize()).chars().take(16).collect();
        let fids = vec!["abc".to_string(), "def".to_string()];
        assert_eq!(compute_library_id(&fids), expected);
    }
 }