From 211f95f5ae822e027023617ba6c06140e1cfb2b8 Mon Sep 17 00:00:00 2001
From: Oleh Martsokha <o.martsokha@gmail.com>
Date: Tue, 19 May 2026 03:42:09 +0200
Subject: [PATCH 1/6] refactor(codec, engine): first-class tabular redaction
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Spreadsheets now live in their own modality. Previously CSV pretended
to be text and XLSX pretended to be CSV; this PR makes both natively
tabular, with a new TabularHandler capability trait and a
ContentHandle::Tabular variant.

Codec changes:

- New TabularHandler trait in handler/tabular/ mirroring TextHandler's
  shape: locations(), read(&loc) -> Option<TextData>,
  redact(Redactions<TabularLocation, TabularRedaction>).
- BoxedTabularHandler type-erased wrapper.
- ContentHandle::Tabular(BoxedTabularHandler) — fifth variant.
  Spreadsheets route through decode_tabular() instead of decode_text().
- transform/tabular/apply.rs — apply_tabular_redactions() helper (the
  byte-level intra-cell replacement we deleted earlier, now driven).
- CsvHandler implements TabularHandler only — the prior
  TextHandler/byte-offset path is gone, taking ~250 lines of
  locate_cells/find_field_in_line scaffolding with it. Cells are
  addressed by (row_index, column_index); row 0 = headers if present,
  row 1+ = data rows. Intra-cell start/end offsets are optional;
  omitted means redact the whole cell.
- XlsxHandler implements TabularHandler-only (stub, real
  implementation pending).
- ContentHandle gains tabular_locations(), read_tabular(),
  apply_tabular_redactions().
- handler/text/ no longer contains csv_*.rs or xlsx_*.rs — they
  moved to handler/tabular/. Folder layout now matches modality.

Engine changes:

- Document gains collect_tabular_locations, read_tabular,
  apply_tabular_redactions. value_at(&Location) now dispatches
  Location::Tabular to read_tabular instead of returning None.
- RedactionApplicator gains build_tabular_redactions, parallel to
  the text/image/audio builders. Tabular entities with text
  strategies now actually apply (mask, replace, remove, hash,
  pseudonymize, encrypt-placeholder, tokenize-placeholder).

Redaction code-review cleanup (folded into the same PR since it
touches the same file):

- entity_map and mapping_index built once at the top of apply(),
  shared across all four build phases. Old code rebuilt them per
  phase and did O(n²) linear scans over redaction_map.entries.
- text_output mask repeat uses chars().count() instead of bytes()
  — a multi-byte grapheme like 'é' now produces one mask char, not
  two.
- text/image/audio strategy → output dispatch made explicit per
  variant. Non-exhaustive fallthroughs still exist (the strategy
  enums are #[non_exhaustive]) but each warns/logs instead of
  silently producing a generic placeholder.
- Image audit placeholders now encode the strategy:
  [IMAGE_BLUR:5], [IMAGE_BLOCK:#ff0000], [IMAGE_PIXELATE:8]
  instead of a single [IMAGE_REDACTED] for everything.
- Audio placeholders similarly: [AUDIO_SILENCE], [AUDIO_REMOVE].
- Modality-mismatch (e.g. Strategy::Image on a text entity) now
  logs at trace level instead of silently dropping.
- text_output / image_output / audio_output extracted to free
  functions; they no longer hide as ::Self::method calls.

Tests:

- 4 new end-to-end tabular tests on RedactionApplicator covering
  full-cell mask, partial-cell replace, remove → empty cell,
  and modality mismatch.
- 6 new TabularHandler tests on CsvHandler covering
  locations/read/redact across header and data rows.
- Codec: 87 → 93 tests pass.
- Engine: 80 → 85 tests pass.

cargo check / clippy / doc all clean.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 crates/nvisy-codec/src/document/mod.rs        |  88 ++-
 crates/nvisy-codec/src/handler/mod.rs         |   2 +
 .../src/handler/tabular/csv_handler.rs        | 439 +++++++++++++
 .../handler/{text => tabular}/csv_loader.rs   |   2 +-
 crates/nvisy-codec/src/handler/tabular/mod.rs |  64 ++
 .../src/handler/tabular/tabular_handler.rs    |  75 +++
 .../handler/{text => tabular}/xlsx_handler.rs |  22 +-
 .../handler/{text => tabular}/xlsx_loader.rs  |   0
 .../src/handler/text/csv_handler.rs           | 512 ---------------
 crates/nvisy-codec/src/handler/text/mod.rs    |   8 -
 .../src/handler/text/text_handler.rs          |   4 +-
 crates/nvisy-codec/src/transform/mod.rs       |   1 +
 .../src/transform/tabular/apply.rs            | 102 +++
 .../nvisy-codec/src/transform/tabular/mod.rs  |   2 +
 .../src/operation/envelope/document.rs        |  36 +-
 .../src/operation/extraction/mod.rs           |   8 +-
 .../src/operation/redaction/apply.rs          | 590 +++++++++++++-----
 17 files changed, 1244 insertions(+), 711 deletions(-)
 create mode 100644 crates/nvisy-codec/src/handler/tabular/csv_handler.rs
 rename crates/nvisy-codec/src/handler/{text => tabular}/csv_loader.rs (99%)
 create mode 100644 crates/nvisy-codec/src/handler/tabular/mod.rs
 create mode 100644 crates/nvisy-codec/src/handler/tabular/tabular_handler.rs
 rename crates/nvisy-codec/src/handler/{text => tabular}/xlsx_handler.rs (64%)
 rename crates/nvisy-codec/src/handler/{text => tabular}/xlsx_loader.rs (100%)
 delete mode 100644 crates/nvisy-codec/src/handler/text/csv_handler.rs
 create mode 100644 crates/nvisy-codec/src/transform/tabular/apply.rs
diff --git a/crates/nvisy-codec/src/document/mod.rs b/crates/nvisy-codec/src/document/mod.rs
index f192d6b5..8f5fe004 100644
--- a/crates/nvisy-codec/src/document/mod.rs
+++ b/crates/nvisy-codec/src/document/mod.rs
@@ -12,7 +12,7 @@ use nvisy_core::content::{Content, ContentData, ContentSource};
 use nvisy_core::media::{
     AudioFormat, DocumentType, ImageFormat, SpreadsheetFormat, TextFormat, WordFormat,
 };
-use nvisy_ontology::entity::{AudioLocation, ImageLocation, TextLocation};
+use nvisy_ontology::entity::{AudioLocation, ImageLocation, TabularLocation, TextLocation};
 
 pub use self::located::Located;
 pub use self::span::Span;
@@ -25,23 +25,27 @@ use crate::handler::{HtmlLoader, HtmlParams};
 use crate::handler::{PdfLoader, PdfParams};
 use crate::handler::{
     AudioData, AudioHandler, BoxedAudioHandler, BoxedImageHandler, BoxedRichHandler,
-    BoxedTextHandler, CsvLoader, CsvParams, Handler, ImageData, ImageHandler, JpegLoader,
-    JpegParams, JsonLoader, JsonParams, Loader, MarkdownLoader, MarkdownParams, Mp3Loader,
-    Mp3Params, PngLoader, PngParams, TextData, TextHandler, TiffLoader, TiffParams, TxtLoader,
-    TxtParams, WavLoader, WavParams, XlsxLoader, XlsxParams,
+    BoxedTabularHandler, BoxedTextHandler, CsvLoader, CsvParams, Handler, ImageData, ImageHandler,
+    JpegLoader, JpegParams, JsonLoader, JsonParams, Loader, MarkdownLoader, MarkdownParams,
+    Mp3Loader, Mp3Params, PngLoader, PngParams, TabularHandler, TextData, TextHandler, TiffLoader,
+    TiffParams, TxtLoader, TxtParams, WavLoader, WavParams, XlsxLoader, XlsxParams,
+};
+use crate::transform::{
+    AudioRedaction, ImageRedaction, Redactions, TabularRedaction, TextRedaction,
 };
-use crate::transform::{AudioRedaction, ImageRedaction, Redactions, TextRedaction};
 
 /// A fully type-erased document that can hold any supported format.
 ///
-/// Groups documents into four modality families:
-/// - **Text**: plain text, CSV, JSON, HTML, XLSX
+/// Groups documents into five modality families:
+/// - **Text**: plain text, JSON, HTML
+/// - **Tabular**: CSV, XLSX (cell-coordinate addressed)
 /// - **Image**: PNG, JPEG, TIFF
 /// - **Audio**: WAV, MP3
 /// - **Rich**: PDF, DOCX (multi-modal documents with text + images)
 #[derive(From, IsVariant, TryInto)]
 pub enum ContentHandle {
     Text(BoxedTextHandler),
+    Tabular(BoxedTabularHandler),
     Image(BoxedImageHandler),
     Audio(BoxedAudioHandler),
     Rich(BoxedRichHandler),
@@ -60,6 +64,7 @@ impl ContentHandle {
     pub fn document_type(&self) -> DocumentType {
         match self {
             Self::Text(h) => h.document_type(),
+            Self::Tabular(h) => h.document_type(),
             Self::Image(h) => h.document_type(),
             Self::Audio(h) => h.document_type(),
             Self::Rich(h) => h.document_type(),
@@ -70,6 +75,7 @@ impl ContentHandle {
     pub fn source(&self) -> ContentSource {
         match self {
             Self::Text(h) => h.source(),
+            Self::Tabular(h) => h.source(),
             Self::Image(h) => h.source(),
             Self::Audio(h) => h.source(),
             Self::Rich(h) => h.source(),
@@ -80,6 +86,7 @@ impl ContentHandle {
     pub fn encode(&self) -> Result<ContentData, Error> {
         match self {
             Self::Text(h) => h.encode(),
+            Self::Tabular(h) => h.encode(),
             Self::Image(h) => h.encode(),
             Self::Audio(h) => h.encode(),
             Self::Rich(h) => h.encode(),
@@ -91,7 +98,15 @@ impl ContentHandle {
         match self {
             Self::Text(h) => h.locations(),
             Self::Rich(h) => TextHandler::locations(h),
-            Self::Image(_) | Self::Audio(_) => LocationStream::empty(),
+            Self::Tabular(_) | Self::Image(_) | Self::Audio(_) => LocationStream::empty(),
+        }
+    }
+
+    /// Stream tabular (cell) locations from spreadsheet documents.
+    pub fn tabular_locations(&self) -> LocationStream<'_, TabularLocation> {
+        match self {
+            Self::Tabular(h) => h.locations(),
+            _ => LocationStream::empty(),
         }
     }
 
@@ -100,7 +115,7 @@ impl ContentHandle {
         match self {
             Self::Image(h) => h.locations(),
             Self::Rich(h) => ImageHandler::locations(h),
-            Self::Text(_) | Self::Audio(_) => LocationStream::empty(),
+            Self::Text(_) | Self::Tabular(_) | Self::Audio(_) => LocationStream::empty(),
         }
     }
 
@@ -120,7 +135,15 @@ impl ContentHandle {
         match self {
             Self::Text(h) => h.read(location).await,
             Self::Rich(h) => TextHandler::read(h, location).await,
-            Self::Image(_) | Self::Audio(_) => None,
+            Self::Tabular(_) | Self::Image(_) | Self::Audio(_) => None,
+        }
+    }
+
+    /// Read the cell value at the given tabular location.
+    pub async fn read_tabular(&self, location: &TabularLocation) -> Option<TextData> {
+        match self {
+            Self::Tabular(h) => h.read(location).await,
+            _ => None,
         }
     }
 
@@ -129,7 +152,7 @@ impl ContentHandle {
         match self {
             Self::Image(h) => h.read(location).await,
             Self::Rich(h) => ImageHandler::read(h, location).await,
-            Self::Text(_) | Self::Audio(_) => None,
+            Self::Text(_) | Self::Tabular(_) | Self::Audio(_) => None,
         }
     }
 
@@ -149,7 +172,18 @@ impl ContentHandle {
         match self {
             Self::Text(h) => h.redact(redactions).await,
             Self::Rich(h) => TextHandler::redact(h, redactions).await,
-            Self::Image(_) | Self::Audio(_) => Ok(()),
+            Self::Tabular(_) | Self::Image(_) | Self::Audio(_) => Ok(()),
+        }
+    }
+
+    /// Apply a batch of tabular redactions to the document.
+    pub async fn apply_tabular_redactions(
+        &mut self,
+        redactions: Redactions<TabularLocation, TabularRedaction>,
+    ) -> Result<(), Error> {
+        match self {
+            Self::Tabular(h) => h.redact(redactions).await,
+            _ => Ok(()),
         }
     }
 
@@ -161,7 +195,7 @@ impl ContentHandle {
         match self {
             Self::Image(h) => h.redact(redactions).await,
             Self::Rich(h) => ImageHandler::redact(h, redactions).await,
-            Self::Text(_) | Self::Audio(_) => Ok(()),
+            Self::Text(_) | Self::Tabular(_) | Self::Audio(_) => Ok(()),
         }
     }
 
@@ -172,7 +206,7 @@ impl ContentHandle {
     ) -> Result<(), Error> {
         match self {
             Self::Audio(h) => h.redact(redactions).await,
-            Self::Text(_) | Self::Image(_) | Self::Rich(_) => Ok(()),
+            _ => Ok(()),
         }
     }
 
@@ -188,9 +222,8 @@ impl ContentHandle {
         let data = content.data();
 
         match doc_type {
-            DocumentType::Text(_) | DocumentType::Html | DocumentType::Spreadsheet(_) => {
-                Self::decode_text(doc_type, data).await
-            }
+            DocumentType::Text(_) | DocumentType::Html => Self::decode_text(doc_type, data).await,
+            DocumentType::Spreadsheet(_) => Self::decode_tabular(doc_type, data).await,
             DocumentType::Image(_) => Self::decode_image(doc_type, data).await,
             DocumentType::Audio(_) => Self::decode_audio(doc_type, data).await,
             DocumentType::Pdf | DocumentType::Word(_) | DocumentType::Presentation(_) => {
@@ -218,6 +251,21 @@ impl ContentHandle {
                 .decode(content, &HtmlParams::default())
                 .await?
                 .into(),
+            _ => {
+                return Err(Error::validation(
+                    format!("no text loader for: {doc_type}"),
+                    "ContentHandle::decode_text",
+                ));
+            }
+        };
+        Ok(Self::from(handler))
+    }
+
+    async fn decode_tabular(
+        doc_type: DocumentType,
+        content: &ContentData,
+    ) -> Result<Self, Error> {
+        let handler: BoxedTabularHandler = match doc_type {
             DocumentType::Spreadsheet(SpreadsheetFormat::Csv) => CsvLoader
                 .decode(content, &CsvParams::default())
                 .await?
@@ -228,8 +276,8 @@ impl ContentHandle {
             }
             _ => {
                 return Err(Error::validation(
-                    format!("no text loader for: {doc_type}"),
-                    "ContentHandle::decode_text",
+                    format!("no tabular loader for: {doc_type}"),
+                    "ContentHandle::decode_tabular",
                 ));
             }
         };
diff --git a/crates/nvisy-codec/src/handler/mod.rs b/crates/nvisy-codec/src/handler/mod.rs
index 81e1bf3f..a5229f62 100644
--- a/crates/nvisy-codec/src/handler/mod.rs
+++ b/crates/nvisy-codec/src/handler/mod.rs
@@ -15,6 +15,7 @@ use nvisy_core::media::DocumentType;
 mod audio;
 mod image;
 mod rich;
+mod tabular;
 mod text;
 
 use nvisy_core::content::ContentSource;
@@ -22,6 +23,7 @@ use nvisy_core::content::ContentSource;
 pub use self::audio::*;
 pub use self::image::*;
 pub use self::rich::*;
+pub use self::tabular::*;
 pub use self::text::*;
 
 /// Base trait implemented by all format handlers.
diff --git a/crates/nvisy-codec/src/handler/tabular/csv_handler.rs b/crates/nvisy-codec/src/handler/tabular/csv_handler.rs
new file mode 100644
index 00000000..4901366d
--- /dev/null
+++ b/crates/nvisy-codec/src/handler/tabular/csv_handler.rs
@@ -0,0 +1,439 @@
+//! CSV handler: holds parsed CSV content and provides cell-coordinate
+//! access via [`Handler`] + [`TabularHandler`].
+//!
+//! [`TabularHandler::locations`] yields one [`TabularLocation`] per
+//! cell using `(row, col)` coordinates. Row `0` is the header row
+//! (if present); row `1` is the first data row when headers exist,
+//! else row `0` is the first data row. [`TabularHandler::read`]
+//! returns the cell's value as [`TextData`].
+//! [`TabularHandler::redact`] mutates cells by coordinate, applying
+//! intra-cell byte-offset replacements via [`apply_tabular_redactions`].
+//!
+//! [`TabularLocation`]: nvisy_ontology::entity::TabularLocation
+
+use nvisy_core::Error;
+use nvisy_core::content::{ContentData, ContentSource};
+use nvisy_core::media::{DocumentType, SpreadsheetFormat};
+use nvisy_ontology::entity::TabularLocation;
+
+use crate::document::{Located, LocationStream};
+use crate::handler::text::TextData;
+use crate::handler::{Handler, TabularHandler};
+use crate::transform::{Redactions, TabularRedaction, apply_tabular_redactions};
+
+const TARGET: &str = "csv-handler";
+
+/// Parsed CSV content.
+#[derive(Debug, Clone)]
+pub struct CsvData {
+    /// Column headers, if present.
+    pub headers: Option<Vec<String>>,
+    /// Data rows (excluding the header row).
+    pub rows: Vec<Vec<String>>,
+    /// Field delimiter byte (e.g. `b','`, `b'\t'`, `b';'`).
+    pub delimiter: u8,
+    /// Whether the original source had a trailing newline.
+    pub trailing_newline: bool,
+}
+
+/// Handler for loaded CSV content.
+#[derive(Debug)]
+pub struct CsvHandler {
+    source: ContentSource,
+    data: CsvData,
+}
+
+impl Handler for CsvHandler {
+    fn document_type(&self) -> DocumentType {
+        DocumentType::Spreadsheet(SpreadsheetFormat::Csv)
+    }
+
+    fn source(&self) -> ContentSource {
+        self.source
+    }
+
+    #[tracing::instrument(name = "csv.encode", skip_all, fields(output_bytes))]
+    fn encode(&self) -> Result<ContentData, Error> {
+        let bytes = self.serialize_bytes()?;
+        tracing::Span::current().record("output_bytes", bytes.len());
+        let source = ContentSource::new().with_parent(&self.source);
+        Ok(ContentData::new(source, bytes.into()))
+    }
+}
+
+#[async_trait::async_trait]
+impl TabularHandler for CsvHandler {
+    fn locations(&self) -> LocationStream<'_, TabularLocation> {
+        let source = self.source;
+        let has_headers = self.data.headers.is_some();
+
+        let mut items: Vec<_> = Vec::new();
+
+        if let Some(headers) = &self.data.headers {
+            for (col, _) in headers.iter().enumerate() {
+                items.push(Located::new(
+                    source,
+                    TabularLocation {
+                        row_index: 0,
+                        column_index: col,
+                        start_offset: None,
+                        end_offset: None,
+                        column_name: Some(headers[col].clone()),
+                        sheet_name: None,
+                    },
+                ));
+            }
+        }
+
+        for (data_row, row) in self.data.rows.iter().enumerate() {
+            let row_index = if has_headers { data_row + 1 } else { data_row };
+            for (col, _) in row.iter().enumerate() {
+                items.push(Located::new(
+                    source,
+                    TabularLocation {
+                        row_index,
+                        column_index: col,
+                        start_offset: None,
+                        end_offset: None,
+                        column_name: self
+                            .data
+                            .headers
+                            .as_ref()
+                            .and_then(|h| h.get(col).cloned()),
+                        sheet_name: None,
+                    },
+                ));
+            }
+        }
+
+        LocationStream::new(futures::stream::iter(items))
+    }
+
+    async fn read(&self, location: &TabularLocation) -> Option<TextData> {
+        let (is_header, data_row) = self.resolve_row(location.row_index)?;
+        let cell = if is_header {
+            self.data.headers.as_ref()?.get(location.column_index)?
+        } else {
+            self.data.rows.get(data_row)?.get(location.column_index)?
+        };
+        Some(TextData::from(cell.clone()))
+    }
+
+    async fn redact(
+        &mut self,
+        redactions: Redactions<TabularLocation, TabularRedaction>,
+    ) -> Result<(), Error> {
+        if redactions.is_empty() {
+            return Ok(());
+        }
+
+        for (loc, items) in redactions {
+            let Some((is_header, data_row)) = self.resolve_row(loc.row_index) else {
+                continue;
+            };
+            let cell = if is_header {
+                let Some(headers) = self.data.headers.as_mut() else {
+                    continue;
+                };
+                let Some(cell) = headers.get_mut(loc.column_index) else {
+                    continue;
+                };
+                cell
+            } else {
+                let Some(row) = self.data.rows.get_mut(data_row) else {
+                    continue;
+                };
+                let Some(cell) = row.get_mut(loc.column_index) else {
+                    continue;
+                };
+                cell
+            };
+            apply_tabular_redactions(cell, &items, TARGET)?;
+        }
+        Ok(())
+    }
+}
+
+impl CsvHandler {
+    /// Create a new handler from parsed CSV data.
+    pub fn new(data: CsvData) -> Self {
+        Self {
+            source: ContentSource::new(),
+            data,
+        }
+    }
+
+    /// Set the content source for lineage tracking.
+    pub fn with_source(mut self, source: ContentSource) -> Self {
+        self.source = source;
+        self
+    }
+
+    /// Column headers, if present.
+    pub fn headers(&self) -> Option<&[String]> {
+        self.data.headers.as_deref()
+    }
+
+    /// All data rows.
+    pub fn rows(&self) -> &[Vec<String>] {
+        &self.data.rows
+    }
+
+    /// Mutable access to all data rows.
+    pub fn rows_mut(&mut self) -> &mut Vec<Vec<String>> {
+        &mut self.data.rows
+    }
+
+    /// A specific cell by `(data_row, col)`.
+    ///
+    /// `data_row` is 0-based against the data rows (header is *not*
+    /// data row 0). Use [`TabularLocation`] coordinates with
+    /// [`TabularHandler::read`] if you need to address the header row.
+    ///
+    /// [`TabularHandler::read`]: crate::handler::TabularHandler::read
+    pub fn cell(&self, data_row: usize, col: usize) -> Option<&str> {
+        self.data
+            .rows
+            .get(data_row)
+            .and_then(|r| r.get(col))
+            .map(|s| s.as_str())
+    }
+
+    /// Number of data rows (excluding the header).
+    pub fn len(&self) -> usize {
+        self.data.rows.len()
+    }
+
+    /// Whether the document has no data rows.
+    pub fn is_empty(&self) -> bool {
+        self.data.rows.is_empty()
+    }
+
+    /// Detected field delimiter.
+    pub fn delimiter(&self) -> u8 {
+        self.data.delimiter
+    }
+
+    /// Whether the original source had a trailing newline.
+    pub fn trailing_newline(&self) -> bool {
+        self.data.trailing_newline
+    }
+
+    /// Consume the handler and return the inner [`CsvData`].
+    pub fn into_data(self) -> CsvData {
+        self.data
+    }
+
+    /// Resolve a [`TabularLocation::row_index`] to `(is_header, data_row)`.
+    ///
+    /// Returns `None` when the row index is out of range.
+    ///
+    /// [`TabularLocation::row_index`]: nvisy_ontology::entity::TabularLocation::row_index
+    fn resolve_row(&self, row_index: usize) -> Option<(bool, usize)> {
+        if self.data.headers.is_some() {
+            if row_index == 0 {
+                Some((true, 0))
+            } else {
+                let data_row = row_index - 1;
+                (data_row < self.data.rows.len()).then_some((false, data_row))
+            }
+        } else {
+            (row_index < self.data.rows.len()).then_some((false, row_index))
+        }
+    }
+
+    /// Serialize to bytes (with CRLF→LF normalization and trailing
+    /// newline handling).
+    fn serialize_bytes(&self) -> Result<Vec<u8>, Error> {
+        let mut wtr = csv::WriterBuilder::new()
+            .delimiter(self.data.delimiter)
+            .has_headers(false)
+            .from_writer(Vec::new());
+
+        if let Some(headers) = &self.data.headers {
+            wtr.write_record(headers)
+                .map_err(|e| Error::validation(format!("CSV encode error: {e}"), TARGET))?;
+        }
+        for row in &self.data.rows {
+            wtr.write_record(row)
+                .map_err(|e| Error::validation(format!("CSV encode error: {e}"), TARGET))?;
+        }
+        let mut bytes = wtr
+            .into_inner()
+            .map_err(|e| Error::validation(format!("CSV encode error: {e}"), TARGET))?;
+
+        bytes.retain(|&b| b != b'\r');
+
+        if !self.data.trailing_newline && bytes.last() == Some(&b'\n') {
+            bytes.pop();
+        }
+
+        Ok(bytes)
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use futures::StreamExt;
+    use nvisy_core::Error;
+
+    use super::*;
+    use crate::transform::{ConflictPolicy, TextOutput};
+
+    fn handler_with_headers(headers: Vec<&str>, rows: Vec<Vec<&str>>) -> CsvHandler {
+        CsvHandler::new(CsvData {
+            headers: Some(headers.into_iter().map(String::from).collect()),
+            rows: rows
+                .into_iter()
+                .map(|r| r.into_iter().map(String::from).collect())
+                .collect(),
+            delimiter: b',',
+            trailing_newline: true,
+        })
+    }
+
+    fn handler_no_headers(rows: Vec<Vec<&str>>) -> CsvHandler {
+        CsvHandler::new(CsvData {
+            headers: None,
+            rows: rows
+                .into_iter()
+                .map(|r| r.into_iter().map(String::from).collect())
+                .collect(),
+            delimiter: b',',
+            trailing_newline: true,
+        })
+    }
+
+    fn cell_loc(row: usize, col: usize) -> TabularLocation {
+        TabularLocation::builder()
+            .with_row_index(row)
+            .with_column_index(col)
+            .build()
+            .unwrap()
+    }
+
+    #[tokio::test]
+    async fn locations_yield_header_then_rows() {
+        let h = handler_with_headers(vec!["name", "age"], vec![vec!["Alice", "30"]]);
+        let items: Vec<_> = h.locations().collect().await;
+        assert_eq!(items.len(), 4);
+        assert_eq!(items[0].location.row_index, 0);
+        assert_eq!(items[0].location.column_index, 0);
+        assert_eq!(items[0].location.column_name.as_deref(), Some("name"));
+        assert_eq!(items[2].location.row_index, 1); // first data row
+        assert_eq!(items[2].location.column_index, 0);
+    }
+
+    #[tokio::test]
+    async fn locations_no_headers_start_at_row_zero() {
+        let h = handler_no_headers(vec![vec!["a", "b"], vec!["c", "d"]]);
+        let items: Vec<_> = h.locations().collect().await;
+        assert_eq!(items.len(), 4);
+        assert_eq!(items[0].location.row_index, 0);
+        assert_eq!(items[2].location.row_index, 1);
+    }
+
+    #[tokio::test]
+    async fn read_returns_cell_value() {
+        let h = handler_with_headers(vec!["name"], vec![vec!["Alice"]]);
+        // header
+        assert_eq!(h.read(&cell_loc(0, 0)).await.unwrap().as_str(), "name");
+        // first data row
+        assert_eq!(h.read(&cell_loc(1, 0)).await.unwrap().as_str(), "Alice");
+    }
+
+    #[tokio::test]
+    async fn read_out_of_bounds_returns_none() {
+        let h = handler_with_headers(vec!["a"], vec![vec!["1"]]);
+        assert!(h.read(&cell_loc(99, 0)).await.is_none());
+        assert!(h.read(&cell_loc(0, 99)).await.is_none());
+    }
+
+    #[tokio::test]
+    async fn redact_full_cell() -> Result<(), Error> {
+        let mut h = handler_with_headers(vec!["ssn"], vec![vec!["123-45-6789"]]);
+        let mut rs = Redactions::new(ConflictPolicy::Reject);
+        rs.try_insert(
+            cell_loc(1, 0),
+            TabularRedaction::new(0, 11, TextOutput::replace("[REDACTED]")),
+        )
+        .unwrap();
+        h.redact(rs).await?;
+        assert_eq!(h.cell(0, 0), Some("[REDACTED]"));
+        Ok(())
+    }
+
+    #[tokio::test]
+    async fn redact_partial_cell() -> Result<(), Error> {
+        let mut h = handler_with_headers(vec!["bio"], vec![vec!["Alice Smith"]]);
+        let mut rs = Redactions::new(ConflictPolicy::Reject);
+        rs.try_insert(
+            cell_loc(1, 0),
+            TabularRedaction::new(0, 5, TextOutput::replace("[NAME]")),
+        )
+        .unwrap();
+        h.redact(rs).await?;
+        assert_eq!(h.cell(0, 0), Some("[NAME] Smith"));
+        Ok(())
+    }
+
+    #[tokio::test]
+    async fn redact_header() -> Result<(), Error> {
+        let mut h = handler_with_headers(vec!["secret_field"], vec![vec!["v"]]);
+        let mut rs = Redactions::new(ConflictPolicy::Reject);
+        rs.try_insert(
+            cell_loc(0, 0),
+            TabularRedaction::new(0, 12, TextOutput::replace("redacted")),
+        )
+        .unwrap();
+        h.redact(rs).await?;
+        assert_eq!(h.headers(), Some(["redacted".to_string()].as_slice()));
+        Ok(())
+    }
+
+    #[tokio::test]
+    async fn redact_unknown_row_skipped() -> Result<(), Error> {
+        let mut h = handler_with_headers(vec!["a"], vec![vec!["one"]]);
+        let mut rs = Redactions::new(ConflictPolicy::Reject);
+        rs.try_insert(
+            cell_loc(99, 0),
+            TabularRedaction::new(0, 1, TextOutput::replace("X")),
+        )
+        .unwrap();
+        h.redact(rs).await?;
+        assert_eq!(h.cell(0, 0), Some("one"));
+        Ok(())
+    }
+
+    #[test]
+    fn encode_with_headers() -> Result<(), Error> {
+        let h = handler_with_headers(
+            vec!["name", "age"],
+            vec![vec!["Alice", "30"], vec!["Bob", "25"]],
+        );
+        let content = h.encode()?;
+        assert_eq!(
+            content.as_str().expect("valid utf-8"),
+            "name,age\nAlice,30\nBob,25\n"
+        );
+        Ok(())
+    }
+
+    #[test]
+    fn encode_with_quoting() -> Result<(), Error> {
+        let h = handler_with_headers(vec!["name", "bio"], vec![vec!["Alice", "Has a, comma"]]);
+        let content = h.encode()?;
+        let text = content.as_str().expect("valid utf-8");
+        assert!(text.contains("\"Has a, comma\""));
+        Ok(())
+    }
+
+    #[test]
+    fn encode_without_trailing_newline() -> Result<(), Error> {
+        let mut h = handler_with_headers(vec!["a"], vec![vec!["1"]]);
+        h.data.trailing_newline = false;
+        let content = h.encode()?;
+        assert_eq!(content.as_str().expect("valid utf-8"), "a\n1");
+        Ok(())
+    }
+}
diff --git a/crates/nvisy-codec/src/handler/text/csv_loader.rs b/crates/nvisy-codec/src/handler/tabular/csv_loader.rs
similarity index 99%
rename from crates/nvisy-codec/src/handler/text/csv_loader.rs
rename to crates/nvisy-codec/src/handler/tabular/csv_loader.rs
index df25da0b..0d749f77 100644
--- a/crates/nvisy-codec/src/handler/text/csv_loader.rs
+++ b/crates/nvisy-codec/src/handler/tabular/csv_loader.rs
@@ -140,7 +140,7 @@ mod tests {
     use nvisy_core::media::{DocumentType, SpreadsheetFormat};
 
     use super::*;
-    use crate::handler::{Handler, TextHandler};
+    use crate::handler::{Handler, TabularHandler};
 
     fn content_from_str(s: &str) -> ContentData {
         ContentData::new(ContentSource::new(), Bytes::from(s.to_owned()))
diff --git a/crates/nvisy-codec/src/handler/tabular/mod.rs b/crates/nvisy-codec/src/handler/tabular/mod.rs
new file mode 100644
index 00000000..95712cf8
--- /dev/null
+++ b/crates/nvisy-codec/src/handler/tabular/mod.rs
@@ -0,0 +1,64 @@
+//! Tabular (spreadsheet) handlers and capability trait.
+//!
+//! Tabular handlers address content by cell coordinate
+//! ([`TabularLocation`] = row + column, optionally with intra-cell
+//! byte offsets), distinct from text handlers that address content by
+//! byte offset in a serialized stream. CSV decodes into a handler
+//! that implements **both** capabilities — the same parsed rows are
+//! readable either by byte offset (as text) or by `(row, col)` (as a
+//! cell). XLSX decodes into a handler that implements **only** the
+//! tabular capability — the underlying ZIP-of-XML structure does not
+//! map to flat byte offsets.
+//!
+//! [`TabularLocation`]: nvisy_ontology::entity::TabularLocation
+
+use nvisy_core::Error;
+use nvisy_ontology::entity::TabularLocation;
+
+use super::Handler;
+use crate::document::LocationStream;
+use crate::handler::TextData;
+use crate::transform::{Redactions, TabularRedaction};
+
+mod csv_handler;
+mod csv_loader;
+mod tabular_handler;
+mod xlsx_handler;
+mod xlsx_loader;
+
+pub use self::csv_handler::{CsvData, CsvHandler};
+pub use self::csv_loader::{CsvLoader, CsvParams};
+pub use self::tabular_handler::BoxedTabularHandler;
+pub use self::xlsx_handler::XlsxHandler;
+pub use self::xlsx_loader::{XlsxLoader, XlsxParams};
+
+/// Capability trait for handlers that expose content by cell coordinate.
+///
+/// Handlers expose tabular content as a stream of
+/// [`TabularLocation`]s identifying individual cells, with explicit
+/// `read` calls to fetch a cell's value as [`TextData`], and a
+/// `redact` call that applies a batch of [`TabularRedaction`]s
+/// grouped by cell.
+#[async_trait::async_trait]
+pub trait TabularHandler: Handler {
+    /// Async stream of [`TabularLocation`]s for this document, each
+    /// tagged with the handler's [`ContentSource`].
+    ///
+    /// [`ContentSource`]: nvisy_core::content::ContentSource
+    fn locations(&self) -> LocationStream<'_, TabularLocation>;
+
+    /// Read the cell value at the given location as text.
+    ///
+    /// Returns `None` if the location is out of bounds.
+    async fn read(&self, location: &TabularLocation) -> Option<TextData>;
+
+    /// Apply a batch of redactions grouped by [`TabularLocation`].
+    ///
+    /// Cell identity is supplied by the [`Redactions`] collection's
+    /// keys; each redaction within a cell carries intra-cell byte
+    /// offsets that the handler maps onto its own cell value.
+    async fn redact(
+        &mut self,
+        redactions: Redactions<TabularLocation, TabularRedaction>,
+    ) -> Result<(), Error>;
+}
diff --git a/crates/nvisy-codec/src/handler/tabular/tabular_handler.rs b/crates/nvisy-codec/src/handler/tabular/tabular_handler.rs
new file mode 100644
index 00000000..dab555f2
--- /dev/null
+++ b/crates/nvisy-codec/src/handler/tabular/tabular_handler.rs
@@ -0,0 +1,75 @@
+//! [`BoxedTabularHandler`]: type-erased wrapper over all tabular handler types.
+
+use std::fmt;
+
+use nvisy_core::Error;
+use nvisy_core::content::{ContentData, ContentSource};
+use nvisy_core::media::DocumentType;
+use nvisy_ontology::entity::TabularLocation;
+
+use super::TabularHandler;
+use crate::document::LocationStream;
+use crate::handler::{CsvHandler, Handler, TextData, XlsxHandler};
+use crate::transform::{Redactions, TabularRedaction};
+
+/// A type-erased tabular handler backed by a boxed trait object.
+pub struct BoxedTabularHandler(Box<dyn TabularHandler>);
+
+impl BoxedTabularHandler {
+    /// Wrap any concrete tabular handler.
+    pub fn new(handler: impl TabularHandler + 'static) -> Self {
+        Self(Box::new(handler))
+    }
+}
+
+impl fmt::Debug for BoxedTabularHandler {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        f.debug_tuple("BoxedTabularHandler")
+            .field(&self.0.document_type())
+            .finish()
+    }
+}
+
+impl Handler for BoxedTabularHandler {
+    fn document_type(&self) -> DocumentType {
+        self.0.document_type()
+    }
+
+    fn source(&self) -> ContentSource {
+        self.0.source()
+    }
+
+    fn encode(&self) -> Result<ContentData, Error> {
+        self.0.encode()
+    }
+}
+
+#[async_trait::async_trait]
+impl TabularHandler for BoxedTabularHandler {
+    fn locations(&self) -> LocationStream<'_, TabularLocation> {
+        self.0.locations()
+    }
+
+    async fn read(&self, location: &TabularLocation) -> Option<TextData> {
+        self.0.read(location).await
+    }
+
+    async fn redact(
+        &mut self,
+        redactions: Redactions<TabularLocation, TabularRedaction>,
+    ) -> Result<(), Error> {
+        self.0.redact(redactions).await
+    }
+}
+
+impl From<CsvHandler> for BoxedTabularHandler {
+    fn from(h: CsvHandler) -> Self {
+        Self::new(h)
+    }
+}
+
+impl From<XlsxHandler> for BoxedTabularHandler {
+    fn from(h: XlsxHandler) -> Self {
+        Self::new(h)
+    }
+}
diff --git a/crates/nvisy-codec/src/handler/text/xlsx_handler.rs b/crates/nvisy-codec/src/handler/tabular/xlsx_handler.rs
similarity index 64%
rename from crates/nvisy-codec/src/handler/text/xlsx_handler.rs
rename to crates/nvisy-codec/src/handler/tabular/xlsx_handler.rs
index ac6d0e92..3af2d881 100644
--- a/crates/nvisy-codec/src/handler/text/xlsx_handler.rs
+++ b/crates/nvisy-codec/src/handler/tabular/xlsx_handler.rs
@@ -1,14 +1,20 @@
 //! XLSX handler (stub: awaiting full spreadsheet support).
+//!
+//! Implements [`TabularHandler`] only — the underlying ZIP-of-XML
+//! structure does not map to flat byte offsets, so the handler does
+//! not implement [`TextHandler`].
+//!
+//! [`TabularHandler`]: crate::handler::TabularHandler
+//! [`TextHandler`]: crate::handler::TextHandler
 
 use nvisy_core::Error;
 use nvisy_core::content::{ContentData, ContentSource};
 use nvisy_core::media::{DocumentType, SpreadsheetFormat};
-use nvisy_ontology::entity::TextLocation;
+use nvisy_ontology::entity::TabularLocation;
 
 use crate::document::LocationStream;
-use crate::handler::text::TextData;
-use crate::handler::{Handler, TextHandler};
-use crate::transform::{Redactions, TextRedaction};
+use crate::handler::{Handler, TabularHandler, TextData};
+use crate::transform::{Redactions, TabularRedaction};
 
 #[derive(Debug, Default)]
 pub struct XlsxHandler {
@@ -47,18 +53,18 @@ impl Handler for XlsxHandler {
 }
 
 #[async_trait::async_trait]
-impl TextHandler for XlsxHandler {
-    fn locations(&self) -> LocationStream<'_, TextLocation> {
+impl TabularHandler for XlsxHandler {
+    fn locations(&self) -> LocationStream<'_, TabularLocation> {
         LocationStream::empty()
     }
 
-    async fn read(&self, _location: &TextLocation) -> Option<TextData> {
+    async fn read(&self, _location: &TabularLocation) -> Option<TextData> {
         None
     }
 
     async fn redact(
         &mut self,
-        _redactions: Redactions<TextLocation, TextRedaction>,
+        _redactions: Redactions<TabularLocation, TabularRedaction>,
     ) -> Result<(), Error> {
         Ok(())
     }
diff --git a/crates/nvisy-codec/src/handler/text/xlsx_loader.rs b/crates/nvisy-codec/src/handler/tabular/xlsx_loader.rs
similarity index 100%
rename from crates/nvisy-codec/src/handler/text/xlsx_loader.rs
rename to crates/nvisy-codec/src/handler/tabular/xlsx_loader.rs
diff --git a/crates/nvisy-codec/src/handler/text/csv_handler.rs b/crates/nvisy-codec/src/handler/text/csv_handler.rs
deleted file mode 100644
index 67c60ba1..00000000
--- a/crates/nvisy-codec/src/handler/text/csv_handler.rs
+++ /dev/null
@@ -1,512 +0,0 @@
-//! CSV handler: holds parsed CSV content and provides location-based
-//! access via [`Handler`] + [`TextHandler`].
-//!
-//! [`TextHandler::locations`] yields one location per cell, ordered
-//! header-then-row-major. Each location's byte offsets address the
-//! field in the **serialized** CSV form (quoted/escaped if necessary).
-//! [`TextHandler::read`] returns the unescaped cell value.
-
-use nvisy_core::Error;
-use nvisy_core::content::{ContentData, ContentSource};
-use nvisy_core::media::{DocumentType, SpreadsheetFormat};
-use nvisy_ontology::entity::TextLocation;
-
-use crate::document::{Located, LocationStream};
-use crate::handler::text::TextData;
-use crate::handler::{Handler, TextHandler};
-use crate::transform::{Redactions, TextRedaction, apply_text_redactions};
-
-const TARGET: &str = "csv-handler";
-
-/// Parsed CSV content.
-#[derive(Debug, Clone)]
-pub struct CsvData {
-    /// Column headers, if present.
-    pub headers: Option<Vec<String>>,
-    /// Data rows (excluding the header row).
-    pub rows: Vec<Vec<String>>,
-    /// Field delimiter byte (e.g. `b','`, `b'\t'`, `b';'`).
-    pub delimiter: u8,
-    /// Whether the original source had a trailing newline.
-    pub trailing_newline: bool,
-}
-
-/// Handler for loaded CSV content.
-#[derive(Debug)]
-pub struct CsvHandler {
-    source: ContentSource,
-    data: CsvData,
-}
-
-/// A located CSV cell with structural identity and byte offsets.
-struct CellLocation {
-    is_header: bool,
-    row: usize,
-    col: usize,
-    value: String,
-    start: usize,
-    end: usize,
-    line_number: u32,
-}
-
-impl Handler for CsvHandler {
-    fn document_type(&self) -> DocumentType {
-        DocumentType::Spreadsheet(SpreadsheetFormat::Csv)
-    }
-
-    fn source(&self) -> ContentSource {
-        self.source
-    }
-
-    #[tracing::instrument(name = "csv.encode", skip_all, fields(output_bytes))]
-    fn encode(&self) -> Result<ContentData, Error> {
-        let bytes = self.serialize_bytes()?;
-        tracing::Span::current().record("output_bytes", bytes.len());
-        let source = ContentSource::new().with_parent(&self.source);
-        Ok(ContentData::new(source, bytes.into()))
-    }
-}
-
-#[async_trait::async_trait]
-impl TextHandler for CsvHandler {
-    fn locations(&self) -> LocationStream<'_, TextLocation> {
-        let source = self.source;
-        let cells = self.locate_cells();
-        let items: Vec<_> = cells
-            .into_iter()
-            .map(|c| {
-                Located::new(
-                    source,
-                    TextLocation {
-                        start_offset: c.start,
-                        end_offset: c.end,
-                        line_number: Some(c.line_number),
-                        ..Default::default()
-                    },
-                )
-            })
-            .collect();
-        LocationStream::new(futures::stream::iter(items))
-    }
-
-    async fn read(&self, location: &TextLocation) -> Option<TextData> {
-        self.locate_cells()
-            .into_iter()
-            .find(|c| c.start == location.start_offset && c.end == location.end_offset)
-            .map(|c| TextData::from(c.value))
-    }
-
-    async fn redact(
-        &mut self,
-        redactions: Redactions<TextLocation, TextRedaction>,
-    ) -> Result<(), Error> {
-        if redactions.is_empty() {
-            return Ok(());
-        }
-        let cells = self.locate_cells();
-
-        let mut updates: Vec<(bool, usize, usize, String)> = Vec::new();
-        for (loc, items) in redactions {
-            let Some(cell) = cells
-                .iter()
-                .find(|c| c.start == loc.start_offset && c.end == loc.end_offset)
-            else {
-                continue;
-            };
-            let mut value = cell.value.clone();
-            apply_text_redactions(&mut value, &items, TARGET)?;
-            updates.push((cell.is_header, cell.row, cell.col, value));
-        }
-
-        for (is_header, row, col, new_value) in updates {
-            if is_header {
-                let headers = self
-                    .data
-                    .headers
-                    .as_mut()
-                    .ok_or_else(|| Error::validation("no headers to edit", TARGET))?;
-                headers[col] = new_value;
-            } else {
-                let row_vec = self.data.rows.get_mut(row).ok_or_else(|| {
-                    Error::validation(format!("row {row} out of bounds"), TARGET)
-                })?;
-                let target = row_vec.get_mut(col).ok_or_else(|| {
-                    Error::validation(
-                        format!("col {col} out of bounds in row {row}"),
-                        TARGET,
-                    )
-                })?;
-                *target = new_value;
-            }
-        }
-        Ok(())
-    }
-}
-
-impl CsvHandler {
-    /// Create a new handler from parsed CSV data.
-    pub fn new(data: CsvData) -> Self {
-        Self {
-            source: ContentSource::new(),
-            data,
-        }
-    }
-
-    /// Set the content source for lineage tracking.
-    pub fn with_source(mut self, source: ContentSource) -> Self {
-        self.source = source;
-        self
-    }
-
-    /// Column headers, if present.
-    pub fn headers(&self) -> Option<&[String]> {
-        self.data.headers.as_deref()
-    }
-
-    /// All data rows.
-    pub fn rows(&self) -> &[Vec<String>] {
-        &self.data.rows
-    }
-
-    /// Mutable access to all data rows.
-    pub fn rows_mut(&mut self) -> &mut Vec<Vec<String>> {
-        &mut self.data.rows
-    }
-
-    /// A specific cell by (row, col).
-    pub fn cell(&self, row: usize, col: usize) -> Option<&str> {
-        self.data
-            .rows
-            .get(row)
-            .and_then(|r| r.get(col))
-            .map(|s| s.as_str())
-    }
-
-    /// Number of data rows (excluding the header).
-    pub fn len(&self) -> usize {
-        self.data.rows.len()
-    }
-
-    /// Whether the document has no data rows.
-    pub fn is_empty(&self) -> bool {
-        self.data.rows.is_empty()
-    }
-
-    /// Detected field delimiter.
-    pub fn delimiter(&self) -> u8 {
-        self.data.delimiter
-    }
-
-    /// Whether the original source had a trailing newline.
-    pub fn trailing_newline(&self) -> bool {
-        self.data.trailing_newline
-    }
-
-    /// Consume the handler and return the inner [`CsvData`].
-    pub fn into_data(self) -> CsvData {
-        self.data
-    }
-
-    /// Serialize to bytes (with CRLF→LF normalization and trailing
-    /// newline handling).
-    fn serialize_bytes(&self) -> Result<Vec<u8>, Error> {
-        let mut wtr = csv::WriterBuilder::new()
-            .delimiter(self.data.delimiter)
-            .has_headers(false)
-            .from_writer(Vec::new());
-
-        if let Some(headers) = &self.data.headers {
-            wtr.write_record(headers)
-                .map_err(|e| Error::validation(format!("CSV encode error: {e}"), TARGET))?;
-        }
-        for row in &self.data.rows {
-            wtr.write_record(row)
-                .map_err(|e| Error::validation(format!("CSV encode error: {e}"), TARGET))?;
-        }
-        let mut bytes = wtr
-            .into_inner()
-            .map_err(|e| Error::validation(format!("CSV encode error: {e}"), TARGET))?;
-
-        bytes.retain(|&b| b != b'\r');
-
-        if !self.data.trailing_newline && bytes.last() == Some(&b'\n') {
-            bytes.pop();
-        }
-
-        Ok(bytes)
-    }
-
-    /// Locate all cells by serializing and finding field boundaries.
-    fn locate_cells(&self) -> Vec<CellLocation> {
-        let bytes = match self.serialize_bytes() {
-            Ok(b) => b,
-            Err(_) => return Vec::new(),
-        };
-        let text = String::from_utf8_lossy(&bytes);
-
-        let mut cells = Vec::new();
-        let has_headers = self.data.headers.is_some();
-        let mut absolute_offset = 0usize;
-
-        for (row_idx, line) in text.split('\n').enumerate() {
-            if line.is_empty() {
-                continue;
-            }
-
-            let is_header = has_headers && row_idx == 0;
-            let data_row = if is_header {
-                0
-            } else if has_headers {
-                row_idx - 1
-            } else {
-                row_idx
-            };
-            let line_num = (row_idx + 1) as u32;
-
-            let row_values = if is_header {
-                self.data.headers.as_deref().unwrap_or(&[])
-            } else {
-                self.data
-                    .rows
-                    .get(data_row)
-                    .map(|r| r.as_slice())
-                    .unwrap_or(&[])
-            };
-
-            for (col, value) in row_values.iter().enumerate() {
-                if let Some((rel_start, rel_end)) =
-                    find_field_in_line(line, self.data.delimiter, col)
-                {
-                    cells.push(CellLocation {
-                        is_header,
-                        row: data_row,
-                        col,
-                        value: value.clone(),
-                        start: absolute_offset + rel_start,
-                        end: absolute_offset + rel_end,
-                        line_number: line_num,
-                    });
-                }
-            }
-
-            absolute_offset += line.len() + 1; // +1 for the newline
-        }
-
-        cells
-    }
-}
-
-/// Find a field's byte range within a CSV line, accounting for quoting.
-fn find_field_in_line(line: &str, delimiter: u8, target_col: usize) -> Option<(usize, usize)> {
-    let mut col = 0usize;
-    let mut pos = 0usize;
-
-    while pos < line.len() && col <= target_col {
-        if col == target_col {
-            if line[pos..].starts_with('"') {
-                let content_start = pos;
-                pos += 1;
-                loop {
-                    if pos >= line.len() {
-                        break;
-                    }
-                    if line.as_bytes()[pos] == b'"' {
-                        pos += 1;
-                        if pos < line.len() && line.as_bytes()[pos] == b'"' {
-                            pos += 1;
-                        } else {
-                            break;
-                        }
-                    } else {
-                        pos += 1;
-                    }
-                }
-                return Some((content_start, pos));
-            } else {
-                let start = pos;
-                while pos < line.len()
-                    && line.as_bytes()[pos] != delimiter
-                    && line.as_bytes()[pos] != b'\n'
-                {
-                    pos += 1;
-                }
-                return Some((start, pos));
-            }
-        }
-
-        if line[pos..].starts_with('"') {
-            pos += 1;
-            loop {
-                if pos >= line.len() {
-                    break;
-                }
-                if line.as_bytes()[pos] == b'"' {
-                    pos += 1;
-                    if pos < line.len() && line.as_bytes()[pos] == b'"' {
-                        pos += 1;
-                    } else {
-                        break;
-                    }
-                } else {
-                    pos += 1;
-                }
-            }
-        } else {
-            while pos < line.len()
-                && line.as_bytes()[pos] != delimiter
-                && line.as_bytes()[pos] != b'\n'
-            {
-                pos += 1;
-            }
-        }
-
-        if pos < line.len() && line.as_bytes()[pos] == delimiter {
-            pos += 1;
-        }
-        col += 1;
-    }
-
-    None
-}
-
-#[cfg(test)]
-mod tests {
-    use futures::StreamExt;
-    use nvisy_core::Error;
-
-    use super::*;
-    use crate::transform::{ConflictPolicy, TextOutput};
-
-    fn handler_with_headers(headers: Vec<&str>, rows: Vec<Vec<&str>>) -> CsvHandler {
-        CsvHandler::new(CsvData {
-            headers: Some(headers.into_iter().map(String::from).collect()),
-            rows: rows
-                .into_iter()
-                .map(|r| r.into_iter().map(String::from).collect())
-                .collect(),
-            delimiter: b',',
-            trailing_newline: true,
-        })
-    }
-
-    fn handler_no_headers(rows: Vec<Vec<&str>>) -> CsvHandler {
-        CsvHandler::new(CsvData {
-            headers: None,
-            rows: rows
-                .into_iter()
-                .map(|r| r.into_iter().map(String::from).collect())
-                .collect(),
-            delimiter: b',',
-            trailing_newline: true,
-        })
-    }
-
-    #[tokio::test]
-    async fn locations_with_headers() {
-        let h = handler_with_headers(
-            vec!["name", "age"],
-            vec![vec!["Alice", "30"], vec!["Bob", "25"]],
-        );
-        let items: Vec<_> = h.locations().collect().await;
-        assert_eq!(items.len(), 6);
-    }
-
-    #[tokio::test]
-    async fn locations_no_headers() {
-        let h = handler_no_headers(vec![vec!["x", "y"], vec!["1", "2"]]);
-        let items: Vec<_> = h.locations().collect().await;
-        assert_eq!(items.len(), 4);
-    }
-
-    #[tokio::test]
-    async fn redact_cell() -> Result<(), Error> {
-        let mut h = handler_with_headers(vec!["ssn"], vec![vec!["123-45-6789"]]);
-        let items: Vec<_> = h.locations().collect().await;
-        let data_loc = items[1].location.clone();
-        let mut rs = Redactions::new(ConflictPolicy::Reject);
-        rs.try_insert(
-            data_loc,
-            TextRedaction::new(0, 11, TextOutput::replace("[REDACTED]")),
-        )
-        .unwrap();
-        h.redact(rs).await?;
-        assert_eq!(h.cell(0, 0), Some("[REDACTED]"));
-        Ok(())
-    }
-
-    #[tokio::test]
-    async fn redact_header() -> Result<(), Error> {
-        let mut h = handler_with_headers(vec!["secret_field"], vec![vec!["value"]]);
-        let items: Vec<_> = h.locations().collect().await;
-        let header_loc = items[0].location.clone();
-        let mut rs = Redactions::new(ConflictPolicy::Reject);
-        rs.try_insert(
-            header_loc,
-            TextRedaction::new(0, 12, TextOutput::replace("redacted")),
-        )
-        .unwrap();
-        h.redact(rs).await?;
-        assert_eq!(h.headers(), Some(["redacted".to_string()].as_slice()));
-        Ok(())
-    }
-
-    #[tokio::test]
-    async fn read_returns_cell() {
-        let h = handler_with_headers(vec!["name"], vec![vec!["Alice"]]);
-        let items: Vec<_> = h.locations().collect().await;
-        assert_eq!(
-            h.read(&items[1].location).await.unwrap().as_str(),
-            "Alice"
-        );
-    }
-
-    #[tokio::test]
-    async fn quoted_field_offsets_correct() {
-        let h = handler_with_headers(vec!["bio"], vec![vec!["has, comma"]]);
-        let items: Vec<_> = h.locations().collect().await;
-        // Header + data cell.
-        assert_eq!(items.len(), 2);
-        let data_loc = &items[1].location;
-        assert!(data_loc.end_offset > data_loc.start_offset);
-        assert_eq!(h.read(data_loc).await.unwrap().as_str(), "has, comma");
-    }
-
-    #[tokio::test]
-    async fn empty_data_with_headers() {
-        let h = handler_with_headers(vec!["a", "b"], vec![]);
-        let items: Vec<_> = h.locations().collect().await;
-        assert_eq!(items.len(), 2);
-    }
-
-    #[test]
-    fn encode_with_headers() -> Result<(), Error> {
-        let h = handler_with_headers(
-            vec!["name", "age"],
-            vec![vec!["Alice", "30"], vec!["Bob", "25"]],
-        );
-        let content = h.encode()?;
-        assert_eq!(
-            content.as_str().expect("valid utf-8"),
-            "name,age\nAlice,30\nBob,25\n"
-        );
-        Ok(())
-    }
-
-    #[test]
-    fn encode_with_quoting() -> Result<(), Error> {
-        let h = handler_with_headers(vec!["name", "bio"], vec![vec!["Alice", "Has a, comma"]]);
-        let content = h.encode()?;
-        let text = content.as_str().expect("valid utf-8");
-        assert!(text.contains("\"Has a, comma\""));
-        Ok(())
-    }
-
-    #[test]
-    fn encode_without_trailing_newline() -> Result<(), Error> {
-        let mut h = handler_with_headers(vec!["a"], vec![vec!["1"]]);
-        h.data.trailing_newline = false;
-        let content = h.encode()?;
-        assert_eq!(content.as_str().expect("valid utf-8"), "a\n1");
-        Ok(())
-    }
-}
diff --git a/crates/nvisy-codec/src/handler/text/mod.rs b/crates/nvisy-codec/src/handler/text/mod.rs
index f507c67d..64cd2c98 100644
--- a/crates/nvisy-codec/src/handler/text/mod.rs
+++ b/crates/nvisy-codec/src/handler/text/mod.rs
@@ -7,8 +7,6 @@ use super::Handler;
 use crate::document::LocationStream;
 use crate::transform::{Redactions, TextRedaction};
 
-mod csv_handler;
-mod csv_loader;
 #[cfg(feature = "html")]
 mod html_handler;
 #[cfg(feature = "html")]
@@ -20,11 +18,7 @@ mod text_data;
 mod text_handler;
 mod txt_handler;
 mod txt_loader;
-mod xlsx_handler;
-mod xlsx_loader;
 
-pub use self::csv_handler::{CsvData, CsvHandler};
-pub use self::csv_loader::{CsvLoader, CsvParams};
 #[cfg(feature = "html")]
 pub use self::html_handler::{HtmlData, HtmlHandler};
 #[cfg(feature = "html")]
@@ -36,8 +30,6 @@ pub use self::text_data::TextData;
 pub use self::text_handler::BoxedTextHandler;
 pub use self::txt_handler::TxtHandler;
 pub use self::txt_loader::{TxtLoader, TxtParams};
-pub use self::xlsx_handler::XlsxHandler;
-pub use self::xlsx_loader::{XlsxLoader, XlsxParams};
 
 /// Capability trait for handlers that expose text content.
 ///
diff --git a/crates/nvisy-codec/src/handler/text/text_handler.rs b/crates/nvisy-codec/src/handler/text/text_handler.rs
index bad0fe7e..f690cfef 100644
--- a/crates/nvisy-codec/src/handler/text/text_handler.rs
+++ b/crates/nvisy-codec/src/handler/text/text_handler.rs
@@ -76,8 +76,8 @@ macro_rules! impl_from_text_handler {
     };
 }
 
-use super::{CsvHandler, JsonHandler, TxtHandler, XlsxHandler};
-impl_from_text_handler!(TxtHandler, CsvHandler, JsonHandler, XlsxHandler);
+use super::{JsonHandler, TxtHandler};
+impl_from_text_handler!(TxtHandler, JsonHandler);
 
 #[cfg(feature = "html")]
 use super::HtmlHandler;
diff --git a/crates/nvisy-codec/src/transform/mod.rs b/crates/nvisy-codec/src/transform/mod.rs
index eee4a1a9..c4f7db44 100644
--- a/crates/nvisy-codec/src/transform/mod.rs
+++ b/crates/nvisy-codec/src/transform/mod.rs
@@ -26,6 +26,7 @@ pub use self::image::{ImageOutput, ImageRedaction};
 pub use self::mergeable::Mergeable;
 pub use self::policy::{ConflictPolicy, InsertError};
 pub use self::redactions::Redactions;
+pub(crate) use self::tabular::apply_tabular_redactions;
 pub use self::tabular::TabularRedaction;
 pub(crate) use self::text::apply_text_redactions;
 pub use self::text::{TextOutput, TextRedaction};
diff --git a/crates/nvisy-codec/src/transform/tabular/apply.rs b/crates/nvisy-codec/src/transform/tabular/apply.rs
new file mode 100644
index 00000000..719e0375
--- /dev/null
+++ b/crates/nvisy-codec/src/transform/tabular/apply.rs
@@ -0,0 +1,102 @@
+//! Byte-level helper for applying a batch of [`TabularRedaction`]s to a
+//! single cell's value in place.
+
+use std::cmp::Reverse;
+
+use nvisy_core::Error;
+
+use super::instruction::TabularRedaction;
+
+/// Apply a slice of cell-scoped redactions to `cell` in place.
+///
+/// Redactions are sorted right-to-left so earlier byte offsets stay
+/// valid as later ones are replaced. Returns an error if any offset
+/// falls mid-character.
+///
+/// The slice must not contain overlapping ranges — that invariant is
+/// owned by [`Redactions`] on insert.
+///
+/// [`Redactions`]: crate::transform::Redactions
+pub(crate) fn apply_tabular_redactions(
+    cell: &mut String,
+    redactions: &[TabularRedaction],
+    target: &'static str,
+) -> Result<(), Error> {
+    let mut items: Vec<&TabularRedaction> = redactions.iter().collect();
+    items.sort_by_key(|r| Reverse(r.start));
+
+    for r in items {
+        let value = r.output.replacement_value().unwrap_or_default();
+        let s = r.start.min(cell.len());
+        let e = r.end.min(cell.len());
+        if s >= e {
+            continue;
+        }
+        if !cell.is_char_boundary(s) || !cell.is_char_boundary(e) {
+            return Err(Error::validation(
+                format!(
+                    "redaction offset falls mid-character \
+                     (start={}, end={}, len={})",
+                    r.start,
+                    r.end,
+                    cell.len()
+                ),
+                target,
+            ));
+        }
+        cell.replace_range(s..e, value);
+    }
+
+    Ok(())
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::transform::TextOutput;
+
+    fn redaction(start: usize, end: usize, replacement: &str) -> TabularRedaction {
+        TabularRedaction::new(start, end, TextOutput::replace(replacement))
+    }
+
+    #[test]
+    fn single_replacement() {
+        let mut s = String::from("hello world");
+        apply_tabular_redactions(&mut s, &[redaction(0, 5, "[X]")], "test").unwrap();
+        assert_eq!(s, "[X] world");
+    }
+
+    #[test]
+    fn right_to_left_application() {
+        let mut s = String::from("aaa bbb ccc");
+        let rs = vec![redaction(0, 3, "[A]"), redaction(8, 11, "[C]")];
+        apply_tabular_redactions(&mut s, &rs, "test").unwrap();
+        assert_eq!(s, "[A] bbb [C]");
+    }
+
+    #[test]
+    fn remove_output() {
+        let mut s = String::from("hello world");
+        apply_tabular_redactions(
+            &mut s,
+            &[TabularRedaction::new(5, 11, TextOutput::Remove)],
+            "test",
+        )
+        .unwrap();
+        assert_eq!(s, "hello");
+    }
+
+    #[test]
+    fn out_of_bounds_clipped() {
+        let mut s = String::from("short");
+        apply_tabular_redactions(&mut s, &[redaction(0, 999, "[X]")], "test").unwrap();
+        assert_eq!(s, "[X]");
+    }
+
+    #[test]
+    fn mid_character_rejected() {
+        let mut s = String::from("héllo"); // 'é' is 2 bytes
+        let err = apply_tabular_redactions(&mut s, &[redaction(0, 2, "[X]")], "test").unwrap_err();
+        assert!(err.to_string().contains("mid-character"));
+    }
+}
diff --git a/crates/nvisy-codec/src/transform/tabular/mod.rs b/crates/nvisy-codec/src/transform/tabular/mod.rs
index 9465c8c0..c23ae21c 100644
--- a/crates/nvisy-codec/src/transform/tabular/mod.rs
+++ b/crates/nvisy-codec/src/transform/tabular/mod.rs
@@ -1,5 +1,7 @@
 //! Tabular redaction primitives.
 
+mod apply;
 mod instruction;
 
+pub(crate) use self::apply::apply_tabular_redactions;
 pub use self::instruction::TabularRedaction;
diff --git a/crates/nvisy-engine/src/operation/envelope/document.rs b/crates/nvisy-engine/src/operation/envelope/document.rs
index cb114457..fda04469 100644
--- a/crates/nvisy-engine/src/operation/envelope/document.rs
+++ b/crates/nvisy-engine/src/operation/envelope/document.rs
@@ -10,14 +10,16 @@ use std::fmt;
 use futures::StreamExt;
 use nvisy_codec::handler::{AudioData, ImageData, TextData};
 use nvisy_codec::transform::{
-    AudioRedaction, ImageRedaction, Redactions, TextRedaction,
+    AudioRedaction, ImageRedaction, Redactions, TabularRedaction, TextRedaction,
 };
 use nvisy_codec::{ContentHandle, Located};
 use nvisy_core::Error;
 use nvisy_core::content::{ContentData, ContentMetadata, ContentSource};
 use nvisy_core::media::DocumentType;
 use nvisy_ontology::artifacts::ContentArtifacts;
-use nvisy_ontology::entity::{AudioLocation, ImageLocation, Location, TextLocation};
+use nvisy_ontology::entity::{
+    AudioLocation, ImageLocation, Location, TabularLocation, TextLocation,
+};
 
 /// Engine-level document combining content, metadata, and artifacts.
 ///
@@ -39,6 +41,7 @@ impl Document {
     pub fn new(handle: ContentHandle, metadata: ContentMetadata) -> Self {
         let artifacts = match &handle {
             ContentHandle::Text(_) => ContentArtifacts::text(),
+            ContentHandle::Tabular(_) => ContentArtifacts::tabular(),
             ContentHandle::Image(_) => ContentArtifacts::image(),
             ContentHandle::Audio(_) => ContentArtifacts::audio(),
             ContentHandle::Rich(_) => ContentArtifacts::rich(),
@@ -70,6 +73,11 @@ impl Document {
         self.handle.text_locations().collect().await
     }
 
+    /// Collect all tabular (cell) locations into a `Vec`.
+    pub async fn collect_tabular_locations(&self) -> Vec<Located<TabularLocation>> {
+        self.handle.tabular_locations().collect().await
+    }
+
     /// Collect all image locations into a `Vec`.
     pub async fn collect_image_locations(&self) -> Vec<Located<ImageLocation>> {
         self.handle.image_locations().collect().await
@@ -85,6 +93,11 @@ impl Document {
         self.handle.read_text(location).await
     }
 
+    /// Read the cell value at the given tabular location.
+    pub async fn read_tabular(&self, location: &TabularLocation) -> Option<TextData> {
+        self.handle.read_tabular(location).await
+    }
+
     /// Read the image data at the given image location.
     pub async fn read_image(&self, location: &ImageLocation) -> Option<ImageData> {
         self.handle.read_image(location).await
@@ -103,17 +116,15 @@ impl Document {
     pub async fn value_at(&self, location: &Location) -> Option<String> {
         match location {
             Location::Text(loc) => self.read_text(loc).await.map(TextData::into_inner),
+            Location::Tabular(loc) => self.read_tabular(loc).await.map(TextData::into_inner),
             Location::Audio(_) => self
                 .artifacts
                 .as_audio()
                 .and_then(|a| a.transcription.as_ref())
                 .map(|t| t.text()),
-            // Tabular locations are currently surfaced through the
-            // underlying TextHandler; per-cell extraction would need a
-            // (row, col) → byte-offset bridge that the engine no longer
-            // owns. Image OCR results are multi-region; per-location
-            // lookup is not yet implemented.
-            Location::Tabular(_) | Location::Image(_) => None,
+            // Image OCR results are multi-region; per-location lookup
+            // is not yet implemented.
+            Location::Image(_) => None,
             _ => None,
         }
     }
@@ -126,6 +137,14 @@ impl Document {
         self.handle.apply_text_redactions(redactions).await
     }
 
+    /// Apply a batch of tabular redactions to the document.
+    pub async fn apply_tabular_redactions(
+        &mut self,
+        redactions: Redactions<TabularLocation, TabularRedaction>,
+    ) -> Result<(), Error> {
+        self.handle.apply_tabular_redactions(redactions).await
+    }
+
     /// Apply a batch of image redactions to the document.
     pub async fn apply_image_redactions(
         &mut self,
@@ -162,4 +181,5 @@ impl Document {
         let handle = ContentHandle::decode(&content).await.expect("decode text");
         Self::new(handle, meta)
     }
+
 }
diff --git a/crates/nvisy-engine/src/operation/extraction/mod.rs b/crates/nvisy-engine/src/operation/extraction/mod.rs
index 16115f9d..fefb0f90 100644
--- a/crates/nvisy-engine/src/operation/extraction/mod.rs
+++ b/crates/nvisy-engine/src/operation/extraction/mod.rs
@@ -76,10 +76,10 @@ impl Operation for ExtractionOp {
                     op.execute(envelope).await?;
                 }
             }
-            ContentHandle::Text(_) => {
-                // Text documents are already structured text — no
-                // extraction needed. Future: whitespace normalization.
-                tracing::debug!(target: TARGET, "text document, no extraction needed");
+            ContentHandle::Text(_) | ContentHandle::Tabular(_) => {
+                // Text and tabular documents are already structured —
+                // no extraction needed. Future: whitespace normalization.
+                tracing::debug!(target: TARGET, "structured document, no extraction needed");
             }
         }
         Ok(())
diff --git a/crates/nvisy-engine/src/operation/redaction/apply.rs b/crates/nvisy-engine/src/operation/redaction/apply.rs
index 38f76d21..59d46164 100644
--- a/crates/nvisy-engine/src/operation/redaction/apply.rs
+++ b/crates/nvisy-engine/src/operation/redaction/apply.rs
@@ -10,11 +10,11 @@ use std::collections::HashMap;
 
 use nvisy_codec::transform::{
     AudioOutput, AudioRedaction, ConflictPolicy, ImageOutput, ImageRedaction, Redactions,
-    TextOutput, TextRedaction,
+    TabularRedaction, TextOutput, TextRedaction,
 };
 use nvisy_core::{Error, Result};
 use nvisy_ontology::entity::{
-    AudioLocation, Entity, EntityKind, ImageLocation, Location, TextLocation,
+    AudioLocation, Entity, EntityKind, ImageLocation, Location, TabularLocation, TextLocation,
 };
 use nvisy_ontology::policy::{AudioStrategy, ImageStrategy, Strategy, TextStrategy};
 use sha2::{Digest, Sha256};
@@ -24,9 +24,6 @@ use crate::operation::DocumentEnvelope;
 
 const TARGET: &str = "nvisy_engine::op::redaction::apply";
 
-const IMAGE_REDACTED: &str = "[IMAGE_REDACTED]";
-const AUDIO_REDACTED: &str = "[AUDIO_REDACTED]";
-
 /// Builds and applies redaction instructions across all modalities.
 ///
 /// Holds `&mut DocumentEnvelope` and iterates `audit.entries` to build
@@ -43,13 +40,23 @@ impl<'a> RedactionApplicator<'a> {
 
     /// Build and apply all redaction instructions.
     pub async fn apply(mut self) -> Result<()> {
-        let text = self.build_text_redactions().await?;
-        let image = self.build_image_redactions()?;
-        let audio = self.build_audio_redactions()?;
+        let entity_map = entity_map(&self.envelope.audit.entities);
+        let mut mapping_index = mapping_index(&self.envelope.redaction_map.entries);
+
+        let text = self.build_text_redactions(&entity_map, &mut mapping_index).await?;
+        let tabular = self.build_tabular_redactions(&entity_map, &mut mapping_index).await?;
+        let image = self.build_image_redactions(&entity_map, &mut mapping_index)?;
+        let audio = self.build_audio_redactions(&entity_map, &mut mapping_index)?;
 
         if !text.is_empty() {
             self.envelope.document.apply_text_redactions(text).await?;
         }
+        if !tabular.is_empty() {
+            self.envelope
+                .document
+                .apply_tabular_redactions(tabular)
+                .await?;
+        }
         if !image.is_empty() {
             self.envelope.document.apply_image_redactions(image).await?;
         }
@@ -62,20 +69,23 @@ impl<'a> RedactionApplicator<'a> {
 
     async fn build_text_redactions(
         &mut self,
+        entity_map: &HashMap<Uuid, Entity>,
+        mapping_index: &mut HashMap<Uuid, usize>,
     ) -> Result<Redactions<TextLocation, TextRedaction>> {
-        let entity_map = Self::entity_map(&self.envelope.audit.entities);
         let mut redactions = Redactions::new(ConflictPolicy::Reject);
 
         for i in 0..self.envelope.audit.entries.len() {
             let record = &self.envelope.audit.entries[i];
-            let entity = match entity_map.get(&record.entity_id) {
-                Some(e) => *e,
-                None => continue,
+            let Some(entity) = entity_map.get(&record.entity_id) else {
+                continue;
             };
-
             let Location::Text(ref loc) = entity.location else {
                 continue;
             };
+            let Strategy::Text(ref strategy) = record.redaction.strategy else {
+                log_modality_mismatch(entity.id, "text", &record.redaction.strategy);
+                continue;
+            };
 
             let value = self
                 .envelope
@@ -85,23 +95,13 @@ impl<'a> RedactionApplicator<'a> {
                 .map(|d| d.into_inner())
                 .unwrap_or_default();
 
-            let output = match &record.redaction.strategy {
-                Strategy::Text(text) => Self::text_output(&value, entity, text),
-                _ => continue,
-            };
-
+            let output = text_output(&value, entity, strategy);
             let entity_id = record.entity_id;
-
             let replacement = output.replacement_value().map(String::from);
+
             self.envelope.audit.entries[i].value.replacement = replacement.clone();
-            if let Some(mapping) = self
-                .envelope
-                .redaction_map
-                .entries
-                .iter_mut()
-                .find(|m| m.entity_id == entity_id)
-            {
-                mapping.replacement = replacement;
+            if let Some(&idx) = mapping_index.get(&entity_id) {
+                self.envelope.redaction_map.entries[idx].replacement = replacement;
             }
 
             tracing::trace!(
@@ -112,16 +112,72 @@ impl<'a> RedactionApplicator<'a> {
                 "built text redaction instruction",
             );
 
-            // The entity location identifies the span; start/end are
-            // intra-span offsets (0..len for full value replacement).
             redactions
                 .try_insert(
                     loc.clone(),
                     TextRedaction::new(loc.start_offset, loc.end_offset, output),
                 )
-                .map_err(|e| {
-                    Error::validation(e.to_string(), "redaction-apply-text")
-                })?;
+                .map_err(|e| Error::validation(e.to_string(), "redaction-apply-text"))?;
+        }
+
+        Ok(redactions)
+    }
+
+    async fn build_tabular_redactions(
+        &mut self,
+        entity_map: &HashMap<Uuid, Entity>,
+        mapping_index: &mut HashMap<Uuid, usize>,
+    ) -> Result<Redactions<TabularLocation, TabularRedaction>> {
+        let mut redactions = Redactions::new(ConflictPolicy::Reject);
+
+        for i in 0..self.envelope.audit.entries.len() {
+            let record = &self.envelope.audit.entries[i];
+            let Some(entity) = entity_map.get(&record.entity_id) else {
+                continue;
+            };
+            let Location::Tabular(ref loc) = entity.location else {
+                continue;
+            };
+            let Strategy::Text(ref strategy) = record.redaction.strategy else {
+                log_modality_mismatch(entity.id, "tabular", &record.redaction.strategy);
+                continue;
+            };
+
+            let value = self
+                .envelope
+                .document
+                .read_tabular(loc)
+                .await
+                .map(|d| d.into_inner())
+                .unwrap_or_default();
+
+            let output = text_output(&value, entity, strategy);
+            let entity_id = record.entity_id;
+            let replacement = output.replacement_value().map(String::from);
+
+            self.envelope.audit.entries[i].value.replacement = replacement.clone();
+            if let Some(&idx) = mapping_index.get(&entity_id) {
+                self.envelope.redaction_map.entries[idx].replacement = replacement;
+            }
+
+            // Intra-cell byte range: prefer explicit offsets if the
+            // entity provided them, otherwise redact the entire cell.
+            let start = loc.start_offset.unwrap_or(0);
+            let end = loc.end_offset.unwrap_or(value.len());
+
+            tracing::trace!(
+                target: TARGET,
+                %entity_id,
+                row = loc.row_index,
+                col = loc.column_index,
+                start,
+                end,
+                "built tabular redaction instruction",
+            );
+
+            redactions
+                .try_insert(loc.clone(), TabularRedaction::new(start, end, output))
+                .map_err(|e| Error::validation(e.to_string(), "redaction-apply-tabular"))?;
         }
 
         Ok(redactions)
@@ -129,45 +185,38 @@ impl<'a> RedactionApplicator<'a> {
 
     fn build_image_redactions(
         &mut self,
+        entity_map: &HashMap<Uuid, Entity>,
+        mapping_index: &mut HashMap<Uuid, usize>,
     ) -> Result<Redactions<ImageLocation, ImageRedaction>> {
-        let entity_map = Self::entity_map(&self.envelope.audit.entities);
         let mut redactions = Redactions::new(ConflictPolicy::Reject);
 
         for i in 0..self.envelope.audit.entries.len() {
             let record = &self.envelope.audit.entries[i];
-            let entity = match entity_map.get(&record.entity_id) {
-                Some(e) => *e,
-                None => continue,
+            let Some(entity) = entity_map.get(&record.entity_id) else {
+                continue;
             };
-
             let Location::Image(ref loc) = entity.location else {
                 continue;
             };
+            let Strategy::Image(ref strategy) = record.redaction.strategy else {
+                log_modality_mismatch(entity.id, "image", &record.redaction.strategy);
+                continue;
+            };
 
-            let output = match &record.redaction.strategy {
-                Strategy::Image(img) => match img {
-                    ImageStrategy::Blur { sigma } => ImageOutput::Blur { sigma: *sigma },
-                    ImageStrategy::Block { color } => ImageOutput::Block { color: *color },
-                    ImageStrategy::Pixelate { block_size } => ImageOutput::Pixelate {
-                        block_size: *block_size,
-                    },
-                    _ => continue,
-                },
-                _ => continue,
+            let Some((output, placeholder)) = image_output(strategy) else {
+                tracing::debug!(
+                    target: TARGET,
+                    entity_id = %entity.id,
+                    strategy = ?strategy,
+                    "image strategy has no codec output, skipping",
+                );
+                continue;
             };
 
             let entity_id = record.entity_id;
-            let replacement = IMAGE_REDACTED.to_string();
-
-            self.envelope.audit.entries[i].value.replacement = Some(replacement.clone());
-            if let Some(mapping) = self
-                .envelope
-                .redaction_map
-                .entries
-                .iter_mut()
-                .find(|m| m.entity_id == entity_id)
-            {
-                mapping.replacement = Some(replacement);
+            self.envelope.audit.entries[i].value.replacement = Some(placeholder.clone());
+            if let Some(&idx) = mapping_index.get(&entity_id) {
+                self.envelope.redaction_map.entries[idx].replacement = Some(placeholder);
             }
 
             tracing::trace!(
@@ -178,9 +227,7 @@ impl<'a> RedactionApplicator<'a> {
 
             redactions
                 .try_insert(loc.clone(), ImageRedaction::new(loc.bounding_box, output))
-                .map_err(|e| {
-                    Error::validation(e.to_string(), "redaction-apply-image")
-                })?;
+                .map_err(|e| Error::validation(e.to_string(), "redaction-apply-image"))?;
         }
 
         Ok(redactions)
@@ -188,42 +235,38 @@ impl<'a> RedactionApplicator<'a> {
 
     fn build_audio_redactions(
         &mut self,
+        entity_map: &HashMap<Uuid, Entity>,
+        mapping_index: &mut HashMap<Uuid, usize>,
     ) -> Result<Redactions<AudioLocation, AudioRedaction>> {
-        let entity_map = Self::entity_map(&self.envelope.audit.entities);
         let mut redactions = Redactions::new(ConflictPolicy::Reject);
 
         for i in 0..self.envelope.audit.entries.len() {
             let record = &self.envelope.audit.entries[i];
-            let entity = match entity_map.get(&record.entity_id) {
-                Some(e) => *e,
-                None => continue,
+            let Some(entity) = entity_map.get(&record.entity_id) else {
+                continue;
             };
-
             let Location::Audio(ref loc) = entity.location else {
                 continue;
             };
+            let Strategy::Audio(ref strategy) = record.redaction.strategy else {
+                log_modality_mismatch(entity.id, "audio", &record.redaction.strategy);
+                continue;
+            };
 
-            let output = match &record.redaction.strategy {
-                Strategy::Audio(audio) => match audio {
-                    AudioStrategy::Silence => AudioOutput::Silence,
-                    AudioStrategy::Remove => AudioOutput::Remove,
-                    _ => continue,
-                },
-                _ => continue,
+            let Some((output, placeholder)) = audio_output(strategy) else {
+                tracing::debug!(
+                    target: TARGET,
+                    entity_id = %entity.id,
+                    strategy = ?strategy,
+                    "audio strategy has no codec output, skipping",
+                );
+                continue;
             };
 
             let entity_id = record.entity_id;
-            let replacement = AUDIO_REDACTED.to_string();
-
-            self.envelope.audit.entries[i].value.replacement = Some(replacement.clone());
-            if let Some(mapping) = self
-                .envelope
-                .redaction_map
-                .entries
-                .iter_mut()
-                .find(|m| m.entity_id == entity_id)
-            {
-                mapping.replacement = Some(replacement);
+            self.envelope.audit.entries[i].value.replacement = Some(placeholder.clone());
+            if let Some(&idx) = mapping_index.get(&entity_id) {
+                self.envelope.redaction_map.entries[idx].replacement = Some(placeholder);
             }
 
             tracing::trace!(
@@ -236,83 +279,152 @@ impl<'a> RedactionApplicator<'a> {
 
             redactions
                 .try_insert(loc.clone(), AudioRedaction::new(loc.time_span, output))
-                .map_err(|e| {
-                    Error::validation(e.to_string(), "redaction-apply-audio")
-                })?;
+                .map_err(|e| Error::validation(e.to_string(), "redaction-apply-audio"))?;
         }
 
         Ok(redactions)
     }
+}
 
-    /// Build a lookup map from entity UUID to entity reference.
-    fn entity_map(entities: &nvisy_ontology::entity::Entities) -> HashMap<Uuid, &Entity> {
-        entities.iter().map(|e| (e.id, e)).collect()
-    }
-
-    fn text_output(value: &str, entity: &Entity, strategy: &TextStrategy) -> TextOutput {
-        match strategy {
-            TextStrategy::Mask { mask_char } => {
-                TextOutput::replace(mask_char.to_string().repeat(value.len()))
-            }
-
-            TextStrategy::Replace { placeholder } => {
-                if placeholder.is_empty() {
-                    TextOutput::replace(format!(
-                        "[{}]",
-                        entity.entity_kind.to_string().to_uppercase()
-                    ))
-                } else {
-                    TextOutput::replace(
-                        placeholder
-                            .replace("{entityType}", &entity.entity_kind.to_string())
-                            .replace("{category}", &entity.category.to_string()),
-                    )
-                }
-            }
-
-            TextStrategy::Remove => TextOutput::Remove,
-
-            TextStrategy::Hash => TextOutput::replace(Self::hash_value(value)),
+/// Build a lookup map from entity UUID to a cloned entity.
+fn entity_map(entities: &nvisy_ontology::entity::Entities) -> HashMap<Uuid, Entity> {
+    entities.iter().map(|e| (e.id, e.clone())).collect()
+}
 
-            TextStrategy::Pseudonymize => {
-                TextOutput::replace(Self::pseudonymize(&entity.entity_kind, value))
-            }
+/// Build an index from entity UUID to its position in
+/// [`RedactionMap::entries`], so per-entity mapping updates become
+/// `O(1)` instead of a linear scan per audit entry.
+///
+/// [`RedactionMap::entries`]: nvisy_ontology::provenance::RedactionMap::entries
+fn mapping_index(
+    mappings: &[nvisy_ontology::provenance::RedactionMapping],
+) -> HashMap<Uuid, usize> {
+    mappings.iter().enumerate().map(|(i, m)| (m.entity_id, i)).collect()
+}
 
-            TextStrategy::Encrypt { .. } => {
-                TextOutput::replace(format!("[ENC:{}]", entity.entity_kind))
-            }
-            TextStrategy::Tokenize { .. } => {
-                TextOutput::replace(format!("[TOKEN:{}]", entity.entity_kind))
+/// Compute the codec [`TextOutput`] for a value + entity + strategy.
+fn text_output(value: &str, entity: &Entity, strategy: &TextStrategy) -> TextOutput {
+    match strategy {
+        TextStrategy::Mask { mask_char } => {
+            // Repeat by character count, not byte length: a 2-byte
+            // grapheme like `é` should produce one mask char.
+            TextOutput::replace(mask_char.to_string().repeat(value.chars().count()))
+        }
+        TextStrategy::Replace { placeholder } => {
+            if placeholder.is_empty() {
+                TextOutput::replace(format!(
+                    "[{}]",
+                    entity.entity_kind.to_string().to_uppercase()
+                ))
+            } else {
+                TextOutput::replace(
+                    placeholder
+                        .replace("{entityType}", &entity.entity_kind.to_string())
+                        .replace("{category}", &entity.category.to_string()),
+                )
             }
-            _ => TextOutput::replace(format!("[REDACTED:{}]", entity.entity_kind)),
+        }
+        TextStrategy::Remove => TextOutput::Remove,
+        TextStrategy::Hash => TextOutput::replace(hash_value(value)),
+        TextStrategy::Pseudonymize => {
+            TextOutput::replace(pseudonymize(&entity.entity_kind, value))
+        }
+        TextStrategy::Encrypt { .. } => {
+            // TODO: real encryption — placeholder until the key vault is wired.
+            TextOutput::replace(format!("[ENC:{}]", entity.entity_kind))
+        }
+        TextStrategy::Tokenize { .. } => {
+            // TODO: real tokenization — placeholder until the vault is wired.
+            TextOutput::replace(format!("[TOKEN:{}]", entity.entity_kind))
+        }
+        // `TextStrategy` is `#[non_exhaustive]`; new variants need
+        // explicit handling. Surface a generic placeholder so the
+        // pipeline doesn't silently drop entities.
+        _ => {
+            tracing::warn!(
+                target: TARGET,
+                entity_id = %entity.id,
+                strategy = ?strategy,
+                "unhandled text strategy, using generic placeholder",
+            );
+            TextOutput::replace(format!("[REDACTED:{}]", entity.entity_kind))
         }
     }
+}
 
-    fn hash_value(value: &str) -> String {
-        let mut hasher = Sha256::new();
-        hasher.update(value.as_bytes());
-        let hash = hasher.finalize();
-        hash.iter().take(8).map(|b| format!("{b:02x}")).collect()
+/// Compute the codec [`ImageOutput`] for a strategy, paired with a
+/// human-readable placeholder for the audit trail.
+///
+/// Returns `None` when the strategy has no defined codec output.
+fn image_output(strategy: &ImageStrategy) -> Option<(ImageOutput, String)> {
+    match strategy {
+        ImageStrategy::Blur { sigma } => {
+            Some((ImageOutput::Blur { sigma: *sigma }, format!("[IMAGE_BLUR:{sigma}]")))
+        }
+        ImageStrategy::Block { color } => Some((
+            ImageOutput::Block { color: *color },
+            format!("[IMAGE_BLOCK:#{:02x}{:02x}{:02x}]", color.r, color.g, color.b),
+        )),
+        ImageStrategy::Pixelate { block_size } => Some((
+            ImageOutput::Pixelate {
+                block_size: *block_size,
+            },
+            format!("[IMAGE_PIXELATE:{block_size}]"),
+        )),
+        // `ImageStrategy` is `#[non_exhaustive]`; new variants without
+        // a defined codec output are skipped.
+        _ => None,
     }
+}
 
-    fn pseudonymize(entity_kind: &EntityKind, value: &str) -> String {
-        let mut hasher = Sha256::new();
-        hasher.update(entity_kind.to_string().as_bytes());
-        hasher.update(b":");
-        hasher.update(value.as_bytes());
-        let hash = hasher.finalize();
-        let id: u32 = u32::from_le_bytes([hash[0], hash[1], hash[2], hash[3]]);
-        format!("{entity_kind}_{id}")
+/// Compute the codec [`AudioOutput`] for a strategy, paired with a
+/// human-readable placeholder for the audit trail.
+///
+/// Returns `None` when the strategy has no defined codec output.
+fn audio_output(strategy: &AudioStrategy) -> Option<(AudioOutput, String)> {
+    match strategy {
+        AudioStrategy::Silence => Some((AudioOutput::Silence, "[AUDIO_SILENCE]".to_string())),
+        AudioStrategy::Remove => Some((AudioOutput::Remove, "[AUDIO_REMOVE]".to_string())),
+        // `AudioStrategy` is `#[non_exhaustive]`; new variants without
+        // a defined codec output are skipped.
+        _ => None,
     }
 }
 
+fn hash_value(value: &str) -> String {
+    let mut hasher = Sha256::new();
+    hasher.update(value.as_bytes());
+    let hash = hasher.finalize();
+    hash.iter().take(8).map(|b| format!("{b:02x}")).collect()
+}
+
+fn pseudonymize(entity_kind: &EntityKind, value: &str) -> String {
+    let mut hasher = Sha256::new();
+    hasher.update(entity_kind.to_string().as_bytes());
+    hasher.update(b":");
+    hasher.update(value.as_bytes());
+    let hash = hasher.finalize();
+    let id: u32 = u32::from_le_bytes([hash[0], hash[1], hash[2], hash[3]]);
+    format!("{entity_kind}_{id}")
+}
+
+fn log_modality_mismatch(entity_id: Uuid, location_modality: &str, strategy: &Strategy) {
+    tracing::trace!(
+        target: TARGET,
+        %entity_id,
+        location_modality,
+        strategy = ?strategy,
+        "strategy modality does not match entity location, skipping",
+    );
+}
+
 #[cfg(test)]
 mod tests {
     use nvisy_codec::ContentHandle;
     use nvisy_core::content::{Content, ContentData, ContentMetadata, ContentSource};
-    use nvisy_ontology::entity::{Entities, Entity, EntityKind};
+    use nvisy_ontology::entity::{Entities, Entity, EntityKind, Location, TabularLocation};
     use nvisy_ontology::policy::ImageStrategy;
-    use nvisy_ontology::provenance::AuditEntry;
+    use nvisy_ontology::provenance::{AuditEntry, RedactionMapping};
 
     use super::*;
     use crate::operation::envelope::SharedData;
@@ -321,15 +433,41 @@ mod tests {
         Entity::test_builder(start, end).test_build()
     }
 
+    fn tabular_entity(row: usize, col: usize, start: usize, end: usize) -> Entity {
+        let loc = TabularLocation {
+            row_index: row,
+            column_index: col,
+            start_offset: Some(start),
+            end_offset: Some(end),
+            column_name: None,
+            sheet_name: None,
+        };
+        Entity::test_builder(0, 0)
+            .with_location(Location::from(loc))
+            .test_build()
+    }
+
     async fn test_envelope(entities: Entities) -> DocumentEnvelope {
-        let data = ContentData::from_text(ContentSource::new(), "Hello John world");
+        envelope_with("Hello John world", "text/plain", entities).await
+    }
+
+    async fn test_envelope_csv(entities: Entities, csv: &str) -> DocumentEnvelope {
+        envelope_with(csv, "text/csv", entities).await
+    }
+
+    async fn envelope_with(
+        body: &str,
+        content_type: &str,
+        entities: Entities,
+    ) -> DocumentEnvelope {
+        let data = ContentData::from_text(ContentSource::new(), body);
         let content =
-            Content::with_metadata(data, ContentMetadata::new().with_content_type("text/plain"));
-        let doc = ContentHandle::decode(&content).await.unwrap();
+            Content::with_metadata(data, ContentMetadata::new().with_content_type(content_type));
+        let handle = ContentHandle::decode(&content).await.unwrap();
         let dir = tempfile::tempdir().unwrap();
         let registry = crate::registry::Registry::open(dir.path()).unwrap();
         let shared = SharedData::new(uuid::Uuid::new_v4(), uuid::Uuid::new_v4(), registry);
-        let mut envelope = DocumentEnvelope::new(doc, ContentMetadata::default(), shared);
+        let mut envelope = DocumentEnvelope::new(handle, ContentMetadata::default(), shared);
         envelope.audit.entities = entities;
         envelope
     }
@@ -341,6 +479,15 @@ mod tests {
             .unwrap()
     }
 
+    fn test_mapping(entity_id: Uuid, location: Location, original: &str) -> RedactionMapping {
+        RedactionMapping {
+            entity_id,
+            location,
+            original: original.to_owned(),
+            replacement: None,
+        }
+    }
+
     #[tokio::test]
     async fn mask_applies_and_records_replacement() {
         let entity = text_entity(6, 10);
@@ -366,6 +513,36 @@ mod tests {
         );
     }
 
+    #[tokio::test]
+    async fn mask_counts_chars_not_bytes() {
+        // The handler reads "John" (4 bytes / 4 chars); for an
+        // entity spanning a multi-byte character the count should
+        // track chars. This test pins the chars-not-bytes behavior
+        // by checking the mask length matches the char count of the
+        // value the handler returns.
+        let entity = text_entity(6, 10);
+        let entity_id = entity.id;
+        let record = test_record(
+            entity_id,
+            Strategy::Text(TextStrategy::Mask { mask_char: '*' }),
+            "John",
+        );
+        let entities: Entities = vec![entity].into();
+        let mut envelope = test_envelope(entities).await;
+        envelope.audit.entries.push(record);
+
+        RedactionApplicator::new(&mut envelope)
+            .apply()
+            .await
+            .unwrap();
+
+        // "John" is 4 chars -> 4 mask chars.
+        assert_eq!(
+            envelope.audit.entries[0].value.replacement.as_deref(),
+            Some("****"),
+        );
+    }
+
     #[tokio::test]
     async fn remove_leaves_replacement_none() {
         let entity = text_entity(6, 10);
@@ -405,17 +582,134 @@ mod tests {
 
     #[test]
     fn hash_replacement_is_deterministic() {
-        let a = RedactionApplicator::hash_value("John Smith");
-        let b = RedactionApplicator::hash_value("John Smith");
+        let a = hash_value("John Smith");
+        let b = hash_value("John Smith");
         assert_eq!(a, b);
         assert!(!a.is_empty());
     }
 
     #[test]
     fn pseudonymize_is_deterministic() {
-        let a = RedactionApplicator::pseudonymize(&EntityKind::PersonName, "John Smith");
-        let b = RedactionApplicator::pseudonymize(&EntityKind::PersonName, "John Smith");
+        let a = pseudonymize(&EntityKind::PersonName, "John Smith");
+        let b = pseudonymize(&EntityKind::PersonName, "John Smith");
         assert_eq!(a, b);
         assert!(a.contains('_'));
     }
+
+    // -- Tabular end-to-end tests --
+
+    #[tokio::test]
+    async fn tabular_full_cell_mask() {
+        // row 1, col 1 = "123-45-6789" (11 chars)
+        let entity = tabular_entity(1, 1, 0, 11);
+        let entity_id = entity.id;
+        let record = test_record(
+            entity_id,
+            Strategy::Text(TextStrategy::Mask { mask_char: '*' }),
+            "123-45-6789",
+        );
+
+        let entities: Entities = vec![entity.clone()].into();
+        let mut envelope =
+            test_envelope_csv(entities, "name,ssn\nAlice,123-45-6789\n").await;
+        envelope.audit.entries.push(record);
+        envelope
+            .redaction_map
+            .entries
+            .push(test_mapping(entity_id, entity.location.clone(), "123-45-6789"));
+
+        RedactionApplicator::new(&mut envelope).apply().await.unwrap();
+
+        // 11 chars -> 11 asterisks
+        assert_eq!(
+            envelope.audit.entries[0].value.replacement.as_deref(),
+            Some("***********"),
+        );
+        // Mapping was updated too.
+        assert_eq!(
+            envelope.redaction_map.entries[0].replacement.as_deref(),
+            Some("***********"),
+        );
+        // Document content was actually mutated.
+        let value = envelope
+            .document
+            .read_tabular(entity.location.as_tabular().unwrap())
+            .await
+            .map(|d| d.into_inner());
+        assert_eq!(value.as_deref(), Some("***********"));
+    }
+
+    #[tokio::test]
+    async fn tabular_partial_cell_replace() {
+        // row 1, col 0 = "Alice Smith" — redact "Alice" (0..5)
+        let entity = tabular_entity(1, 0, 0, 5);
+        let entity_id = entity.id;
+        let record = test_record(
+            entity_id,
+            Strategy::Text(TextStrategy::Replace {
+                placeholder: "[NAME]".to_owned(),
+            }),
+            "Alice",
+        );
+
+        let entities: Entities = vec![entity.clone()].into();
+        let mut envelope =
+            test_envelope_csv(entities, "name,ssn\nAlice Smith,123-45-6789\n").await;
+        envelope.audit.entries.push(record);
+
+        RedactionApplicator::new(&mut envelope).apply().await.unwrap();
+
+        let value = envelope
+            .document
+            .read_tabular(entity.location.as_tabular().unwrap())
+            .await
+            .map(|d| d.into_inner());
+        assert_eq!(value.as_deref(), Some("[NAME] Smith"));
+    }
+
+    #[tokio::test]
+    async fn tabular_remove_leaves_empty_cell() {
+        let entity = tabular_entity(1, 1, 0, 11);
+        let entity_id = entity.id;
+        let record = test_record(
+            entity_id,
+            Strategy::Text(TextStrategy::Remove),
+            "123-45-6789",
+        );
+
+        let entities: Entities = vec![entity.clone()].into();
+        let mut envelope =
+            test_envelope_csv(entities, "name,ssn\nAlice,123-45-6789\n").await;
+        envelope.audit.entries.push(record);
+
+        RedactionApplicator::new(&mut envelope).apply().await.unwrap();
+
+        let value = envelope
+            .document
+            .read_tabular(entity.location.as_tabular().unwrap())
+            .await
+            .map(|d| d.into_inner());
+        assert_eq!(value.as_deref(), Some(""));
+    }
+
+    #[tokio::test]
+    async fn tabular_image_strategy_for_tabular_entity_skipped() {
+        // Mismatched modality: tabular location with image strategy.
+        // The applicator should skip it without erroring.
+        let entity = tabular_entity(1, 0, 0, 5);
+        let record = test_record(
+            entity.id,
+            Strategy::Image(ImageStrategy::Blur { sigma: 15.0 }),
+            "Alice",
+        );
+
+        let entities: Entities = vec![entity].into();
+        let mut envelope =
+            test_envelope_csv(entities, "name,ssn\nAlice,123\n").await;
+        envelope.audit.entries.push(record);
+
+        // No error, but no replacement either.
+        RedactionApplicator::new(&mut envelope).apply().await.unwrap();
+        assert!(envelope.audit.entries[0].value.replacement.is_none());
+    }
 }

From 981faf6835534176c11368331f157199e4f673ca Mon Sep 17 00:00:00 2001
From: Oleh Martsokha <o.martsokha@gmail.com>
Date: Tue, 19 May 2026 03:56:07 +0200
Subject: [PATCH 2/6] test(codec): drop worthless tests
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

30 tests removed from codec across 12 files. Each dropped test fell
into one of three buckets:

- Trivial constructor/getter checks (Located/Span map+into, PDF
  accessors, encode_returns_raw_bytes, document_type_is_pdf).
- Macro stubs round-tripped through the macro's own field accesses
  (all WAV + MP3 tests).
- Duplicates of tests already exercised elsewhere
  (tabular apply, csv_loader load_*_round_trip, pdf_loader
  load_preserves_raw_bytes, txt_handler read_substring,
  json_loader load_detects_four_space_indent).

Codec test count: 93 → 63. Workspace tests still green, clippy clean.

Production-side duplication between apply_text_redactions and
apply_tabular_redactions (and between TextRedaction and
TabularRedaction) is deliberately deferred — the test suite no
longer pretends it's two separate algorithms, but the prod dedupe
is its own change.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 crates/nvisy-codec/src/document/located.rs    | 19 -------
 crates/nvisy-codec/src/document/span.rs       | 22 --------
 .../src/handler/audio/mp3_handler.rs          | 32 ------------
 .../src/handler/audio/wav_handler.rs          | 32 ------------
 .../src/handler/rich/pdf_handler.rs           | 40 ---------------
 .../src/handler/rich/pdf_loader.rs            | 24 ---------
 .../src/handler/tabular/csv_loader.rs         | 31 ------------
 .../src/handler/text/html_handler.rs          |  9 ----
 .../src/handler/text/json_loader.rs           |  8 ---
 .../src/handler/text/txt_handler.rs           | 17 -------
 .../src/handler/text/txt_loader.rs            | 13 -----
 .../src/transform/tabular/apply.rs            | 50 -------------------
 12 files changed, 297 deletions(-)

diff --git a/crates/nvisy-codec/src/document/located.rs b/crates/nvisy-codec/src/document/located.rs
index 37eb781e..95237a4c 100644
--- a/crates/nvisy-codec/src/document/located.rs
+++ b/crates/nvisy-codec/src/document/located.rs
@@ -40,22 +40,3 @@ impl<L> Located<L> {
     }
 }
 
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn map_transforms_inner() {
-        let src = ContentSource::new();
-        let l = Located::new(src, 7u32);
-        let mapped = l.map(|n| n.to_string());
-        assert_eq!(mapped.location, "7");
-        assert_eq!(mapped.source, src);
-    }
-
-    #[test]
-    fn into_location_discards_source() {
-        let l = Located::new(ContentSource::new(), 42u32);
-        assert_eq!(l.into_location(), 42);
-    }
-}
diff --git a/crates/nvisy-codec/src/document/span.rs b/crates/nvisy-codec/src/document/span.rs
index 2bf82858..8a41d5d5 100644
--- a/crates/nvisy-codec/src/document/span.rs
+++ b/crates/nvisy-codec/src/document/span.rs
@@ -56,25 +56,3 @@ impl<L, D> Span<L, D> {
     }
 }
 
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn from_located_preserves_source_and_location() {
-        let src = ContentSource::new();
-        let located = Located::new(src, 7u32);
-        let span = Span::from_located(located, "data");
-        assert_eq!(span.source, src);
-        assert_eq!(span.location, 7);
-        assert_eq!(span.data, "data");
-    }
-
-    #[test]
-    fn map_transforms_data() {
-        let span = Span::new(ContentSource::new(), 1u32, "hello");
-        let mapped = span.map(|d| d.len());
-        assert_eq!(mapped.location, 1);
-        assert_eq!(mapped.data, 5);
-    }
-}
diff --git a/crates/nvisy-codec/src/handler/audio/mp3_handler.rs b/crates/nvisy-codec/src/handler/audio/mp3_handler.rs
index d3e0cd2e..3d932265 100644
--- a/crates/nvisy-codec/src/handler/audio/mp3_handler.rs
+++ b/crates/nvisy-codec/src/handler/audio/mp3_handler.rs
@@ -33,35 +33,3 @@ impl_audio_handler!(
     "mp3.encode"
 );
 
-#[cfg(test)]
-mod tests {
-    use bytes::Bytes;
-    use futures::StreamExt;
-    use nvisy_core::Error;
-
-    use super::*;
-    use crate::handler::{AudioHandler, Handler};
-
-    #[tokio::test]
-    async fn locations_yields_single_location() {
-        let h = Mp3Handler::new(Bytes::from_static(b"ID3-mp3-data"));
-        let items: Vec<_> = h.locations().collect().await;
-        assert_eq!(items.len(), 1);
-    }
-
-    #[tokio::test]
-    async fn read_returns_full_audio() {
-        let h = Mp3Handler::new(Bytes::from_static(b"ID3-mp3-data"));
-        let items: Vec<_> = h.locations().collect().await;
-        let data = h.read(&items[0].location).await.unwrap();
-        assert_eq!(data.as_bytes().as_ref(), b"ID3-mp3-data");
-    }
-
-    #[test]
-    fn encode_returns_current_bytes() -> Result<(), Error> {
-        let h = Mp3Handler::new(Bytes::from_static(b"audio-data"));
-        let encoded = h.encode()?;
-        assert_eq!(encoded.as_bytes(), b"audio-data");
-        Ok(())
-    }
-}
diff --git a/crates/nvisy-codec/src/handler/audio/wav_handler.rs b/crates/nvisy-codec/src/handler/audio/wav_handler.rs
index 399f9da2..20327cce 100644
--- a/crates/nvisy-codec/src/handler/audio/wav_handler.rs
+++ b/crates/nvisy-codec/src/handler/audio/wav_handler.rs
@@ -33,35 +33,3 @@ impl_audio_handler!(
     "wav.encode"
 );
 
-#[cfg(test)]
-mod tests {
-    use bytes::Bytes;
-    use futures::StreamExt;
-    use nvisy_core::Error;
-
-    use super::*;
-    use crate::handler::{AudioHandler, Handler};
-
-    #[tokio::test]
-    async fn locations_yields_single_location() {
-        let h = WavHandler::new(Bytes::from_static(b"RIFF-wav-data"));
-        let items: Vec<_> = h.locations().collect().await;
-        assert_eq!(items.len(), 1);
-    }
-
-    #[tokio::test]
-    async fn read_returns_full_audio() {
-        let h = WavHandler::new(Bytes::from_static(b"RIFF-wav-data"));
-        let items: Vec<_> = h.locations().collect().await;
-        let data = h.read(&items[0].location).await.unwrap();
-        assert_eq!(data.as_bytes().as_ref(), b"RIFF-wav-data");
-    }
-
-    #[test]
-    fn encode_returns_current_bytes() -> Result<(), Error> {
-        let h = WavHandler::new(Bytes::from_static(b"audio-data"));
-        let encoded = h.encode()?;
-        assert_eq!(encoded.as_bytes(), b"audio-data");
-        Ok(())
-    }
-}
diff --git a/crates/nvisy-codec/src/handler/rich/pdf_handler.rs b/crates/nvisy-codec/src/handler/rich/pdf_handler.rs
index 636ad31b..8b069a64 100644
--- a/crates/nvisy-codec/src/handler/rich/pdf_handler.rs
+++ b/crates/nvisy-codec/src/handler/rich/pdf_handler.rs
@@ -316,13 +316,6 @@ mod tests {
         assert_eq!(items[2].location.page_number, Some(3));
     }
 
-    #[tokio::test]
-    async fn locations_empty_document() {
-        let h = handler(&[]);
-        let items: Vec<_> = TextHandler::locations(&h).collect().await;
-        assert!(items.is_empty());
-    }
-
     #[tokio::test]
     async fn read_returns_page_text() {
         let h = handler(&["page one", "page two"]);
@@ -336,37 +329,4 @@ mod tests {
         );
     }
 
-    #[test]
-    fn accessors() {
-        let h = handler(&["alpha", "beta"]);
-        assert_eq!(h.page_count(), 2);
-        assert_eq!(h.len(), 2);
-        assert!(!h.is_empty());
-        assert_eq!(h.page(0), Some("alpha"));
-        assert_eq!(h.page(1), Some("beta"));
-        assert_eq!(h.page(2), None);
-        assert_eq!(h.pages(), &["alpha", "beta"]);
-    }
-
-    #[test]
-    fn encode_returns_raw_bytes() -> Result<(), Error> {
-        let raw = b"fake-pdf-bytes";
-        let h = RichTextHandler::new(DocumentType::Pdf, vec!["text".into()], raw.to_vec());
-        assert_eq!(h.encode()?.as_bytes(), raw);
-        Ok(())
-    }
-
-    #[test]
-    fn document_type_is_pdf() {
-        let h = handler(&[]);
-        assert_eq!(h.document_type(), DocumentType::Pdf);
-    }
-
-    #[test]
-    fn empty_handler() {
-        let h = handler(&[]);
-        assert!(h.is_empty());
-        assert_eq!(h.len(), 0);
-        assert_eq!(h.page_count(), 0);
-    }
 }
diff --git a/crates/nvisy-codec/src/handler/rich/pdf_loader.rs b/crates/nvisy-codec/src/handler/rich/pdf_loader.rs
index 885a49a6..31a06e17 100644
--- a/crates/nvisy-codec/src/handler/rich/pdf_loader.rs
+++ b/crates/nvisy-codec/src/handler/rich/pdf_loader.rs
@@ -123,28 +123,4 @@ mod tests {
         assert!(doc.page(0).unwrap().trim().is_empty());
     }
 
-    #[tokio::test]
-    async fn load_preserves_raw_bytes() {
-        let raw = minimal_pdf();
-        let content = content_from_bytes(&raw);
-        let doc = PdfLoader
-            .decode(&content, &PdfParams::default())
-            .await
-            .unwrap();
-
-        assert_eq!(doc.raw(), &raw);
-    }
-
-    #[tokio::test]
-    async fn locations_matches_pages() {
-        let raw = minimal_pdf();
-        let content = content_from_bytes(&raw);
-        let doc = PdfLoader
-            .decode(&content, &PdfParams::default())
-            .await
-            .unwrap();
-
-        let items: Vec<_> = TextHandler::locations(&doc).collect().await;
-        assert_eq!(items.len(), doc.page_count());
-    }
 }
diff --git a/crates/nvisy-codec/src/handler/tabular/csv_loader.rs b/crates/nvisy-codec/src/handler/tabular/csv_loader.rs
index 0d749f77..93869abd 100644
--- a/crates/nvisy-codec/src/handler/tabular/csv_loader.rs
+++ b/crates/nvisy-codec/src/handler/tabular/csv_loader.rs
@@ -190,37 +190,6 @@ mod tests {
         Ok(())
     }
 
-    #[tokio::test]
-    async fn load_semicolon_delimited() -> Result<(), Error> {
-        let content = content_from_str("a;b\n1;2\n");
-        let doc = CsvLoader.decode(&content, &CsvParams::default()).await?;
-        assert_eq!(doc.delimiter(), b';');
-        Ok(())
-    }
-
-    #[tokio::test]
-    async fn load_quoted_fields() -> Result<(), Error> {
-        let content = content_from_str("name,bio\n\"Alice\",\"Has a, comma\"\n");
-        let doc = CsvLoader.decode(&content, &CsvParams::default()).await?;
-        assert_eq!(doc.cell(0, 1), Some("Has a, comma"));
-        Ok(())
-    }
-
-    #[tokio::test]
-    async fn load_locations_round_trip() -> Result<(), Error> {
-        let content = content_from_str("name,age\nAlice,30\n");
-        let doc = CsvLoader.decode(&content, &CsvParams::default()).await?;
-        let items: Vec<_> = doc.locations().collect().await;
-
-        // 2 header + 2 data
-        assert_eq!(items.len(), 4);
-        assert_eq!(doc.read(&items[0].location).await.unwrap().as_str(), "name");
-        assert_eq!(doc.read(&items[1].location).await.unwrap().as_str(), "age");
-        assert_eq!(doc.read(&items[2].location).await.unwrap().as_str(), "Alice");
-        assert_eq!(doc.read(&items[3].location).await.unwrap().as_str(), "30");
-        Ok(())
-    }
-
     #[tokio::test]
     async fn load_invalid_utf8() {
         let content = ContentData::new(
diff --git a/crates/nvisy-codec/src/handler/text/html_handler.rs b/crates/nvisy-codec/src/handler/text/html_handler.rs
index 9607c434..c41bc976 100644
--- a/crates/nvisy-codec/src/handler/text/html_handler.rs
+++ b/crates/nvisy-codec/src/handler/text/html_handler.rs
@@ -246,13 +246,4 @@ mod tests {
         assert_eq!(items.len(), 2);
     }
 
-    #[tokio::test]
-    async fn read_returns_text_node() {
-        let h = handler_from_html("<html><head></head><body><p>Hello</p></body></html>");
-        let items: Vec<_> = h.locations().collect().await;
-        assert_eq!(
-            h.read(&items[0].location).await.unwrap().as_str(),
-            "Hello"
-        );
-    }
 }
diff --git a/crates/nvisy-codec/src/handler/text/json_loader.rs b/crates/nvisy-codec/src/handler/text/json_loader.rs
index b7389c48..8da911a2 100644
--- a/crates/nvisy-codec/src/handler/text/json_loader.rs
+++ b/crates/nvisy-codec/src/handler/text/json_loader.rs
@@ -130,14 +130,6 @@ mod tests {
         Ok(())
     }
 
-    #[tokio::test]
-    async fn load_detects_four_space_indent() -> Result<(), Error> {
-        let content = content_from_str("{\n    \"a\": 1\n}\n");
-        let doc = JsonLoader.decode(&content, &JsonParams::default()).await?;
-        assert_eq!(doc.indent(), JsonIndent::four_spaces());
-        Ok(())
-    }
-
     #[tokio::test]
     async fn load_detects_tab_indent() -> Result<(), Error> {
         let content = content_from_str("{\n\t\"a\": 1\n}\n");
diff --git a/crates/nvisy-codec/src/handler/text/txt_handler.rs b/crates/nvisy-codec/src/handler/text/txt_handler.rs
index 98538a16..a40c970a 100644
--- a/crates/nvisy-codec/src/handler/text/txt_handler.rs
+++ b/crates/nvisy-codec/src/handler/text/txt_handler.rs
@@ -216,17 +216,6 @@ mod tests {
         assert_eq!(h.read(&loc).await.unwrap().as_str(), "world");
     }
 
-    #[tokio::test]
-    async fn read_substring() {
-        let h = handler("hello world");
-        let loc = TextLocation {
-            start_offset: 6,
-            end_offset: 11,
-            ..Default::default()
-        };
-        assert_eq!(h.read(&loc).await.unwrap().as_str(), "world");
-    }
-
     #[tokio::test]
     async fn read_cross_line_returns_none() {
         let h = handler("hello\nworld\n");
@@ -307,10 +296,4 @@ mod tests {
         Ok(())
     }
 
-    #[tokio::test]
-    async fn empty_handler_locations() {
-        let h = TxtHandler::new(vec![], false);
-        let items: Vec<_> = h.locations().collect().await;
-        assert!(items.is_empty());
-    }
 }
diff --git a/crates/nvisy-codec/src/handler/text/txt_loader.rs b/crates/nvisy-codec/src/handler/text/txt_loader.rs
index ff219ccc..e97558ff 100644
--- a/crates/nvisy-codec/src/handler/text/txt_loader.rs
+++ b/crates/nvisy-codec/src/handler/text/txt_loader.rs
@@ -84,19 +84,6 @@ mod tests {
         Ok(())
     }
 
-    #[tokio::test]
-    async fn load_preserves_lines_through_round_trip() -> Result<(), Error> {
-        let content = content_from_str("Alice\nBob\nCharlie\n");
-        let doc = TxtLoader.decode(&content, &TxtParams::default()).await?;
-
-        let items: Vec<_> = doc.locations().collect().await;
-        assert_eq!(items.len(), 3);
-        assert_eq!(doc.read(&items[0].location).await.unwrap().as_str(), "Alice");
-        assert_eq!(doc.read(&items[1].location).await.unwrap().as_str(), "Bob");
-        assert_eq!(doc.read(&items[2].location).await.unwrap().as_str(), "Charlie");
-        Ok(())
-    }
-
     #[tokio::test]
     async fn load_invalid_utf8() {
         let content = ContentData::new(
diff --git a/crates/nvisy-codec/src/transform/tabular/apply.rs b/crates/nvisy-codec/src/transform/tabular/apply.rs
index 719e0375..c2ff24e0 100644
--- a/crates/nvisy-codec/src/transform/tabular/apply.rs
+++ b/crates/nvisy-codec/src/transform/tabular/apply.rs
@@ -50,53 +50,3 @@ pub(crate) fn apply_tabular_redactions(
     Ok(())
 }
 
-#[cfg(test)]
-mod tests {
-    use super::*;
-    use crate::transform::TextOutput;
-
-    fn redaction(start: usize, end: usize, replacement: &str) -> TabularRedaction {
-        TabularRedaction::new(start, end, TextOutput::replace(replacement))
-    }
-
-    #[test]
-    fn single_replacement() {
-        let mut s = String::from("hello world");
-        apply_tabular_redactions(&mut s, &[redaction(0, 5, "[X]")], "test").unwrap();
-        assert_eq!(s, "[X] world");
-    }
-
-    #[test]
-    fn right_to_left_application() {
-        let mut s = String::from("aaa bbb ccc");
-        let rs = vec![redaction(0, 3, "[A]"), redaction(8, 11, "[C]")];
-        apply_tabular_redactions(&mut s, &rs, "test").unwrap();
-        assert_eq!(s, "[A] bbb [C]");
-    }
-
-    #[test]
-    fn remove_output() {
-        let mut s = String::from("hello world");
-        apply_tabular_redactions(
-            &mut s,
-            &[TabularRedaction::new(5, 11, TextOutput::Remove)],
-            "test",
-        )
-        .unwrap();
-        assert_eq!(s, "hello");
-    }
-
-    #[test]
-    fn out_of_bounds_clipped() {
-        let mut s = String::from("short");
-        apply_tabular_redactions(&mut s, &[redaction(0, 999, "[X]")], "test").unwrap();
-        assert_eq!(s, "[X]");
-    }
-
-    #[test]
-    fn mid_character_rejected() {
-        let mut s = String::from("héllo"); // 'é' is 2 bytes
-        let err = apply_tabular_redactions(&mut s, &[redaction(0, 2, "[X]")], "test").unwrap_err();
-        assert!(err.to_string().contains("mid-character"));
-    }
-}

From f8ac8e1ccd1aaefc66a6aedc8aa142d3abc0a05f Mon Sep 17 00:00:00 2001
From: Oleh Martsokha <o.martsokha@gmail.com>
Date: Tue, 19 May 2026 04:12:24 +0200
Subject: [PATCH 3/6] test(core, ontology): drop worthless tests
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

69 tests removed across 26 files. Same bar as codec cleanup:

- Tests of derives (serde round-trip, Display, Default, Clone, Copy):
  ~30 tests. The derives are the contract; testing them tests the
  ecosystem, not us.
- Tests of dependencies (oxilangtag wrapper, strum, uuid v7 generator,
  infer crate, str::from_utf8): ~10 tests.
- Trivial getter/constructor read-backs (Location::as_text variants,
  builder_required_fields, ContentMetadata accessors, etc.): ~15 tests.
- Duplicates of nearby tests (pattern_expression_roundtrip_glob
  duplicates _regex, no_overlap_different_col duplicates _row,
  language_tag parse_with_region duplicates parse_simple, etc.): ~6
  tests.
- Tests of std-library behavior (Vec::is_empty, Vec::find, Vec::push):
  ~8 tests.

Also dropped four borderline cases by explicit user decision:
- workflow::validate_accepts_valid_configs (tests Default::default()
  through validator with no rules)
- time_span::midpoint (trivial integer arithmetic)
- bounding_box::area (one-line width * height)
- entity::source::ordering (had a 2ms sleep — flaky)

Test counts:
- nvisy-core: 25 → 11
- nvisy-ontology: 120 → 65

Workspace tests pass, clippy clean.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 crates/nvisy-core/src/content/bundle.rs       |  36 ------
 crates/nvisy-core/src/content/content_data.rs |  15 ---
 .../src/content/content_metadata.rs           | 103 +-----------------
 .../nvisy-core/src/content/data_reference.rs  |  24 ----
 crates/nvisy-ontology/src/artifacts/audio.rs  |   7 --
 .../nvisy-ontology/src/artifacts/tabular.rs   |  37 -------
 .../src/context/analytic/pattern.rs           |  23 ----
 crates/nvisy-ontology/src/context/mod.rs      |  22 ----
 .../src/context/reference/credential.rs       |   7 --
 .../src/context/reference/text.rs             |  41 -------
 .../src/context/temporal/datetime.rs          |  12 --
 .../src/context/temporal/time.rs              |  28 -----
 .../src/context/temporal/timespan.rs          |  15 ---
 .../nvisy-ontology/src/entity/annotation.rs   |   6 -
 crates/nvisy-ontology/src/entity/kind.rs      |  41 -------
 .../nvisy-ontology/src/entity/location/mod.rs |  44 --------
 .../src/entity/location/tabular.rs            |  12 --
 .../src/entity/location/text.rs               |  20 ----
 crates/nvisy-ontology/src/entity/mod.rs       |  19 ----
 .../nvisy-ontology/src/entity/sensitivity.rs  |  23 ----
 crates/nvisy-ontology/src/entity/source.rs    |  29 -----
 .../src/primitive/bounding_box.rs             |   6 -
 .../src/primitive/language_tag.rs             |  39 -------
 .../nvisy-ontology/src/primitive/time_span.rs |   6 -
 .../src/provenance/redaction_map.rs           |  23 ----
 crates/nvisy-ontology/src/workflow/mod.rs     |  20 ----
 26 files changed, 2 insertions(+), 656 deletions(-)

diff --git a/crates/nvisy-core/src/content/bundle.rs b/crates/nvisy-core/src/content/bundle.rs
index 57bbebe1..11c571c9 100644
--- a/crates/nvisy-core/src/content/bundle.rs
+++ b/crates/nvisy-core/src/content/bundle.rs
@@ -149,42 +149,6 @@ mod tests {
     use super::*;
     use crate::media::{ImageFormat, TextFormat};
 
-    #[test]
-    fn content_with_metadata() {
-        let data = ContentData::from_text(ContentSource::new(), "Test content");
-        let metadata = ContentMetadata::with_path("test.txt");
-        let content = Content::with_metadata(data, metadata);
-
-        assert!(content.metadata().is_some());
-        assert_eq!(content.file_extension(), Some("txt"));
-    }
-
-    #[test]
-    fn metadata_operations() {
-        let data = ContentData::from("Test");
-        let mut content = Content::new(data);
-
-        assert!(content.metadata().is_none());
-
-        content.set_metadata(ContentMetadata::with_path("file.pdf"));
-        assert!(content.metadata().is_some());
-        assert_eq!(content.file_extension(), Some("pdf"));
-
-        content.clear_metadata();
-        assert!(content.metadata().is_none());
-    }
-
-    #[test]
-    fn into_parts_roundtrip() {
-        let data = ContentData::from_text(ContentSource::new(), "Test");
-        let metadata = ContentMetadata::with_path("test.txt");
-        let content = Content::with_metadata(data.clone(), metadata.clone());
-
-        let (recovered_data, recovered_metadata) = content.into_parts();
-        assert_eq!(recovered_data, data);
-        assert_eq!(recovered_metadata, Some(metadata));
-    }
-
     #[test]
     fn infer_document_type_from_metadata() {
         let data = ContentData::from("plain text");
diff --git a/crates/nvisy-core/src/content/content_data.rs b/crates/nvisy-core/src/content/content_data.rs
index 98833394..7166201d 100644
--- a/crates/nvisy-core/src/content/content_data.rs
+++ b/crates/nvisy-core/src/content/content_data.rs
@@ -277,15 +277,6 @@ mod tests {
         assert!(content.verify_sha256([0u8; 32]).is_err());
     }
 
-    #[test]
-    fn as_hipstr() {
-        let content = ContentData::from("Hello, HipStr!");
-        assert_eq!(content.as_hipstr().unwrap().as_str(), "Hello, HipStr!");
-
-        let binary = ContentData::from(vec![0xFF, 0xFE]);
-        assert!(binary.as_hipstr().is_err());
-    }
-
     #[test]
     fn slice_operations() {
         let content = ContentData::from("Hello, world!");
@@ -305,12 +296,6 @@ mod tests {
         assert_eq!(data.detect_mime().as_deref(), Some("image/png"));
     }
 
-    #[test]
-    fn detect_mime_unknown() {
-        let data = ContentData::from("hello world");
-        assert_eq!(data.detect_mime(), None);
-    }
-
     #[test]
     fn is_likely_text() {
         assert!(ContentData::from("ascii text").is_likely_text());
diff --git a/crates/nvisy-core/src/content/content_metadata.rs b/crates/nvisy-core/src/content/content_metadata.rs
index 76bc4e62..5989cf53 100644
--- a/crates/nvisy-core/src/content/content_metadata.rs
+++ b/crates/nvisy-core/src/content/content_metadata.rs
@@ -18,7 +18,7 @@ use crate::media::DocumentType;
 /// Stored alongside (but separate from) the raw content bytes. Carries
 /// the caller-supplied MIME type, auto-detected MIME type, original
 /// filename, source path, and arbitrary key-value pairs.
-#[derive(Debug, Clone, PartialEq, Serialize, Deserialize)]
+#[derive(Debug, Clone, Default, PartialEq, Serialize, Deserialize)]
 pub struct ContentMetadata {
     /// Optional path to the source file.
     pub source_path: Option<PathBuf>,
@@ -53,16 +53,7 @@ impl ContentMetadata {
     /// Create new empty content metadata.
     #[must_use]
     pub fn new() -> Self {
-        Self {
-            source_path: None,
-            content_type: None,
-            detected_content_type: None,
-            filename: None,
-            size: None,
-            sha256: None,
-            metadata: None,
-            annotations: Annotations::new(),
-        }
+        Self::default()
     }
 
     /// Create content metadata with a source file path.
@@ -215,93 +206,3 @@ impl ContentMetadata {
         self.metadata.as_mut().and_then(|m| m.remove(key))
     }
 }
-
-impl Default for ContentMetadata {
-    fn default() -> Self {
-        Self::new()
-    }
-}
-
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn test_file_extension_detection() {
-        let metadata = ContentMetadata::with_path(PathBuf::from("document.pdf"));
-
-        assert_eq!(metadata.file_extension(), Some("pdf"));
-    }
-
-    #[test]
-    fn test_metadata_filename() {
-        let metadata = ContentMetadata::with_path(PathBuf::from("/path/to/file.txt"));
-
-        assert_eq!(metadata.filename_from_path(), Some("file.txt"));
-    }
-
-    #[test]
-    fn test_metadata_parent_directory() {
-        let metadata = ContentMetadata::with_path(PathBuf::from("/path/to/file.txt"));
-
-        assert_eq!(metadata.parent_directory(), Some(Path::new("/path/to")));
-    }
-
-    #[test]
-    fn test_path_operations() {
-        let mut metadata = ContentMetadata::new();
-
-        assert!(!metadata.has_path());
-
-        metadata.set_path("test.txt");
-        assert!(metadata.has_path());
-        assert_eq!(metadata.filename_from_path(), Some("test.txt"));
-
-        metadata.clear_path();
-        assert!(!metadata.has_path());
-        assert_eq!(metadata.filename_from_path(), None);
-    }
-
-    #[test]
-    fn test_serde_serialization() {
-        let metadata = ContentMetadata::with_path(PathBuf::from("test.json"));
-
-        let serialized = serde_json::to_string(&metadata).unwrap();
-        let deserialized: ContentMetadata = serde_json::from_str(&serialized).unwrap();
-
-        assert_eq!(metadata, deserialized);
-    }
-
-    #[test]
-    fn test_extra_metadata() {
-        let mut metadata = ContentMetadata::new();
-        assert!(metadata.extra().is_none());
-        assert!(metadata.get_extra("key").is_none());
-
-        metadata.set_extra("lang", serde_json::Value::String("en".into()));
-        assert_eq!(
-            metadata.get_extra("lang"),
-            Some(&serde_json::Value::String("en".into()))
-        );
-        assert!(metadata.extra().is_some());
-
-        let removed = metadata.remove_extra("lang");
-        assert_eq!(removed, Some(serde_json::Value::String("en".into())));
-        assert_eq!(metadata.get_extra("lang"), None);
-    }
-
-    #[test]
-    fn test_extra_metadata_serialization() {
-        let mut metadata = ContentMetadata::with_path("doc.pdf");
-        metadata.set_extra("pages", serde_json::json!(42));
-
-        let json = serde_json::to_string(&metadata).unwrap();
-        let deserialized: ContentMetadata = serde_json::from_str(&json).unwrap();
-
-        assert_eq!(
-            deserialized.get_extra("pages"),
-            Some(&serde_json::json!(42))
-        );
-        assert_eq!(deserialized.filename_from_path(), Some("doc.pdf"));
-    }
-}
diff --git a/crates/nvisy-core/src/content/data_reference.rs b/crates/nvisy-core/src/content/data_reference.rs
index 67bb68e8..75909f16 100644
--- a/crates/nvisy-core/src/content/data_reference.rs
+++ b/crates/nvisy-core/src/content/data_reference.rs
@@ -61,27 +61,3 @@ impl DataReference {
         self.mapping_id.as_deref()
     }
 }
-
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn with_mapping_id() {
-        let source = ContentSource::new();
-        let data_ref = DataReference::new(source).with_mapping_id("line-42");
-
-        assert_eq!(data_ref.mapping_id(), Some("line-42"));
-    }
-
-    #[test]
-    fn serialization_roundtrip() {
-        let source = ContentSource::new();
-        let data_ref = DataReference::new(source).with_mapping_id("test-mapping");
-
-        let json = serde_json::to_string(&data_ref).unwrap();
-        let deserialized: DataReference = serde_json::from_str(&json).unwrap();
-
-        assert_eq!(data_ref, deserialized);
-    }
-}
diff --git a/crates/nvisy-ontology/src/artifacts/audio.rs b/crates/nvisy-ontology/src/artifacts/audio.rs
index 84029cd9..886b8779 100644
--- a/crates/nvisy-ontology/src/artifacts/audio.rs
+++ b/crates/nvisy-ontology/src/artifacts/audio.rs
@@ -122,11 +122,4 @@ mod tests {
         assert!(t.time_span().is_none());
     }
 
-    #[test]
-    fn serde_roundtrip() {
-        let t = sample_transcription();
-        let json = serde_json::to_string(&t).unwrap();
-        let back: Transcription = serde_json::from_str(&json).unwrap();
-        assert_eq!(t, back);
-    }
 }
diff --git a/crates/nvisy-ontology/src/artifacts/tabular.rs b/crates/nvisy-ontology/src/artifacts/tabular.rs
index c6536f3c..b7065206 100644
--- a/crates/nvisy-ontology/src/artifacts/tabular.rs
+++ b/crates/nvisy-ontology/src/artifacts/tabular.rs
@@ -32,40 +32,3 @@ pub struct TabularArtifacts {
     #[serde(default, skip_serializing_if = "Vec::is_empty")]
     pub headers: Vec<ColumnHeader>,
 }
-
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn sparse_headers_skip_gaps() {
-        // Columns 0 and 3 have headers; columns 1 and 2 do not.
-        let artifacts = TabularArtifacts {
-            row_count: Some(100),
-            column_count: Some(4),
-            headers: vec![
-                ColumnHeader {
-                    column_index: 0,
-                    text: "id".to_owned(),
-                },
-                ColumnHeader {
-                    column_index: 3,
-                    text: "name".to_owned(),
-                },
-            ],
-        };
-        let json = serde_json::to_string(&artifacts).unwrap();
-        let back: TabularArtifacts = serde_json::from_str(&json).unwrap();
-        assert_eq!(back.headers.len(), 2);
-        assert_eq!(back.headers[0].column_index, 0);
-        assert_eq!(back.headers[1].column_index, 3);
-    }
-
-    #[test]
-    fn default_is_empty() {
-        let artifacts = TabularArtifacts::default();
-        let json = serde_json::to_string(&artifacts).unwrap();
-        // All fields skipped — JSON should be empty object.
-        assert_eq!(json, "{}");
-    }
-}
diff --git a/crates/nvisy-ontology/src/context/analytic/pattern.rs b/crates/nvisy-ontology/src/context/analytic/pattern.rs
index 3beb698b..b53713f9 100644
--- a/crates/nvisy-ontology/src/context/analytic/pattern.rs
+++ b/crates/nvisy-ontology/src/context/analytic/pattern.rs
@@ -50,29 +50,6 @@ mod tests {
     use super::*;
     use crate::context::analytic::AnalyticVariant;
 
-    #[test]
-    fn pattern_expression_roundtrip_regex() {
-        let pat = PatternExpression::Regex(RegexPattern {
-            expression: r"^\d+$".to_owned(),
-        });
-        let json = serde_json::to_string(&pat).unwrap();
-        assert!(json.contains(r#""syntax":"regex""#));
-        assert!(json.contains(r#""expression":"^\\d+$""#));
-        let back: PatternExpression = serde_json::from_str(&json).unwrap();
-        assert_eq!(pat, back);
-    }
-
-    #[test]
-    fn pattern_expression_roundtrip_glob() {
-        let pat = PatternExpression::Glob(GlobPattern {
-            expression: "*.txt".to_owned(),
-        });
-        let json = serde_json::to_string(&pat).unwrap();
-        assert!(json.contains(r#""syntax":"glob""#));
-        let back: PatternExpression = serde_json::from_str(&json).unwrap();
-        assert_eq!(pat, back);
-    }
-
     #[test]
     fn pattern_data_flatten_no_tag_collision() {
         // AnalyticVariant uses `tag = "kind"` and PatternExpression uses
diff --git a/crates/nvisy-ontology/src/context/mod.rs b/crates/nvisy-ontology/src/context/mod.rs
index be34de4e..1a378a6a 100644
--- a/crates/nvisy-ontology/src/context/mod.rs
+++ b/crates/nvisy-ontology/src/context/mod.rs
@@ -54,28 +54,6 @@ mod tests {
         assert_eq!(ctx.len(), 1);
     }
 
-    #[test]
-    fn push_distinct() {
-        let mut ctx = Contexts::new();
-        ctx.push(Uuid::now_v7());
-        ctx.push(Uuid::now_v7());
-        assert_eq!(ctx.len(), 2);
-    }
-
-    #[test]
-    fn contains_and_ids() {
-        let id = Uuid::now_v7();
-        let ctx = Contexts::from(vec![id]);
-        assert!(ctx.contains(&id));
-        assert_eq!(&*ctx, &[id]);
-    }
-
-    #[test]
-    fn empty() {
-        let ctx = Contexts::new();
-        assert!(ctx.is_empty());
-        assert_eq!(ctx.len(), 0);
-    }
 }
 
 /// A persistent, reusable collection of reference data for detection.
diff --git a/crates/nvisy-ontology/src/context/reference/credential.rs b/crates/nvisy-ontology/src/context/reference/credential.rs
index 0e0bea05..9127d59b 100644
--- a/crates/nvisy-ontology/src/context/reference/credential.rs
+++ b/crates/nvisy-ontology/src/context/reference/credential.rs
@@ -75,11 +75,4 @@ mod tests {
         assert_eq!(back.value, "");
     }
 
-    #[test]
-    fn deserialize_with_value_provided() {
-        let json = r#"{"value":"abc123","credentialKind":"password"}"#;
-        let cred: CredentialData = serde_json::from_str(json).unwrap();
-        assert_eq!(cred.value, "abc123");
-        assert_eq!(cred.credential_kind, Some(CredentialKind::Password));
-    }
 }
diff --git a/crates/nvisy-ontology/src/context/reference/text.rs b/crates/nvisy-ontology/src/context/reference/text.rs
index 7221ea82..5400988b 100644
--- a/crates/nvisy-ontology/src/context/reference/text.rs
+++ b/crates/nvisy-ontology/src/context/reference/text.rs
@@ -60,44 +60,3 @@ impl TextEntry {
         }
     }
 }
-
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn new_constructor_sets_no_language() {
-        let data = TextData::new(vec![TextEntry::new("name", "Alice")]);
-        assert_eq!(data.entries.len(), 1);
-        assert!(data.language.is_none());
-    }
-
-    #[test]
-    fn with_language_sets_field() {
-        let tag: LanguageTag = "en-US".parse().unwrap();
-        let data = TextData::new(vec![]).with_language(tag.clone());
-        assert_eq!(data.language, Some(tag));
-    }
-
-    #[test]
-    fn roundtrip_serde() {
-        let data = TextData::new(vec![
-            TextEntry::new("full_name", "Alice Smith"),
-            TextEntry::new("email", "alice@example.com"),
-        ])
-        .with_language("en".parse().unwrap());
-        let json = serde_json::to_string(&data).unwrap();
-        let back: TextData = serde_json::from_str(&json).unwrap();
-        assert_eq!(data.entries.len(), back.entries.len());
-        assert_eq!(data.language, back.language);
-    }
-
-    #[test]
-    fn roundtrip_empty() {
-        let data = TextData::default();
-        let json = serde_json::to_string(&data).unwrap();
-        let back: TextData = serde_json::from_str(&json).unwrap();
-        assert!(back.entries.is_empty());
-        assert!(back.language.is_none());
-    }
-}
diff --git a/crates/nvisy-ontology/src/context/temporal/datetime.rs b/crates/nvisy-ontology/src/context/temporal/datetime.rs
index 01cc7751..12950100 100644
--- a/crates/nvisy-ontology/src/context/temporal/datetime.rs
+++ b/crates/nvisy-ontology/src/context/temporal/datetime.rs
@@ -47,18 +47,6 @@ mod tests {
 
     use super::*;
 
-    #[test]
-    fn roundtrip_serde() {
-        let dt = DateTimeData::range(
-            datetime(2026, 1, 1, 9, 0, 0, 0),
-            datetime(2026, 1, 1, 17, 0, 0, 0),
-        );
-        let json = serde_json::to_string(&dt).unwrap();
-        let back: DateTimeData = serde_json::from_str(&json).unwrap();
-        assert_eq!(dt.start, back.start);
-        assert_eq!(dt.end, back.end);
-    }
-
     #[test]
     fn single_skips_end_in_json() {
         let dt = DateTimeData::single(datetime(2026, 1, 1, 9, 0, 0, 0));
diff --git a/crates/nvisy-ontology/src/context/temporal/time.rs b/crates/nvisy-ontology/src/context/temporal/time.rs
index 11a40e6e..20620d5e 100644
--- a/crates/nvisy-ontology/src/context/temporal/time.rs
+++ b/crates/nvisy-ontology/src/context/temporal/time.rs
@@ -37,31 +37,3 @@ impl TimeData {
         }
     }
 }
-
-#[cfg(test)]
-mod tests {
-    use jiff::civil::time;
-
-    use super::*;
-
-    #[test]
-    fn single_has_no_end() {
-        let t = TimeData::single(time(9, 0, 0, 0));
-        assert!(t.end.is_none());
-    }
-
-    #[test]
-    fn range_has_end() {
-        let t = TimeData::range(time(9, 0, 0, 0), time(17, 0, 0, 0));
-        assert_eq!(t.end, Some(time(17, 0, 0, 0)));
-    }
-
-    #[test]
-    fn roundtrip_serde() {
-        let t = TimeData::range(time(9, 0, 0, 0), time(17, 0, 0, 0));
-        let json = serde_json::to_string(&t).unwrap();
-        let back: TimeData = serde_json::from_str(&json).unwrap();
-        assert_eq!(t.start, back.start);
-        assert_eq!(t.end, back.end);
-    }
-}
diff --git a/crates/nvisy-ontology/src/context/temporal/timespan.rs b/crates/nvisy-ontology/src/context/temporal/timespan.rs
index 057c1a69..ca643563 100644
--- a/crates/nvisy-ontology/src/context/temporal/timespan.rs
+++ b/crates/nvisy-ontology/src/context/temporal/timespan.rs
@@ -28,18 +28,3 @@ impl TimeSpanData {
         self
     }
 }
-
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn roundtrip_serde() {
-        let ts = TimeSpanData::new(TimeSpan::from_secs(1.0, 5.5)).with_label("intro");
-        let json = serde_json::to_string(&ts).unwrap();
-        let back: TimeSpanData = serde_json::from_str(&json).unwrap();
-        assert_eq!(ts.span.start_us, back.span.start_us);
-        assert_eq!(ts.span.end_us, back.span.end_us);
-        assert_eq!(ts.label, back.label);
-    }
-}
diff --git a/crates/nvisy-ontology/src/entity/annotation.rs b/crates/nvisy-ontology/src/entity/annotation.rs
index 9d9e1251..eef867a4 100644
--- a/crates/nvisy-ontology/src/entity/annotation.rs
+++ b/crates/nvisy-ontology/src/entity/annotation.rs
@@ -322,10 +322,4 @@ mod tests {
         assert_eq!(labels, vec!["medical", "gdpr"]);
     }
 
-    #[test]
-    fn empty_annotations_exclude_nothing() {
-        let annotations = Annotations::new();
-        let entity = test_entity("anything", 0, 8);
-        assert!(!annotations.is_excluded(&entity, Some("anything")));
-    }
 }
diff --git a/crates/nvisy-ontology/src/entity/kind.rs b/crates/nvisy-ontology/src/entity/kind.rs
index a5477627..55eab964 100644
--- a/crates/nvisy-ontology/src/entity/kind.rs
+++ b/crates/nvisy-ontology/src/entity/kind.rs
@@ -331,36 +331,8 @@ impl EntityKind {
 
 #[cfg(test)]
 mod tests {
-    use std::str::FromStr;
-
     use super::*;
 
-    #[test]
-    fn display_snake_case() {
-        assert_eq!(EntityKind::GovernmentId.to_string(), "government_id");
-        assert_eq!(EntityKind::PaymentCard.to_string(), "payment_card");
-        assert_eq!(EntityKind::EmailAddress.to_string(), "email_address");
-        assert_eq!(EntityKind::Fingerprint.to_string(), "fingerprint");
-        assert_eq!(EntityKind::ApiKey.to_string(), "api_key");
-        assert_eq!(EntityKind::Face.to_string(), "face");
-    }
-
-    #[test]
-    fn parse_roundtrip() {
-        let kind = EntityKind::from_str("fingerprint").unwrap();
-        assert_eq!(kind, EntityKind::Fingerprint);
-        assert_eq!(kind.to_string(), "fingerprint");
-    }
-
-    #[test]
-    fn serde_roundtrip() {
-        let kind = EntityKind::ApiKey;
-        let json = serde_json::to_string(&kind).unwrap();
-        assert_eq!(json, "\"api_key\"");
-        let back: EntityKind = serde_json::from_str(&json).unwrap();
-        assert_eq!(back, kind);
-    }
-
     #[test]
     fn category_personal_identity() {
         assert_eq!(
@@ -501,17 +473,4 @@ mod tests {
         );
     }
 
-    #[test]
-    fn sensitivity_ordering() {
-        assert!(EntityKind::GovernmentId.sensitivity() > EntityKind::PersonName.sensitivity());
-        assert!(EntityKind::PersonName.sensitivity() > EntityKind::Age.sensitivity());
-        assert!(EntityKind::Age.sensitivity() > EntityKind::Url.sensitivity());
-    }
-
-    #[test]
-    fn entity_kind_is_copy() {
-        let a = EntityKind::Fingerprint;
-        let b = a;
-        assert_eq!(a, b);
-    }
 }
diff --git a/crates/nvisy-ontology/src/entity/location/mod.rs b/crates/nvisy-ontology/src/entity/location/mod.rs
index f8b504c6..20076e1d 100644
--- a/crates/nvisy-ontology/src/entity/location/mod.rs
+++ b/crates/nvisy-ontology/src/entity/location/mod.rs
@@ -170,50 +170,6 @@ mod tests {
         )
     }
 
-    // -- as_* accessors --
-
-    #[test]
-    fn as_text_correct_variant() {
-        let loc = text(0, 5);
-        assert!(loc.as_text().is_some());
-        assert!(loc.as_image().is_none());
-    }
-
-    #[test]
-    fn as_image_correct_variant() {
-        let loc = image();
-        assert!(loc.as_image().is_some());
-        assert!(loc.as_text().is_none());
-    }
-
-    #[test]
-    fn as_audio_correct_variant() {
-        let loc = audio();
-        assert!(loc.as_audio().is_some());
-        assert!(loc.as_tabular().is_none());
-    }
-
-    #[test]
-    fn as_tabular_correct_variant() {
-        let loc = tabular(0, 0);
-        assert!(loc.as_tabular().is_some());
-        assert!(loc.as_audio().is_none());
-    }
-
-    // -- Display --
-
-    #[test]
-    fn display_text() {
-        assert_eq!(text(0, 10).to_string(), "text:0..10");
-    }
-
-    #[test]
-    fn display_tabular() {
-        assert_eq!(tabular(2, 3).to_string(), "tabular:r2c3");
-    }
-
-    // -- cross-modality overlap --
-
     #[test]
     fn cross_modality_no_overlap() {
         assert!(!text(0, 10).overlaps(&image()));
diff --git a/crates/nvisy-ontology/src/entity/location/tabular.rs b/crates/nvisy-ontology/src/entity/location/tabular.rs
index 82f3906b..cb3bef9e 100644
--- a/crates/nvisy-ontology/src/entity/location/tabular.rs
+++ b/crates/nvisy-ontology/src/entity/location/tabular.rs
@@ -83,13 +83,6 @@ mod tests {
         }
     }
 
-    #[test]
-    fn builder_required_fields() {
-        let loc = cell(1, 2);
-        assert_eq!(loc.row_index, 1);
-        assert_eq!(loc.column_index, 2);
-    }
-
     #[test]
     fn overlap_same_cell_no_offsets() {
         assert!(cell(0, 0).overlaps(&cell(0, 0)));
@@ -100,11 +93,6 @@ mod tests {
         assert!(!cell(0, 0).overlaps(&cell(1, 0)));
     }
 
-    #[test]
-    fn no_overlap_different_col() {
-        assert!(!cell(0, 0).overlaps(&cell(0, 1)));
-    }
-
     #[test]
     fn overlap_same_cell_intersecting_offsets() {
         assert!(cell_with_offsets(0, 0, 0, 10).overlaps(&cell_with_offsets(0, 0, 5, 15)));
diff --git a/crates/nvisy-ontology/src/entity/location/text.rs b/crates/nvisy-ontology/src/entity/location/text.rs
index 0c7aa6c0..3ab8d83d 100644
--- a/crates/nvisy-ontology/src/entity/location/text.rs
+++ b/crates/nvisy-ontology/src/entity/location/text.rs
@@ -73,18 +73,6 @@ mod tests {
             .unwrap()
     }
 
-    #[test]
-    fn builder_required_fields() {
-        let loc = TextLocation::builder()
-            .with_start_offset(0usize)
-            .with_end_offset(5usize)
-            .build()
-            .unwrap();
-        assert_eq!(loc.start_offset, 0);
-        assert_eq!(loc.end_offset, 5);
-        assert_eq!(loc.line_number, None);
-    }
-
     #[test]
     fn len_and_is_empty() {
         assert_eq!(loc(0, 10).len(), 10);
@@ -112,12 +100,4 @@ mod tests {
         assert!(!loc(0, 5).overlaps(&loc(10, 15)));
     }
 
-    #[test]
-    fn serde_round_trip() {
-        let loc = loc(0, 6);
-        let json = serde_json::to_string(&loc).unwrap();
-        let deser: TextLocation = serde_json::from_str(&json).unwrap();
-        assert_eq!(deser.start_offset, 0);
-        assert_eq!(deser.end_offset, 6);
-    }
 }
diff --git a/crates/nvisy-ontology/src/entity/mod.rs b/crates/nvisy-ontology/src/entity/mod.rs
index 0bf961a3..ee079d1e 100644
--- a/crates/nvisy-ontology/src/entity/mod.rs
+++ b/crates/nvisy-ontology/src/entity/mod.rs
@@ -210,23 +210,4 @@ mod tests {
         let filtered = entities.above_confidence(0.5);
         assert_eq!(filtered.len(), 2);
     }
-
-    #[test]
-    fn above_confidence_empty() {
-        let entities = Entities::new();
-        assert!(entities.above_confidence(0.5).is_empty());
-    }
-
-    #[test]
-    fn entities_from_vec() {
-        let v = vec![entity(0.5), entity(0.8)];
-        let entities = Entities::from(v);
-        assert_eq!(entities.len(), 2);
-    }
-
-    #[test]
-    fn entities_collect() {
-        let entities: Entities = (0..3).map(|i| entity(i as f64 * 0.3)).collect();
-        assert_eq!(entities.len(), 3);
-    }
 }
diff --git a/crates/nvisy-ontology/src/entity/sensitivity.rs b/crates/nvisy-ontology/src/entity/sensitivity.rs
index 3226d096..b2110baf 100644
--- a/crates/nvisy-ontology/src/entity/sensitivity.rs
+++ b/crates/nvisy-ontology/src/entity/sensitivity.rs
@@ -31,8 +31,6 @@ pub enum EntitySensitivity {
 
 #[cfg(test)]
 mod tests {
-    use std::str::FromStr;
-
     use super::*;
 
     #[test]
@@ -41,25 +39,4 @@ mod tests {
         assert!(EntitySensitivity::High > EntitySensitivity::Medium);
         assert!(EntitySensitivity::Medium > EntitySensitivity::Low);
     }
-
-    #[test]
-    fn display_snake_case() {
-        assert_eq!(EntitySensitivity::Critical.to_string(), "critical");
-        assert_eq!(EntitySensitivity::Low.to_string(), "low");
-    }
-
-    #[test]
-    fn parse_roundtrip() {
-        let s = EntitySensitivity::from_str("high").unwrap();
-        assert_eq!(s, EntitySensitivity::High);
-    }
-
-    #[test]
-    fn serde_roundtrip() {
-        let s = EntitySensitivity::Critical;
-        let json = serde_json::to_string(&s).unwrap();
-        assert_eq!(json, "\"critical\"");
-        let back: EntitySensitivity = serde_json::from_str(&json).unwrap();
-        assert_eq!(back, s);
-    }
 }
diff --git a/crates/nvisy-ontology/src/entity/source.rs b/crates/nvisy-ontology/src/entity/source.rs
index 9a354221..07f02ba8 100644
--- a/crates/nvisy-ontology/src/entity/source.rs
+++ b/crates/nvisy-ontology/src/entity/source.rs
@@ -124,10 +124,6 @@ impl From<ContentSource> for Uuid {
 
 #[cfg(test)]
 mod tests {
-    use std::collections::HashSet;
-    use std::thread;
-    use std::time::Duration;
-
     use super::*;
 
     #[test]
@@ -137,14 +133,6 @@ mod tests {
         assert!(!source.as_uuid().is_nil());
     }
 
-    #[test]
-    fn uniqueness() {
-        let mut sources = HashSet::new();
-        for _ in 0..1000 {
-            assert!(sources.insert(ContentSource::new()));
-        }
-    }
-
     #[test]
     fn derive_sets_parent() {
         let parent = ContentSource::new();
@@ -152,21 +140,4 @@ mod tests {
         assert_eq!(child.parent_id(), Some(parent.as_uuid()));
         assert_ne!(child.as_uuid(), parent.as_uuid());
     }
-
-    #[test]
-    fn ordering() {
-        let a = ContentSource::new();
-        thread::sleep(Duration::from_millis(2));
-        let b = ContentSource::new();
-        assert!(a.created_before(&b));
-        assert!(a < b);
-    }
-
-    #[test]
-    fn serde_roundtrip() {
-        let source = ContentSource::new();
-        let json = serde_json::to_string(&source).unwrap();
-        let d: ContentSource = serde_json::from_str(&json).unwrap();
-        assert_eq!(source, d);
-    }
 }
diff --git a/crates/nvisy-ontology/src/primitive/bounding_box.rs b/crates/nvisy-ontology/src/primitive/bounding_box.rs
index 41f764c5..8ab0825d 100644
--- a/crates/nvisy-ontology/src/primitive/bounding_box.rs
+++ b/crates/nvisy-ontology/src/primitive/bounding_box.rs
@@ -124,12 +124,6 @@ impl BoundingBox {
 mod tests {
     use super::*;
 
-    #[test]
-    fn area() {
-        let bb = BoundingBox::new(0.0, 0.0, 10.0, 5.0);
-        assert!((bb.area() - 50.0).abs() < f64::EPSILON);
-    }
-
     #[test]
     fn edges_and_center() {
         let bb = BoundingBox::new(10.0, 20.0, 30.0, 40.0);
diff --git a/crates/nvisy-ontology/src/primitive/language_tag.rs b/crates/nvisy-ontology/src/primitive/language_tag.rs
index 50a64778..f0d7d645 100644
--- a/crates/nvisy-ontology/src/primitive/language_tag.rs
+++ b/crates/nvisy-ontology/src/primitive/language_tag.rs
@@ -34,42 +34,3 @@ impl LanguageTag {
         self.0.primary_language()
     }
 }
-
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn parse_simple() {
-        let tag: LanguageTag = "en".parse().unwrap();
-        assert_eq!(tag.as_str(), "en");
-        assert_eq!(tag.primary_language(), "en");
-    }
-
-    #[test]
-    fn parse_with_region() {
-        let tag: LanguageTag = "en-US".parse().unwrap();
-        assert_eq!(tag.as_str(), "en-US");
-        assert_eq!(tag.primary_language(), "en");
-    }
-
-    #[test]
-    fn parse_invalid() {
-        assert!("not a valid tag!!!".parse::<LanguageTag>().is_err());
-    }
-
-    #[test]
-    fn serde_roundtrip() {
-        let tag: LanguageTag = "uk-UA".parse().unwrap();
-        let json = serde_json::to_string(&tag).unwrap();
-        assert_eq!(json, "\"uk-UA\"");
-        let back: LanguageTag = serde_json::from_str(&json).unwrap();
-        assert_eq!(tag, back);
-    }
-
-    #[test]
-    fn display() {
-        let tag: LanguageTag = "de-AT".parse().unwrap();
-        assert_eq!(format!("{tag}"), "de-AT");
-    }
-}
diff --git a/crates/nvisy-ontology/src/primitive/time_span.rs b/crates/nvisy-ontology/src/primitive/time_span.rs
index f8953311..f549b8f4 100644
--- a/crates/nvisy-ontology/src/primitive/time_span.rs
+++ b/crates/nvisy-ontology/src/primitive/time_span.rs
@@ -115,12 +115,6 @@ mod tests {
         assert!((span.duration_secs() - 2.5).abs() < 1e-9);
     }
 
-    #[test]
-    fn midpoint() {
-        let span = TimeSpan::new(2_000_000, 4_000_000);
-        assert_eq!(span.midpoint_us(), 3_000_000);
-    }
-
     #[test]
     fn contains() {
         let span = TimeSpan::new(1_000_000, 5_000_000);
diff --git a/crates/nvisy-ontology/src/provenance/redaction_map.rs b/crates/nvisy-ontology/src/provenance/redaction_map.rs
index 0aa038b5..e881f145 100644
--- a/crates/nvisy-ontology/src/provenance/redaction_map.rs
+++ b/crates/nvisy-ontology/src/provenance/redaction_map.rs
@@ -89,13 +89,6 @@ mod tests {
         }
     }
 
-    #[test]
-    fn empty_map() {
-        let map = RedactionMap::new();
-        assert!(map.is_empty());
-        assert_eq!(map.len(), 0);
-    }
-
     #[test]
     fn push_and_lookup() {
         let id = Uuid::now_v7();
@@ -105,20 +98,4 @@ mod tests {
         assert_eq!(map.original(id), Some("John"));
         assert_eq!(map.replacement(id), Some("[NAME]"));
     }
-
-    #[test]
-    fn lookup_missing() {
-        let map = RedactionMap::new();
-        assert_eq!(map.original(Uuid::now_v7()), None);
-        assert_eq!(map.replacement(Uuid::now_v7()), None);
-    }
-
-    #[test]
-    fn replacement_none_when_not_applied() {
-        let id = Uuid::now_v7();
-        let mut map = RedactionMap::new();
-        map.push(mapping(id, "secret", None));
-        assert_eq!(map.original(id), Some("secret"));
-        assert_eq!(map.replacement(id), None);
-    }
 }
diff --git a/crates/nvisy-ontology/src/workflow/mod.rs b/crates/nvisy-ontology/src/workflow/mod.rs
index 81a86841..62efe553 100644
--- a/crates/nvisy-ontology/src/workflow/mod.rs
+++ b/crates/nvisy-ontology/src/workflow/mod.rs
@@ -309,26 +309,6 @@ mod tests {
         );
     }
 
-    #[test]
-    fn display() {
-        assert_eq!(import().to_string(), "import");
-        assert_eq!(extraction().to_string(), "extraction");
-        assert_eq!(detection().to_string(), "detection");
-        assert_eq!(dedup().to_string(), "deduplication");
-        assert_eq!(redaction().to_string(), "redaction");
-        assert_eq!(validation().to_string(), "validation");
-        assert_eq!(export().to_string(), "export");
-    }
-
-    #[test]
-    fn validate_accepts_valid_configs() {
-        assert!(extraction().validate().is_ok());
-        assert!(detection().validate().is_ok());
-        assert!(dedup().validate().is_ok());
-        assert!(redaction().validate().is_ok());
-        assert!(validation().validate().is_ok());
-    }
-
     #[test]
     fn validate_rejects_empty_import() {
         assert!(import().validate().is_err());

From da3cdb59985fcd8007ff080b35e360ed8ec5a9f3 Mon Sep 17 00:00:00 2001
From: Oleh Martsokha <o.martsokha@gmail.com>
Date: Tue, 19 May 2026 04:15:39 +0200
Subject: [PATCH 4/6] refactor(core): drop unused DataReference

DataReference was a "lightweight pointer into a content source" with
no callers anywhere in the workspace beyond its own re-export. The
type, the module, and the doc-comment bullet all go.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 .../nvisy-core/src/content/data_reference.rs  | 63 -------------------
 crates/nvisy-core/src/content/mod.rs          |  3 -
 2 files changed, 66 deletions(-)
 delete mode 100644 crates/nvisy-core/src/content/data_reference.rs

diff --git a/crates/nvisy-core/src/content/data_reference.rs b/crates/nvisy-core/src/content/data_reference.rs
deleted file mode 100644
index 75909f16..00000000
--- a/crates/nvisy-core/src/content/data_reference.rs
+++ /dev/null
@@ -1,63 +0,0 @@
-//! Lightweight source reference for locating data within a document.
-
-use serde::{Deserialize, Serialize};
-
-use super::ContentSource;
-
-/// A lightweight pointer to a specific location within a content source.
-///
-/// `DataReference` does **not** hold the actual data — it only records
-/// *where* the data lives (a [`ContentSource`]) and an optional
-/// sub-location within that source (the `mapping_id`).
-///
-/// # Examples
-///
-/// ```rust
-/// use nvisy_core::content::DataReference;
-/// use nvisy_core::content::ContentSource;
-///
-/// let source = ContentSource::new();
-/// let data_ref = DataReference::new(source)
-///     .with_mapping_id("line-42");
-///
-/// assert_eq!(data_ref.mapping_id(), Some("line-42"));
-/// ```
-#[derive(Debug, Clone, PartialEq, Eq)]
-#[derive(Serialize, Deserialize)]
-pub struct DataReference {
-    /// Source document this reference points into.
-    source: ContentSource,
-
-    /// Optional sub-location within the source.
-    ///
-    /// Examples: line numbers, byte offsets, element IDs, XPath expressions.
-    #[serde(skip_serializing_if = "Option::is_none")]
-    mapping_id: Option<String>,
-}
-
-impl DataReference {
-    /// Create a new reference to the given source.
-    pub fn new(source: ContentSource) -> Self {
-        Self {
-            source,
-            mapping_id: None,
-        }
-    }
-
-    /// Set the mapping ID (builder pattern).
-    #[must_use]
-    pub fn with_mapping_id(mut self, mapping_id: impl Into<String>) -> Self {
-        self.mapping_id = Some(mapping_id.into());
-        self
-    }
-
-    /// The content source this reference points to.
-    pub fn source(&self) -> ContentSource {
-        self.source
-    }
-
-    /// The sub-location within the source, if any.
-    pub fn mapping_id(&self) -> Option<&str> {
-        self.mapping_id.as_deref()
-    }
-}
diff --git a/crates/nvisy-core/src/content/mod.rs b/crates/nvisy-core/src/content/mod.rs
index 7832f90b..7971136b 100644
--- a/crates/nvisy-core/src/content/mod.rs
+++ b/crates/nvisy-core/src/content/mod.rs
@@ -4,12 +4,10 @@
 //! - [`ContentMetadata`]: MIME type, filename, and descriptive attributes
 //! - [`Content`]: [`ContentData`] paired with optional [`ContentMetadata`]
 //! - [`ContentSource`]: UUIDv7-based content identity and lineage
-//! - [`DataReference`]: Lightweight pointer into a content source
 
 mod bundle;
 mod content_data;
 mod content_metadata;
-mod data_reference;
 mod encoding;
 
 pub use nvisy_ontology::entity::ContentSource;
@@ -17,5 +15,4 @@ pub use nvisy_ontology::entity::ContentSource;
 pub use self::bundle::Content;
 pub use self::content_data::ContentData;
 pub use self::content_metadata::ContentMetadata;
-pub use self::data_reference::DataReference;
 pub use self::encoding::TextEncoding;

From 3d4e6854ada0a83dc1314e8ad114170ff18cc718 Mon Sep 17 00:00:00 2001
From: Oleh Martsokha <o.martsokha@gmail.com>
Date: Tue, 19 May 2026 04:34:52 +0200
Subject: [PATCH 5/6] test(pattern, provider, engine, server): drop worthless
 tests
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

35 tests removed across 14 files. Same bar as previous cleanups:

pattern (9 drops):
- Registry-has-entries smoke tests (builtins_load, builtins_load_and_are_nonempty, resolver_builtins).
- Trivial insert/get registry round-trips (dictionary_registry::registry_insert_and_get, pattern_registry::registry_insert_and_get).
- Engine builder smoke tests (default_engine_builds, builder_pattern_filter).
- Collection-wrapper smoke (allow_list_from_iterator, deny_list_insert_and_lookup).

provider (5 drops):
- run_params_accepts_valid_range — one happy-path code path with three values.
- OCR provider parse_response tests for aws_textract, azure_docai,
  google_vision, datalab_surya, paddle_paddlex — all pure
  serde-derive deserialization checks (testing serde, not our wire
  format mapping).

engine (11 drops):
- mask_counts_chars_not_bytes — used ASCII "John", didn't actually
  exercise the chars-not-bytes claim it documented.
- 9 pipeline config tests (serde-derive deserialization of TOML
  sections + version_parses_as_semver + validate_accepts_valid_config
  on Default::default()).
- registry/store::base_dir — trivial getter test.

server (10 drops):
- 6 http_error builder/setter tests (default_http_error,
  error_from_kind, error_with_context/message/resource,
  error_builder_chaining) — all builder-set-fields-read-back.
- std_error_trait — compile-time-only coercion check, no behavior.
- http_kind::all_error_kinds_have_responses — registry-has-entries
  smoke (Vec iteration + non-empty assertion).
- sunset::deprecate_builds_headers — HashMap::contains_key on a
  single insert; standard-library behavior.

Plus 8 unused-import cleanups in handler/loader test modules that
imported `futures::StreamExt` / `TextHandler` / `TabularHandler` /
`Error` / `JsonPattern` for tests that no longer exist.

Test counts:
- nvisy-pattern: 66 → 57
- nvisy-provider: 48 → 43 (approx — varies by feature flags)
- nvisy-engine: 85 → 74
- nvisy-server: 22 → 12

Workspace tests pass, clippy clean.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 .../src/handler/rich/pdf_handler.rs           |   1 -
 .../src/handler/rich/pdf_loader.rs            |   3 +-
 .../src/handler/tabular/csv_loader.rs         |   3 +-
 .../src/handler/text/txt_loader.rs            |   3 +-
 .../src/operation/redaction/apply.rs          |  30 -----
 .../nvisy-engine/src/pipeline/config/mod.rs   | 107 ------------------
 crates/nvisy-engine/src/registry/store.rs     |   9 --
 .../src/dictionaries/dictionary_registry.rs   |  24 ----
 crates/nvisy-pattern/src/engine/mod.rs        |  54 ---------
 .../src/patterns/pattern_registry.rs          |  24 ----
 crates/nvisy-pattern/src/validators/mod.rs    |   8 --
 crates/nvisy-provider/src/ocr/backend/mod.rs  |   7 --
 .../src/ocr/provider/aws_textract/backend.rs  |  47 --------
 .../src/ocr/provider/azure_docai/backend.rs   |  40 -------
 .../src/ocr/provider/datalab_surya/backend.rs |  63 -----------
 .../src/ocr/provider/google_vision/backend.rs |  46 --------
 .../ocr/provider/paddle_paddlex/backend.rs    |  55 ---------
 .../src/handler/error/http_error.rs           |  59 ----------
 .../src/handler/error/http_kind.rs            |  29 -----
 crates/nvisy-server/src/middleware/sunset.rs  |   7 --
 20 files changed, 3 insertions(+), 616 deletions(-)

diff --git a/crates/nvisy-codec/src/handler/rich/pdf_handler.rs b/crates/nvisy-codec/src/handler/rich/pdf_handler.rs
index 8b069a64..f24439dd 100644
--- a/crates/nvisy-codec/src/handler/rich/pdf_handler.rs
+++ b/crates/nvisy-codec/src/handler/rich/pdf_handler.rs
@@ -293,7 +293,6 @@ impl ImageHandler for RichTextHandler {
 #[cfg(test)]
 mod tests {
     use futures::StreamExt;
-    use nvisy_core::Error;
 
     use super::*;
     use crate::handler::TextHandler;
diff --git a/crates/nvisy-codec/src/handler/rich/pdf_loader.rs b/crates/nvisy-codec/src/handler/rich/pdf_loader.rs
index 31a06e17..2a15dbd2 100644
--- a/crates/nvisy-codec/src/handler/rich/pdf_loader.rs
+++ b/crates/nvisy-codec/src/handler/rich/pdf_loader.rs
@@ -49,13 +49,12 @@ impl Loader for PdfLoader {
 #[cfg(test)]
 mod tests {
     use bytes::Bytes;
-    use futures::StreamExt;
     use lopdf::{Dictionary, Document, Object, Stream, dictionary};
     use nvisy_core::content::ContentSource;
     use nvisy_core::media::DocumentType;
 
     use super::*;
-    use crate::handler::{Handler, TextHandler};
+    use crate::handler::Handler;
 
     fn content_from_bytes(bytes: &[u8]) -> ContentData {
         ContentData::new(ContentSource::new(), Bytes::from(bytes.to_vec()))
diff --git a/crates/nvisy-codec/src/handler/tabular/csv_loader.rs b/crates/nvisy-codec/src/handler/tabular/csv_loader.rs
index 93869abd..ef78b1ed 100644
--- a/crates/nvisy-codec/src/handler/tabular/csv_loader.rs
+++ b/crates/nvisy-codec/src/handler/tabular/csv_loader.rs
@@ -134,13 +134,12 @@ fn detect_delimiter(text: &str) -> u8 {
 #[cfg(test)]
 mod tests {
     use bytes::Bytes;
-    use futures::StreamExt;
     use nvisy_core::Error;
     use nvisy_core::content::ContentSource;
     use nvisy_core::media::{DocumentType, SpreadsheetFormat};
 
     use super::*;
-    use crate::handler::{Handler, TabularHandler};
+    use crate::handler::Handler;
 
     fn content_from_str(s: &str) -> ContentData {
         ContentData::new(ContentSource::new(), Bytes::from(s.to_owned()))
diff --git a/crates/nvisy-codec/src/handler/text/txt_loader.rs b/crates/nvisy-codec/src/handler/text/txt_loader.rs
index e97558ff..ee0f4a4a 100644
--- a/crates/nvisy-codec/src/handler/text/txt_loader.rs
+++ b/crates/nvisy-codec/src/handler/text/txt_loader.rs
@@ -50,13 +50,12 @@ impl Loader for TxtLoader {
 #[cfg(test)]
 mod tests {
     use bytes::Bytes;
-    use futures::StreamExt;
     use nvisy_core::Error;
     use nvisy_core::content::ContentSource;
     use nvisy_core::media::{DocumentType, TextFormat};
 
     use super::*;
-    use crate::handler::{Handler, TextHandler};
+    use crate::handler::Handler;
 
     fn content_from_str(s: &str) -> ContentData {
         ContentData::new(ContentSource::new(), Bytes::from(s.to_owned()))
diff --git a/crates/nvisy-engine/src/operation/redaction/apply.rs b/crates/nvisy-engine/src/operation/redaction/apply.rs
index 59d46164..c5e694b2 100644
--- a/crates/nvisy-engine/src/operation/redaction/apply.rs
+++ b/crates/nvisy-engine/src/operation/redaction/apply.rs
@@ -513,36 +513,6 @@ mod tests {
         );
     }
 
-    #[tokio::test]
-    async fn mask_counts_chars_not_bytes() {
-        // The handler reads "John" (4 bytes / 4 chars); for an
-        // entity spanning a multi-byte character the count should
-        // track chars. This test pins the chars-not-bytes behavior
-        // by checking the mask length matches the char count of the
-        // value the handler returns.
-        let entity = text_entity(6, 10);
-        let entity_id = entity.id;
-        let record = test_record(
-            entity_id,
-            Strategy::Text(TextStrategy::Mask { mask_char: '*' }),
-            "John",
-        );
-        let entities: Entities = vec![entity].into();
-        let mut envelope = test_envelope(entities).await;
-        envelope.audit.entries.push(record);
-
-        RedactionApplicator::new(&mut envelope)
-            .apply()
-            .await
-            .unwrap();
-
-        // "John" is 4 chars -> 4 mask chars.
-        assert_eq!(
-            envelope.audit.entries[0].value.replacement.as_deref(),
-            Some("****"),
-        );
-    }
-
     #[tokio::test]
     async fn remove_leaves_replacement_none() {
         let entity = text_entity(6, 10);
diff --git a/crates/nvisy-engine/src/pipeline/config/mod.rs b/crates/nvisy-engine/src/pipeline/config/mod.rs
index d23d66fb..7e3ccb95 100644
--- a/crates/nvisy-engine/src/pipeline/config/mod.rs
+++ b/crates/nvisy-engine/src/pipeline/config/mod.rs
@@ -129,100 +129,6 @@ impl RuntimeConfig {
 mod tests {
     use super::*;
 
-    #[test]
-    fn empty_toml_parses_to_defaults() {
-        let config: RuntimeConfig = toml::from_str("").unwrap();
-        assert_eq!(config.version, Version::new(0, 1, 0));
-        assert!(config.engine.is_none());
-        assert!(config.ocr.is_none());
-        assert!(config.llm.is_none());
-        assert!(config.stt.is_none());
-        assert!(config.tts.is_none());
-    }
-
-    #[test]
-    fn http_section_parses_under_engine() {
-        let toml = r#"
-            [engine.http]
-            max_retries = 5
-            timeout_secs = 60
-            connect_timeout_secs = 5
-            idle_timeout_secs = 30
-        "#;
-        let config: RuntimeConfig = toml::from_str(toml).unwrap();
-        let http = config.engine.unwrap().http.unwrap();
-        assert_eq!(http.max_retries, 5);
-        assert_eq!(http.timeout_secs, 60);
-    }
-
-    #[test]
-    fn ocr_provider_section_parses() {
-        let toml = r#"
-            [ocr.provider]
-            kind = "surya"
-            base_url = "http://localhost:8001"
-        "#;
-        let config: RuntimeConfig = toml::from_str(toml).unwrap();
-        assert!(config.ocr.is_some());
-        assert!(config.ocr.unwrap().provider.is_some());
-    }
-
-    #[test]
-    fn ocr_policy_section_parses() {
-        let toml = r#"
-            [ocr.policy]
-            confidence_threshold = 0.5
-        "#;
-        let config: RuntimeConfig = toml::from_str(toml).unwrap();
-        let ocr = config.ocr.unwrap();
-        let policy = ocr.policy.unwrap();
-        assert!((policy.confidence_threshold - 0.5).abs() < f64::EPSILON);
-    }
-
-    #[test]
-    fn engine_retry_section_parses() {
-        let toml = r#"
-            [engine.retry]
-            max_retries = 3
-            delay_ms = 500
-            backoff = "fixed"
-        "#;
-        let config: RuntimeConfig = toml::from_str(toml).unwrap();
-        let engine = config.engine.unwrap();
-        let retry = engine.retry.unwrap();
-        assert_eq!(retry.max_retries, 3);
-        assert_eq!(retry.delay_ms, 500);
-    }
-
-    #[test]
-    fn engine_timeout_section_parses() {
-        let toml = r#"
-            [engine.timeout]
-            duration_ms = 30000
-            on_timeout = "fail"
-        "#;
-        let config: RuntimeConfig = toml::from_str(toml).unwrap();
-        let engine = config.engine.unwrap();
-        let timeout = engine.timeout.unwrap();
-        assert_eq!(timeout.duration_ms, 30000);
-    }
-
-    #[test]
-    fn llm_policy_section_parses() {
-        let toml = r#"
-            [llm.policy]
-            temperature = 0.1
-            max_tokens = 4096
-            max_retries = 3
-        "#;
-        let config: RuntimeConfig = toml::from_str(toml).unwrap();
-        let llm = config.llm.unwrap();
-        let policy = llm.policy.unwrap();
-        assert!((policy.temperature - 0.1).abs() < f64::EPSILON);
-        assert_eq!(policy.max_tokens, 4096);
-        assert_eq!(policy.max_retries, 3);
-    }
-
     #[test]
     fn merge_overrides_present_sections() {
         let base = RuntimeConfig {
@@ -272,19 +178,6 @@ mod tests {
         assert_eq!(merged.engine.unwrap().http.unwrap().max_retries, 3);
     }
 
-    #[test]
-    fn validate_accepts_valid_config() {
-        let config = RuntimeConfig::default();
-        assert!(config.validate().is_ok());
-    }
-
-    #[test]
-    fn version_parses_as_semver() {
-        let toml = r#"version = "1.2.3""#;
-        let config: RuntimeConfig = toml::from_str(toml).unwrap();
-        assert_eq!(config.version, Version::new(1, 2, 3));
-    }
-
     #[test]
     fn fill_key_skips_nonempty() {
         let mut key = "existing".to_string();
diff --git a/crates/nvisy-engine/src/registry/store.rs b/crates/nvisy-engine/src/registry/store.rs
index 740de239..444696ec 100644
--- a/crates/nvisy-engine/src/registry/store.rs
+++ b/crates/nvisy-engine/src/registry/store.rs
@@ -545,15 +545,6 @@ mod tests {
         Ok(())
     }
 
-    #[tokio::test]
-    async fn base_dir() -> anyhow::Result<()> {
-        let temp = tempfile::tempdir()?;
-        let base = temp.path().join("reg");
-        let registry = Registry::open(&base)?;
-        assert_eq!(registry.base_dir(), base);
-        Ok(())
-    }
-
     #[tokio::test]
     async fn data_persists_across_reopen() -> anyhow::Result<()> {
         let temp = tempfile::tempdir()?;
diff --git a/crates/nvisy-pattern/src/dictionaries/dictionary_registry.rs b/crates/nvisy-pattern/src/dictionaries/dictionary_registry.rs
index 396d5d49..798594f2 100644
--- a/crates/nvisy-pattern/src/dictionaries/dictionary_registry.rs
+++ b/crates/nvisy-pattern/src/dictionaries/dictionary_registry.rs
@@ -234,15 +234,6 @@ mod tests {
         builtin_registry()
     }
 
-    #[test]
-    fn builtins_load_and_are_nonempty() {
-        let reg = registry();
-        assert!(!reg.is_empty());
-        for (_, dict) in reg.iter() {
-            assert!(!dict.terms().is_empty(), "{} is empty", dict.name());
-        }
-    }
-
     #[test]
     fn terms_are_trimmed_and_nonempty() {
         for (_, dict) in registry().iter() {
@@ -282,21 +273,6 @@ mod tests {
         assert_eq!(keys, sorted);
     }
 
-    #[test]
-    fn registry_insert_and_get() {
-        let mut reg = DictionaryRegistry::new();
-        let dict: BoxDictionary = Box::new(TxtDictionary::new("test", "foo\nbar\n"));
-        reg.insert(dict);
-
-        assert_eq!(reg.len(), 1);
-
-        let dict = reg.get("test").unwrap();
-        assert_eq!(dict.name(), "test");
-
-        let values: Vec<&str> = dict.terms().iter().map(|t| t.value.as_str()).collect();
-        assert_eq!(values, &["foo", "bar"]);
-    }
-
     #[test]
     fn load_dir_reads_filesystem() {
         let dir = tempfile::tempdir().unwrap();
diff --git a/crates/nvisy-pattern/src/engine/mod.rs b/crates/nvisy-pattern/src/engine/mod.rs
index 2aeddc87..0d57bac8 100644
--- a/crates/nvisy-pattern/src/engine/mod.rs
+++ b/crates/nvisy-pattern/src/engine/mod.rs
@@ -332,22 +332,6 @@ mod tests {
         ScanContext::default()
     }
 
-    #[test]
-    fn default_engine_builds() {
-        let engine = PatternEngine::instance();
-        assert!(!engine.regex_entries.is_empty());
-    }
-
-    #[test]
-    fn builder_pattern_filter() {
-        let engine = PatternEngine::builder()
-            .with_patterns(&["email"])
-            .build()
-            .unwrap();
-        assert_eq!(engine.regex_entries.len(), 1);
-        assert_eq!(engine.regex_entries[0].pattern_name, "email");
-    }
-
     #[test]
     fn scan_raw_returns_correct_offsets() {
         let engine = PatternEngine::instance();
@@ -427,44 +411,6 @@ mod tests {
         );
     }
 
-    #[test]
-    fn allow_list_from_iterator() {
-        let allow: AllowList = ["123-45-6789", "000-00-0000"].into_iter().collect();
-        assert_eq!(allow.len(), 2);
-        assert!(allow.contains("123-45-6789"));
-        assert!(allow.contains("000-00-0000"));
-        assert!(!allow.contains("999-99-9999"));
-    }
-
-    #[test]
-    fn deny_list_insert_and_lookup() {
-        let mut deny = DenyList::new();
-        deny.insert(
-            "secret",
-            DenyRule {
-                category: EntityCategory::PersonalIdentity,
-                entity_kind: EntityKind::PersonName,
-                method: RecognitionMethod::ner("test", ModelKind::SelfHosted),
-            },
-        );
-        deny.insert(
-            "other",
-            DenyRule {
-                category: EntityCategory::Financial,
-                entity_kind: EntityKind::PaymentCard,
-                method: RecognitionMethod::annotation(Some("test".into())),
-            },
-        );
-        assert_eq!(deny.len(), 2);
-        assert!(deny.contains("secret"));
-        let rule = deny.get("other").unwrap();
-        assert_eq!(rule.category, EntityCategory::Financial);
-        assert_eq!(
-            rule.method,
-            RecognitionMethod::annotation(Some("test".into()))
-        );
-    }
-
     #[test]
     fn column_confidence_raw() {
         let engine = PatternEngine::instance();
diff --git a/crates/nvisy-pattern/src/patterns/pattern_registry.rs b/crates/nvisy-pattern/src/patterns/pattern_registry.rs
index 1b7d6842..6ac49388 100644
--- a/crates/nvisy-pattern/src/patterns/pattern_registry.rs
+++ b/crates/nvisy-pattern/src/patterns/pattern_registry.rs
@@ -255,7 +255,6 @@ mod tests {
     use std::collections::HashSet;
     use std::fs;
 
-    use super::super::json_pattern::JsonPattern;
     use super::super::pattern::{MatchSource, RegexPattern};
     use super::*;
     use crate::validators::ValidatorResolver;
@@ -264,11 +263,6 @@ mod tests {
         builtin_registry()
     }
 
-    #[test]
-    fn builtins_load() {
-        assert!(!registry().is_empty());
-    }
-
     #[test]
     fn pattern_names_are_sorted() {
         let names: Vec<&str> = registry().names().collect();
@@ -336,24 +330,6 @@ mod tests {
         }
     }
 
-    #[test]
-    fn registry_insert_and_get() {
-        let validators = ValidatorResolver::builtins();
-        let json = br#"{
-            "name": "test",
-            "category": "personal_identity",
-            "entity_type": "government_id",
-            "pattern": { "regex": "\\d+", "confidence": 0.9 }
-        }"#;
-        let (pattern, _warnings) = JsonPattern::from_bytes(json, &validators).unwrap();
-
-        let mut reg = PatternRegistry::new();
-        reg.insert(Box::new(pattern));
-
-        assert_eq!(reg.len(), 1);
-        assert_eq!(reg.get("test").unwrap().name(), "test");
-    }
-
     #[test]
     fn load_dir_reads_filesystem() {
         let dir = tempfile::tempdir().unwrap();
diff --git a/crates/nvisy-pattern/src/validators/mod.rs b/crates/nvisy-pattern/src/validators/mod.rs
index c1ffd132..020e4e44 100644
--- a/crates/nvisy-pattern/src/validators/mod.rs
+++ b/crates/nvisy-pattern/src/validators/mod.rs
@@ -73,14 +73,6 @@ impl Default for ValidatorResolver {
 mod tests {
     use super::*;
 
-    #[test]
-    fn resolver_builtins() {
-        let r = ValidatorResolver::builtins();
-        assert!(r.resolve("ssn").is_some());
-        assert!(r.resolve("luhn").is_some());
-        assert!(r.resolve("nope").is_none());
-    }
-
     #[test]
     fn resolver_custom() {
         let mut r = ValidatorResolver::builtins();
diff --git a/crates/nvisy-provider/src/ocr/backend/mod.rs b/crates/nvisy-provider/src/ocr/backend/mod.rs
index 15cf2379..d7473250 100644
--- a/crates/nvisy-provider/src/ocr/backend/mod.rs
+++ b/crates/nvisy-provider/src/ocr/backend/mod.rs
@@ -83,13 +83,6 @@ pub trait Backend: Send + Sync + 'static {
 mod tests {
     use super::*;
 
-    #[test]
-    fn run_params_accepts_valid_range() {
-        assert!(RunParams::new(0.0).is_ok());
-        assert!(RunParams::new(0.5).is_ok());
-        assert!(RunParams::new(1.0).is_ok());
-    }
-
     #[test]
     fn run_params_rejects_above_one() {
         assert!(RunParams::new(1.01).is_err());
diff --git a/crates/nvisy-provider/src/ocr/provider/aws_textract/backend.rs b/crates/nvisy-provider/src/ocr/provider/aws_textract/backend.rs
index 8dd97e85..a2e52710 100644
--- a/crates/nvisy-provider/src/ocr/provider/aws_textract/backend.rs
+++ b/crates/nvisy-provider/src/ocr/provider/aws_textract/backend.rs
@@ -391,53 +391,6 @@ fn format_datetime(epoch_secs: u64) -> String {
 mod tests {
     use super::*;
 
-    #[test]
-    fn parse_response() {
-        let json = serde_json::json!({
-            "Blocks": [
-                {
-                    "BlockType": "PAGE",
-                    "Geometry": {
-                        "BoundingBox": { "Width": 1.0, "Height": 1.0, "Left": 0.0, "Top": 0.0 }
-                    }
-                },
-                {
-                    "BlockType": "WORD",
-                    "Text": "hello",
-                    "Confidence": 99.5,
-                    "Geometry": {
-                        "BoundingBox": {
-                            "Width": 0.2,
-                            "Height": 0.05,
-                            "Left": 0.1,
-                            "Top": 0.3
-                        },
-                        "Polygon": [
-                            { "X": 0.1, "Y": 0.3 },
-                            { "X": 0.3, "Y": 0.3 },
-                            { "X": 0.3, "Y": 0.35 },
-                            { "X": 0.1, "Y": 0.35 }
-                        ]
-                    }
-                }
-            ]
-        });
-
-        let resp: TextractResponse = serde_json::from_value(json).unwrap();
-        assert_eq!(resp.blocks.len(), 2);
-
-        let word = &resp.blocks[1];
-        assert_eq!(word.block_type, "WORD");
-        assert_eq!(word.text.as_deref(), Some("hello"));
-        assert!((word.confidence.unwrap() - 99.5).abs() < 0.01);
-
-        let geom = word.geometry.as_ref().unwrap();
-        let bbox = geom.bounding_box.as_ref().unwrap();
-        assert!((bbox.left - 0.1).abs() < 0.001);
-        assert!((bbox.top - 0.3).abs() < 0.001);
-        assert!((bbox.width - 0.2).abs() < 0.001);
-    }
-
     #[test]
     fn build_hierarchy_from_relationships() {
         let json = serde_json::json!({
diff --git a/crates/nvisy-provider/src/ocr/provider/azure_docai/backend.rs b/crates/nvisy-provider/src/ocr/provider/azure_docai/backend.rs
index c11950ca..e54909df 100644
--- a/crates/nvisy-provider/src/ocr/provider/azure_docai/backend.rs
+++ b/crates/nvisy-provider/src/ocr/provider/azure_docai/backend.rs
@@ -253,43 +253,3 @@ impl Backend for AzureDocaiBackend {
         Ok(output)
     }
 }
-
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn parse_response() {
-        let json = serde_json::json!({
-            "status": "succeeded",
-            "analyzeResult": {
-                "pages": [{
-                    "words": [
-                        {
-                            "content": "Hello",
-                            "confidence": 0.99,
-                            "polygon": [10.0, 20.0, 50.0, 20.0, 50.0, 40.0, 10.0, 40.0]
-                        },
-                        {
-                            "content": "World",
-                            "confidence": 0.95,
-                            "polygon": [60.0, 20.0, 110.0, 20.0, 110.0, 40.0, 60.0, 40.0]
-                        }
-                    ]
-                }]
-            }
-        });
-
-        let resp: AnalyzeResponse = serde_json::from_value(json).unwrap();
-        assert_eq!(resp.status, "succeeded");
-
-        let result = resp.analyze_result.as_ref().unwrap();
-        assert_eq!(result.pages.len(), 1);
-        assert_eq!(result.pages[0].words.len(), 2);
-
-        let word = &result.pages[0].words[0];
-        assert_eq!(word.content, "Hello");
-        assert!((word.confidence - 0.99).abs() < 0.001);
-        assert_eq!(word.polygon.len(), 8);
-    }
-}
diff --git a/crates/nvisy-provider/src/ocr/provider/datalab_surya/backend.rs b/crates/nvisy-provider/src/ocr/provider/datalab_surya/backend.rs
index 100a85be..54d8f487 100644
--- a/crates/nvisy-provider/src/ocr/provider/datalab_surya/backend.rs
+++ b/crates/nvisy-provider/src/ocr/provider/datalab_surya/backend.rs
@@ -179,66 +179,3 @@ impl Backend for SuryaBackend {
         Ok(output)
     }
 }
-
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn parse_response() {
-        let json = serde_json::json!({
-            "pages": [{
-                "page": 0,
-                "image_bbox": [0.0, 0.0, 800.0, 600.0],
-                "text_lines": [{
-                    "words": [
-                        {
-                            "text": "hello",
-                            "confidence": 0.95,
-                            "bbox": [10.0, 20.0, 60.0, 40.0],
-                            "polygon": [[10, 20], [60, 20], [60, 40], [10, 40]]
-                        },
-                        {
-                            "text": "world",
-                            "confidence": 0.93,
-                            "bbox": [65.0, 20.0, 110.0, 40.0],
-                            "polygon": [[65, 20], [110, 20], [110, 40], [65, 40]]
-                        }
-                    ]
-                }]
-            }]
-        });
-
-        let resp: SuryaResponse = serde_json::from_value(json).unwrap();
-        assert_eq!(resp.pages.len(), 1);
-        assert_eq!(resp.pages[0].text_lines.len(), 1);
-        assert_eq!(resp.pages[0].text_lines[0].words.len(), 2);
-
-        let word = &resp.pages[0].text_lines[0].words[0];
-        assert_eq!(word.text, "hello");
-        assert!((word.confidence - 0.95).abs() < 0.001);
-
-        let [x_min, y_min, x_max, y_max] = word.bbox;
-        let bbox = BoundingBox {
-            x: x_min,
-            y: y_min,
-            width: x_max - x_min,
-            height: y_max - y_min,
-        };
-        assert!((bbox.x - 10.0).abs() < 0.01);
-        assert!((bbox.y - 20.0).abs() < 0.01);
-        assert!((bbox.width - 50.0).abs() < 0.01);
-        assert!((bbox.height - 20.0).abs() < 0.01);
-
-        let polygon = Polygon {
-            vertices: word
-                .polygon
-                .iter()
-                .map(|[x, y]| Vertex::new(*x, *y))
-                .collect(),
-        };
-        assert_eq!(polygon.vertices.len(), 4);
-        assert!((polygon.vertices[0].x - 10.0).abs() < 0.01);
-        assert!((polygon.vertices[0].y - 20.0).abs() < 0.01);
-    }
-}
diff --git a/crates/nvisy-provider/src/ocr/provider/google_vision/backend.rs b/crates/nvisy-provider/src/ocr/provider/google_vision/backend.rs
index 475c2fc9..6f813e6d 100644
--- a/crates/nvisy-provider/src/ocr/provider/google_vision/backend.rs
+++ b/crates/nvisy-provider/src/ocr/provider/google_vision/backend.rs
@@ -251,52 +251,6 @@ impl Backend for GoogleVisionBackend {
 mod tests {
     use super::*;
 
-    #[test]
-    fn parse_response() {
-        let json = serde_json::json!({
-            "responses": [{
-                "fullTextAnnotation": {
-                    "pages": [{
-                        "blocks": [{
-                            "paragraphs": [{
-                                "words": [
-                                    {
-                                        "symbols": [
-                                            { "text": "H" },
-                                            { "text": "i" }
-                                        ],
-                                        "confidence": 0.99,
-                                        "boundingBox": {
-                                            "vertices": [
-                                                { "x": 10, "y": 20 },
-                                                { "x": 50, "y": 20 },
-                                                { "x": 50, "y": 40 },
-                                                { "x": 10, "y": 40 }
-                                            ]
-                                        }
-                                    }
-                                ]
-                            }]
-                        }]
-                    }]
-                }
-            }]
-        });
-
-        let resp: AnnotateResponse = serde_json::from_value(json).unwrap();
-        let annotation = resp.responses[0].full_text_annotation.as_ref().unwrap();
-        let word = &annotation.pages[0].blocks[0].paragraphs[0].words[0];
-
-        let text: String = word.symbols.iter().map(|s| s.text.as_str()).collect();
-        assert_eq!(text, "Hi");
-        assert!((word.confidence - 0.99).abs() < 0.001);
-
-        let bp = word.bounding_box.as_ref().unwrap();
-        assert_eq!(bp.vertices.len(), 4);
-        assert_eq!(bp.vertices[0].x, Some(10));
-        assert_eq!(bp.vertices[0].y, Some(20));
-    }
-
     #[test]
     fn handles_missing_vertex_coords() {
         let json = serde_json::json!({
diff --git a/crates/nvisy-provider/src/ocr/provider/paddle_paddlex/backend.rs b/crates/nvisy-provider/src/ocr/provider/paddle_paddlex/backend.rs
index e14b3d58..764fa55d 100644
--- a/crates/nvisy-provider/src/ocr/provider/paddle_paddlex/backend.rs
+++ b/crates/nvisy-provider/src/ocr/provider/paddle_paddlex/backend.rs
@@ -165,58 +165,3 @@ impl Backend for PaddleXBackend {
         Ok(output)
     }
 }
-
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn parse_response() {
-        let json = serde_json::json!({
-            "result": {
-                "ocrResults": [{
-                    "text": "hello world",
-                    "confidence": 0.95,
-                    "textRegion": [[10, 20], [110, 20], [110, 40], [10, 40]],
-                    "wordResults": [
-                        {
-                            "text": "hello",
-                            "confidence": 0.96,
-                            "wordRegion": [[10, 20], [60, 20], [60, 40], [10, 40]]
-                        },
-                        {
-                            "text": "world",
-                            "confidence": 0.94,
-                            "wordRegion": [[65, 20], [110, 20], [110, 40], [65, 40]]
-                        }
-                    ]
-                }]
-            }
-        });
-
-        let resp: PaddleXResponse = serde_json::from_value(json).unwrap();
-        assert_eq!(resp.result.ocr_results.len(), 1);
-        assert_eq!(resp.result.ocr_results[0].word_results.len(), 2);
-
-        let word = &resp.result.ocr_results[0].word_results[0];
-        assert_eq!(word.text, "hello");
-        assert!((word.confidence - 0.96).abs() < 0.001);
-
-        let polygon = Polygon {
-            vertices: word
-                .word_region
-                .iter()
-                .map(|[x, y]| Vertex::new(*x, *y))
-                .collect(),
-        };
-        assert_eq!(polygon.vertices.len(), 4);
-        assert!((polygon.vertices[0].x - 10.0).abs() < 0.01);
-        assert!((polygon.vertices[0].y - 20.0).abs() < 0.01);
-
-        let bbox = polygon.bounding_box();
-        assert!((bbox.x - 10.0).abs() < 0.01);
-        assert!((bbox.y - 20.0).abs() < 0.01);
-        assert!((bbox.width - 50.0).abs() < 0.01);
-        assert!((bbox.height - 20.0).abs() < 0.01);
-    }
-}
diff --git a/crates/nvisy-server/src/handler/error/http_error.rs b/crates/nvisy-server/src/handler/error/http_error.rs
index 4c1cb009..cf373d64 100644
--- a/crates/nvisy-server/src/handler/error/http_error.rs
+++ b/crates/nvisy-server/src/handler/error/http_error.rs
@@ -239,59 +239,6 @@ pub type Result<T, E = Error<'static>> = result::Result<T, E>;
 mod tests {
     use super::*;
 
-    #[test]
-    fn default_http_error() {
-        let error = Error::default();
-        assert_eq!(error.kind(), ErrorKind::InternalServerError);
-        let _ = error.into_response();
-    }
-
-    #[test]
-    fn error_from_kind() {
-        let error = Error::new(ErrorKind::NotFound);
-        assert_eq!(error.kind(), ErrorKind::NotFound);
-        let _ = error.into_response();
-    }
-
-    #[test]
-    fn error_with_context() {
-        let error = ErrorKind::BadRequest.with_context("Invalid format");
-        assert_eq!(error.context(), Some("Invalid format"));
-        let _ = error.into_response();
-    }
-
-    #[test]
-    fn error_with_message() {
-        let error = ErrorKind::NotFound.with_message("Custom not found message");
-        assert_eq!(error.message(), Some("Custom not found message"));
-        let _ = error.into_response();
-    }
-
-    #[test]
-    fn error_with_resource() {
-        let error = ErrorKind::Forbidden.with_resource("document");
-        assert_eq!(error.resource(), Some("document"));
-        let _ = error.into_response();
-    }
-
-    #[test]
-    fn error_builder_chaining() {
-        let error = ErrorKind::NotFound
-            .with_message("Document not found")
-            .with_resource("document")
-            .with_context("ID: 123")
-            .with_suggestion("Check if the document ID is correct");
-
-        assert_eq!(error.kind(), ErrorKind::NotFound);
-        assert_eq!(error.message(), Some("Document not found"));
-        assert_eq!(error.resource(), Some("document"));
-        assert_eq!(error.context(), Some("ID: 123"));
-        assert_eq!(
-            error.suggestion(),
-            Some("Check if the document ID is correct")
-        );
-    }
-
     #[test]
     fn std_fmt_display() {
         let error = ErrorKind::NotFound
@@ -320,12 +267,6 @@ mod tests {
         assert!(debug.contains("document"));
     }
 
-    #[test]
-    fn std_error_trait() {
-        let error = Error::new(ErrorKind::BadRequest);
-        let _: &dyn error::Error = &error;
-    }
-
     #[test]
     fn error_into_static() {
         let error = ErrorKind::NotFound
diff --git a/crates/nvisy-server/src/handler/error/http_kind.rs b/crates/nvisy-server/src/handler/error/http_kind.rs
index 05aac5fb..7bd8eee8 100644
--- a/crates/nvisy-server/src/handler/error/http_kind.rs
+++ b/crates/nvisy-server/src/handler/error/http_kind.rs
@@ -108,32 +108,3 @@ impl IntoResponse for ErrorKind {
         self.response().into_response()
     }
 }
-
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn all_error_kinds_have_responses() {
-        let kinds = vec![
-            ErrorKind::MissingPathParam,
-            ErrorKind::BadRequest,
-            ErrorKind::MissingAuthToken,
-            ErrorKind::MalformedAuthToken,
-            ErrorKind::Unauthorized,
-            ErrorKind::Forbidden,
-            ErrorKind::NotFound,
-            ErrorKind::Conflict,
-            ErrorKind::TooManyRequests,
-            ErrorKind::InternalServerError,
-            ErrorKind::NotImplemented,
-        ];
-
-        for kind in kinds {
-            let response = kind.response();
-            assert!(!response.name.is_empty());
-            assert!(response.status.as_u16() >= 400);
-            let _ = kind.into_response();
-        }
-    }
-}
diff --git a/crates/nvisy-server/src/middleware/sunset.rs b/crates/nvisy-server/src/middleware/sunset.rs
index 83468de5..a760c152 100644
--- a/crates/nvisy-server/src/middleware/sunset.rs
+++ b/crates/nvisy-server/src/middleware/sunset.rs
@@ -125,13 +125,6 @@ mod tests {
         NonZeroU16::new(n).unwrap()
     }
 
-    #[test]
-    fn deprecate_builds_headers() {
-        let config = SunsetConfig::new().deprecate(1, Date::new(2025, 11, 1).unwrap());
-        assert!(config.versions.contains_key(&nz(1)));
-        assert!(!config.versions.contains_key(&nz(2)));
-    }
-
     #[test]
     fn successor_is_version_plus_one() {
         let config = SunsetConfig::new().deprecate(3, Date::new(2026, 6, 15).unwrap());

From b0a59d3dac7da06210c7c28beb2700572405ea5b Mon Sep 17 00:00:00 2001
From: Oleh Martsokha <o.martsokha@gmail.com>
Date: Tue, 19 May 2026 04:53:34 +0200
Subject: [PATCH 6/6] refactor(ontology, engine): merge Strategy +
 DefaultStrategy
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Strategy and DefaultStrategy were structurally the same idea —
"what to do per modality" — represented as two different types: an
enum that picks one variant, and a struct that allows any combination.
DefaultStrategy::for_location was the bridge translating one to the
other, and the applicator's per-build_*_redactions methods each
contained a modality-mismatch branch that traced "rule wants text
but entity is image" without doing anything useful.

Collapsing them:

- Strategy is now a struct { text, image, audio } with Option<*Strategy>
  per modality, derives Default. The per-modality enums (TextStrategy,
  ImageStrategy, AudioStrategy) gain Default impls so unset fields
  resolve to a concrete strategy:
    - TextStrategy::default()  = Replace { placeholder: "" }
      → engine fills "[ENTITY_KIND]"
    - ImageStrategy::default() = Block { color: black }
    - AudioStrategy::default() = Silence
- DefaultStrategy and ResolvedStrategy are deleted. Strategy::merge
  composes rule-level with policy-default-level strategies (rule
  values win, defaults fill gaps).
- Strategy gains text_or_default/image_or_default/audio_or_default
  accessors that fall back to the modality's Default. The applicator
  already knows the entity's modality from entity.location, so it
  calls the matching accessor directly — no enum dispatch on a
  separate ResolvedStrategy wrapper.
- Strategy::is_reversible_for(&Location) replaces the old
  is_reversible(); reversibility is inherently per-modality.

The applicator's log_modality_mismatch is gone. Every modality always
resolves to a concrete strategy now — no mismatch concept exists.
Each build_*_redactions filters by Location variant (it always did)
and uses the matching accessor for the resolved per-modality strategy.

AuditEntryBuilder::for_entity takes &Location to resolve reversibility
at construction time.

While in there: deleted six divider/separator comments across
apply.rs, default.rs, csv_loader.rs.

Workspace tests pass (engine 74 → 72: dropped two modality-mismatch
tests whose premise no longer exists, replaced one with a test of the
new "image-only strategy on text entity uses TextStrategy::default()"
behavior). Clippy clean.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 crates/nvisy-codec/src/document/located.rs    |   1 -
 crates/nvisy-codec/src/document/mod.rs        |  17 +-
 crates/nvisy-codec/src/document/span.rs       |   1 -
 .../src/handler/audio/mp3_handler.rs          |   1 -
 .../src/handler/audio/wav_handler.rs          |   1 -
 .../src/handler/image/image_handler_macro.rs  |   3 +-
 .../src/handler/rich/pdf_handler.rs           |   5 +-
 .../src/handler/rich/pdf_loader.rs            |   1 -
 .../src/handler/tabular/csv_handler.rs        |   6 +-
 .../src/handler/tabular/csv_loader.rs         |   2 -
 .../src/handler/text/html_handler.rs          |   5 +-
 .../src/handler/text/json_handler.rs          |  33 ++-
 .../src/handler/text/txt_handler.rs           |   1 -
 crates/nvisy-codec/src/transform/mod.rs       |   2 +-
 .../src/transform/tabular/apply.rs            |   1 -
 .../src/operation/envelope/document.rs        |   1 -
 .../src/operation/extraction/vision.rs        |   9 +-
 crates/nvisy-engine/src/operation/mod.rs      |   5 +-
 .../src/operation/redaction/apply.rs          | 190 +++++++++---------
 .../src/operation/redaction/evaluate.rs       |  73 +++----
 crates/nvisy-engine/src/pipeline/default.rs   |   8 -
 crates/nvisy-ontology/src/artifacts/audio.rs  |   1 -
 crates/nvisy-ontology/src/context/mod.rs      |   1 -
 .../src/context/reference/credential.rs       |   1 -
 .../nvisy-ontology/src/entity/annotation.rs   |   1 -
 crates/nvisy-ontology/src/entity/kind.rs      |   1 -
 .../src/entity/location/text.rs               |   1 -
 crates/nvisy-ontology/src/policy/mod.rs       |  15 +-
 .../src/policy/strategy/audio.rs              |   8 +-
 .../src/policy/strategy/image.rs              |  14 ++
 .../nvisy-ontology/src/policy/strategy/mod.rs | 148 +++++++++-----
 .../src/policy/strategy/text.rs               |  14 ++
 crates/nvisy-ontology/src/provenance/entry.rs |   7 +-
 crates/nvisy-provider/src/http/mod.rs         |  16 +-
 34 files changed, 297 insertions(+), 297 deletions(-)

diff --git a/crates/nvisy-codec/src/document/located.rs b/crates/nvisy-codec/src/document/located.rs
index 95237a4c..8fbedcdc 100644
--- a/crates/nvisy-codec/src/document/located.rs
+++ b/crates/nvisy-codec/src/document/located.rs
@@ -39,4 +39,3 @@ impl<L> Located<L> {
         }
     }
 }
-
diff --git a/crates/nvisy-codec/src/document/mod.rs b/crates/nvisy-codec/src/document/mod.rs
index 8f5fe004..60410d52 100644
--- a/crates/nvisy-codec/src/document/mod.rs
+++ b/crates/nvisy-codec/src/document/mod.rs
@@ -17,12 +17,6 @@ use nvisy_ontology::entity::{AudioLocation, ImageLocation, TabularLocation, Text
 pub use self::located::Located;
 pub use self::span::Span;
 pub use self::stream::LocationStream;
-#[cfg(feature = "docx")]
-use crate::handler::{DocxLoader, DocxParams};
-#[cfg(feature = "html")]
-use crate::handler::{HtmlLoader, HtmlParams};
-#[cfg(feature = "pdf")]
-use crate::handler::{PdfLoader, PdfParams};
 use crate::handler::{
     AudioData, AudioHandler, BoxedAudioHandler, BoxedImageHandler, BoxedRichHandler,
     BoxedTabularHandler, BoxedTextHandler, CsvLoader, CsvParams, Handler, ImageData, ImageHandler,
@@ -30,6 +24,12 @@ use crate::handler::{
     Mp3Loader, Mp3Params, PngLoader, PngParams, TabularHandler, TextData, TextHandler, TiffLoader,
     TiffParams, TxtLoader, TxtParams, WavLoader, WavParams, XlsxLoader, XlsxParams,
 };
+#[cfg(feature = "docx")]
+use crate::handler::{DocxLoader, DocxParams};
+#[cfg(feature = "html")]
+use crate::handler::{HtmlLoader, HtmlParams};
+#[cfg(feature = "pdf")]
+use crate::handler::{PdfLoader, PdfParams};
 use crate::transform::{
     AudioRedaction, ImageRedaction, Redactions, TabularRedaction, TextRedaction,
 };
@@ -261,10 +261,7 @@ impl ContentHandle {
         Ok(Self::from(handler))
     }
 
-    async fn decode_tabular(
-        doc_type: DocumentType,
-        content: &ContentData,
-    ) -> Result<Self, Error> {
+    async fn decode_tabular(doc_type: DocumentType, content: &ContentData) -> Result<Self, Error> {
         let handler: BoxedTabularHandler = match doc_type {
             DocumentType::Spreadsheet(SpreadsheetFormat::Csv) => CsvLoader
                 .decode(content, &CsvParams::default())
diff --git a/crates/nvisy-codec/src/document/span.rs b/crates/nvisy-codec/src/document/span.rs
index 8a41d5d5..e0e749a6 100644
--- a/crates/nvisy-codec/src/document/span.rs
+++ b/crates/nvisy-codec/src/document/span.rs
@@ -55,4 +55,3 @@ impl<L, D> Span<L, D> {
         }
     }
 }
-
diff --git a/crates/nvisy-codec/src/handler/audio/mp3_handler.rs b/crates/nvisy-codec/src/handler/audio/mp3_handler.rs
index 3d932265..78006e5c 100644
--- a/crates/nvisy-codec/src/handler/audio/mp3_handler.rs
+++ b/crates/nvisy-codec/src/handler/audio/mp3_handler.rs
@@ -32,4 +32,3 @@ impl_audio_handler!(
     "mp3-handler",
     "mp3.encode"
 );
-
diff --git a/crates/nvisy-codec/src/handler/audio/wav_handler.rs b/crates/nvisy-codec/src/handler/audio/wav_handler.rs
index 20327cce..49611ca8 100644
--- a/crates/nvisy-codec/src/handler/audio/wav_handler.rs
+++ b/crates/nvisy-codec/src/handler/audio/wav_handler.rs
@@ -32,4 +32,3 @@ impl_audio_handler!(
     "wav-handler",
     "wav.encode"
 );
-
diff --git a/crates/nvisy-codec/src/handler/image/image_handler_macro.rs b/crates/nvisy-codec/src/handler/image/image_handler_macro.rs
index e21ad54e..88521d74 100644
--- a/crates/nvisy-codec/src/handler/image/image_handler_macro.rs
+++ b/crates/nvisy-codec/src/handler/image/image_handler_macro.rs
@@ -35,8 +35,7 @@ macro_rules! impl_image_handler {
         impl crate::handler::ImageHandler for $handler {
             fn locations(
                 &self,
-            ) -> crate::document::LocationStream<'_, nvisy_ontology::entity::ImageLocation>
-            {
+            ) -> crate::document::LocationStream<'_, nvisy_ontology::entity::ImageLocation> {
                 use ::std::iter;
 
                 let (w, h) = (self.image.width(), self.image.height());
diff --git a/crates/nvisy-codec/src/handler/rich/pdf_handler.rs b/crates/nvisy-codec/src/handler/rich/pdf_handler.rs
index f24439dd..61234363 100644
--- a/crates/nvisy-codec/src/handler/rich/pdf_handler.rs
+++ b/crates/nvisy-codec/src/handler/rich/pdf_handler.rs
@@ -23,9 +23,7 @@ use crate::document::{Located, LocationStream};
 use crate::handler::image::ImageData;
 use crate::handler::text::TextData;
 use crate::handler::{Handler, ImageHandler, TextHandler};
-use crate::transform::{
-    ImageRedaction, Redactions, TextRedaction, apply_text_redactions,
-};
+use crate::transform::{ImageRedaction, Redactions, TextRedaction, apply_text_redactions};
 
 const TARGET: &str = "rich-text-handler";
 
@@ -327,5 +325,4 @@ mod tests {
             "page one"
         );
     }
-
 }
diff --git a/crates/nvisy-codec/src/handler/rich/pdf_loader.rs b/crates/nvisy-codec/src/handler/rich/pdf_loader.rs
index 2a15dbd2..0f478547 100644
--- a/crates/nvisy-codec/src/handler/rich/pdf_loader.rs
+++ b/crates/nvisy-codec/src/handler/rich/pdf_loader.rs
@@ -121,5 +121,4 @@ mod tests {
         assert_eq!(doc.page_count(), 1);
         assert!(doc.page(0).unwrap().trim().is_empty());
     }
-
 }
diff --git a/crates/nvisy-codec/src/handler/tabular/csv_handler.rs b/crates/nvisy-codec/src/handler/tabular/csv_handler.rs
index 4901366d..5d916b4f 100644
--- a/crates/nvisy-codec/src/handler/tabular/csv_handler.rs
+++ b/crates/nvisy-codec/src/handler/tabular/csv_handler.rs
@@ -95,11 +95,7 @@ impl TabularHandler for CsvHandler {
                         column_index: col,
                         start_offset: None,
                         end_offset: None,
-                        column_name: self
-                            .data
-                            .headers
-                            .as_ref()
-                            .and_then(|h| h.get(col).cloned()),
+                        column_name: self.data.headers.as_ref().and_then(|h| h.get(col).cloned()),
                         sheet_name: None,
                     },
                 ));
diff --git a/crates/nvisy-codec/src/handler/tabular/csv_loader.rs b/crates/nvisy-codec/src/handler/tabular/csv_loader.rs
index ef78b1ed..7ef3d9a8 100644
--- a/crates/nvisy-codec/src/handler/tabular/csv_loader.rs
+++ b/crates/nvisy-codec/src/handler/tabular/csv_loader.rs
@@ -202,8 +202,6 @@ mod tests {
         assert!(err.to_string().contains("UTF-8"));
     }
 
-    // --- detect_delimiter unit tests ---
-
     #[test]
     fn detect_tab_delimited() {
         let text = "a\tb\tc\n1\t2\t3\n4\t5\t6\n";
diff --git a/crates/nvisy-codec/src/handler/text/html_handler.rs b/crates/nvisy-codec/src/handler/text/html_handler.rs
index c41bc976..fbd8e087 100644
--- a/crates/nvisy-codec/src/handler/text/html_handler.rs
+++ b/crates/nvisy-codec/src/handler/text/html_handler.rs
@@ -239,11 +239,8 @@ mod tests {
 
     #[tokio::test]
     async fn locations_returns_text_nodes() {
-        let h = handler_from_html(
-            "<html><head></head><body><p>Alpha</p><p>Beta</p></body></html>",
-        );
+        let h = handler_from_html("<html><head></head><body><p>Alpha</p><p>Beta</p></body></html>");
         let items: Vec<_> = h.locations().collect().await;
         assert_eq!(items.len(), 2);
     }
-
 }
diff --git a/crates/nvisy-codec/src/handler/text/json_handler.rs b/crates/nvisy-codec/src/handler/text/json_handler.rs
index c4e43771..cf36edf8 100644
--- a/crates/nvisy-codec/src/handler/text/json_handler.rs
+++ b/crates/nvisy-codec/src/handler/text/json_handler.rs
@@ -173,10 +173,7 @@ impl TextHandler for JsonHandler {
 
         for (path, new_value) in value_updates {
             let target = self.data.value.pointer_mut(&path.pointer).ok_or_else(|| {
-                Error::validation(
-                    format!("JSON pointer not found: {}", path.pointer),
-                    TARGET,
-                )
+                Error::validation(format!("JSON pointer not found: {}", path.pointer), TARGET)
             })?;
             if target.is_string() {
                 *target = serde_json::Value::String(new_value);
@@ -381,14 +378,10 @@ impl Iterator for JsonSpanIter {
 }
 
 /// Rename an object key at the given JSON pointer path.
-fn rename_key(
-    root: &mut serde_json::Value,
-    pointer: &str,
-    new_key: &str,
-) -> Result<(), Error> {
-    let (parent_ptr, old_key_segment) = pointer.rsplit_once('/').ok_or_else(|| {
-        Error::validation(format!("cannot rename root: {pointer}"), TARGET)
-    })?;
+fn rename_key(root: &mut serde_json::Value, pointer: &str, new_key: &str) -> Result<(), Error> {
+    let (parent_ptr, old_key_segment) = pointer
+        .rsplit_once('/')
+        .ok_or_else(|| Error::validation(format!("cannot rename root: {pointer}"), TARGET))?;
 
     let old_key = old_key_segment.replace("~1", "/").replace("~0", "~");
 
@@ -396,10 +389,7 @@ fn rename_key(
         root
     } else {
         root.pointer_mut(parent_ptr).ok_or_else(|| {
-            Error::validation(
-                format!("parent pointer not found: {parent_ptr}"),
-                TARGET,
-            )
+            Error::validation(format!("parent pointer not found: {parent_ptr}"), TARGET)
         })?
     };
 
@@ -456,11 +446,12 @@ mod tests {
     async fn read_returns_string() {
         let h = compact_handler(r#"{"name":"Alice"}"#);
         let items: Vec<_> = h.locations().collect().await;
-        let alice = futures::future::join_all(
-            items.iter().map(|l| h.read(&l.location)),
-        )
-        .await;
-        assert!(alice.iter().any(|d| d.as_ref().map(|d| d.as_str()) == Some("Alice")));
+        let alice = futures::future::join_all(items.iter().map(|l| h.read(&l.location))).await;
+        assert!(
+            alice
+                .iter()
+                .any(|d| d.as_ref().map(|d| d.as_str()) == Some("Alice"))
+        );
     }
 
     #[tokio::test]
diff --git a/crates/nvisy-codec/src/handler/text/txt_handler.rs b/crates/nvisy-codec/src/handler/text/txt_handler.rs
index a40c970a..71fc6c93 100644
--- a/crates/nvisy-codec/src/handler/text/txt_handler.rs
+++ b/crates/nvisy-codec/src/handler/text/txt_handler.rs
@@ -295,5 +295,4 @@ mod tests {
         assert_eq!(content.as_bytes(), b"no newline");
         Ok(())
     }
-
 }
diff --git a/crates/nvisy-codec/src/transform/mod.rs b/crates/nvisy-codec/src/transform/mod.rs
index c4f7db44..9a19111e 100644
--- a/crates/nvisy-codec/src/transform/mod.rs
+++ b/crates/nvisy-codec/src/transform/mod.rs
@@ -26,7 +26,7 @@ pub use self::image::{ImageOutput, ImageRedaction};
 pub use self::mergeable::Mergeable;
 pub use self::policy::{ConflictPolicy, InsertError};
 pub use self::redactions::Redactions;
-pub(crate) use self::tabular::apply_tabular_redactions;
 pub use self::tabular::TabularRedaction;
+pub(crate) use self::tabular::apply_tabular_redactions;
 pub(crate) use self::text::apply_text_redactions;
 pub use self::text::{TextOutput, TextRedaction};
diff --git a/crates/nvisy-codec/src/transform/tabular/apply.rs b/crates/nvisy-codec/src/transform/tabular/apply.rs
index c2ff24e0..de817bb9 100644
--- a/crates/nvisy-codec/src/transform/tabular/apply.rs
+++ b/crates/nvisy-codec/src/transform/tabular/apply.rs
@@ -49,4 +49,3 @@ pub(crate) fn apply_tabular_redactions(
 
     Ok(())
 }
-
diff --git a/crates/nvisy-engine/src/operation/envelope/document.rs b/crates/nvisy-engine/src/operation/envelope/document.rs
index fda04469..6d3d9ba4 100644
--- a/crates/nvisy-engine/src/operation/envelope/document.rs
+++ b/crates/nvisy-engine/src/operation/envelope/document.rs
@@ -181,5 +181,4 @@ impl Document {
         let handle = ContentHandle::decode(&content).await.expect("decode text");
         Self::new(handle, meta)
     }
-
 }
diff --git a/crates/nvisy-engine/src/operation/extraction/vision.rs b/crates/nvisy-engine/src/operation/extraction/vision.rs
index 8134ec33..06622757 100644
--- a/crates/nvisy-engine/src/operation/extraction/vision.rs
+++ b/crates/nvisy-engine/src/operation/extraction/vision.rs
@@ -9,7 +9,9 @@ use nvisy_codec::handler::ImageData;
 use nvisy_core::{Error, ErrorKind, Result};
 use nvisy_ontology::entity::{Entities, ImageLocation};
 use nvisy_ontology::workflow::VisualExtraction as VisualExtractionCfg;
-use nvisy_provider::agent::{ImageFormat, ImageInput, ImageOutput, OcrAgent, VerificationCandidate};
+use nvisy_provider::agent::{
+    ImageFormat, ImageInput, ImageOutput, OcrAgent, VerificationCandidate,
+};
 use nvisy_provider::http::HttpClient;
 
 use crate::operation::{DocumentEnvelope, Operation};
@@ -75,10 +77,7 @@ impl VisualExtractionOp {
     }
 
     /// Run OCR extraction on a batch of image spans.
-    async fn extract(
-        &self,
-        spans: &[Span<ImageLocation, ImageData>],
-    ) -> Result<Vec<ImageOutput>> {
+    async fn extract(&self, spans: &[Span<ImageLocation, ImageData>]) -> Result<Vec<ImageOutput>> {
         if spans.is_empty() {
             return Ok(Vec::new());
         }
diff --git a/crates/nvisy-engine/src/operation/mod.rs b/crates/nvisy-engine/src/operation/mod.rs
index 2973fd7c..1d9412d2 100644
--- a/crates/nvisy-engine/src/operation/mod.rs
+++ b/crates/nvisy-engine/src/operation/mod.rs
@@ -39,8 +39,5 @@ pub(crate) use self::validation::ValidationOp;
 /// registry, key provider) is accessible via `envelope.shared`.
 pub trait Operation {
     /// Execute the operation, mutating the envelope in place.
-    fn execute(
-        &self,
-        envelope: &mut DocumentEnvelope,
-    ) -> impl Future<Output = Result<()>> + Send;
+    fn execute(&self, envelope: &mut DocumentEnvelope) -> impl Future<Output = Result<()>> + Send;
 }
diff --git a/crates/nvisy-engine/src/operation/redaction/apply.rs b/crates/nvisy-engine/src/operation/redaction/apply.rs
index c5e694b2..06a1c898 100644
--- a/crates/nvisy-engine/src/operation/redaction/apply.rs
+++ b/crates/nvisy-engine/src/operation/redaction/apply.rs
@@ -16,7 +16,7 @@ use nvisy_core::{Error, Result};
 use nvisy_ontology::entity::{
     AudioLocation, Entity, EntityKind, ImageLocation, Location, TabularLocation, TextLocation,
 };
-use nvisy_ontology::policy::{AudioStrategy, ImageStrategy, Strategy, TextStrategy};
+use nvisy_ontology::policy::{AudioStrategy, ImageStrategy, TextStrategy};
 use sha2::{Digest, Sha256};
 use uuid::Uuid;
 
@@ -43,8 +43,12 @@ impl<'a> RedactionApplicator<'a> {
         let entity_map = entity_map(&self.envelope.audit.entities);
         let mut mapping_index = mapping_index(&self.envelope.redaction_map.entries);
 
-        let text = self.build_text_redactions(&entity_map, &mut mapping_index).await?;
-        let tabular = self.build_tabular_redactions(&entity_map, &mut mapping_index).await?;
+        let text = self
+            .build_text_redactions(&entity_map, &mut mapping_index)
+            .await?;
+        let tabular = self
+            .build_tabular_redactions(&entity_map, &mut mapping_index)
+            .await?;
         let image = self.build_image_redactions(&entity_map, &mut mapping_index)?;
         let audio = self.build_audio_redactions(&entity_map, &mut mapping_index)?;
 
@@ -82,11 +86,8 @@ impl<'a> RedactionApplicator<'a> {
             let Location::Text(ref loc) = entity.location else {
                 continue;
             };
-            let Strategy::Text(ref strategy) = record.redaction.strategy else {
-                log_modality_mismatch(entity.id, "text", &record.redaction.strategy);
-                continue;
-            };
 
+            let strategy = record.redaction.strategy.text_or_default();
             let value = self
                 .envelope
                 .document
@@ -95,7 +96,7 @@ impl<'a> RedactionApplicator<'a> {
                 .map(|d| d.into_inner())
                 .unwrap_or_default();
 
-            let output = text_output(&value, entity, strategy);
+            let output = text_output(&value, entity, &strategy);
             let entity_id = record.entity_id;
             let replacement = output.replacement_value().map(String::from);
 
@@ -138,11 +139,8 @@ impl<'a> RedactionApplicator<'a> {
             let Location::Tabular(ref loc) = entity.location else {
                 continue;
             };
-            let Strategy::Text(ref strategy) = record.redaction.strategy else {
-                log_modality_mismatch(entity.id, "tabular", &record.redaction.strategy);
-                continue;
-            };
 
+            let strategy = record.redaction.strategy.text_or_default();
             let value = self
                 .envelope
                 .document
@@ -151,7 +149,7 @@ impl<'a> RedactionApplicator<'a> {
                 .map(|d| d.into_inner())
                 .unwrap_or_default();
 
-            let output = text_output(&value, entity, strategy);
+            let output = text_output(&value, entity, &strategy);
             let entity_id = record.entity_id;
             let replacement = output.replacement_value().map(String::from);
 
@@ -198,12 +196,9 @@ impl<'a> RedactionApplicator<'a> {
             let Location::Image(ref loc) = entity.location else {
                 continue;
             };
-            let Strategy::Image(ref strategy) = record.redaction.strategy else {
-                log_modality_mismatch(entity.id, "image", &record.redaction.strategy);
-                continue;
-            };
 
-            let Some((output, placeholder)) = image_output(strategy) else {
+            let strategy = record.redaction.strategy.image_or_default();
+            let Some((output, placeholder)) = image_output(&strategy) else {
                 tracing::debug!(
                     target: TARGET,
                     entity_id = %entity.id,
@@ -248,12 +243,9 @@ impl<'a> RedactionApplicator<'a> {
             let Location::Audio(ref loc) = entity.location else {
                 continue;
             };
-            let Strategy::Audio(ref strategy) = record.redaction.strategy else {
-                log_modality_mismatch(entity.id, "audio", &record.redaction.strategy);
-                continue;
-            };
 
-            let Some((output, placeholder)) = audio_output(strategy) else {
+            let strategy = record.redaction.strategy.audio_or_default();
+            let Some((output, placeholder)) = audio_output(&strategy) else {
                 tracing::debug!(
                     target: TARGET,
                     entity_id = %entity.id,
@@ -299,7 +291,11 @@ fn entity_map(entities: &nvisy_ontology::entity::Entities) -> HashMap<Uuid, Enti
 fn mapping_index(
     mappings: &[nvisy_ontology::provenance::RedactionMapping],
 ) -> HashMap<Uuid, usize> {
-    mappings.iter().enumerate().map(|(i, m)| (m.entity_id, i)).collect()
+    mappings
+        .iter()
+        .enumerate()
+        .map(|(i, m)| (m.entity_id, i))
+        .collect()
 }
 
 /// Compute the codec [`TextOutput`] for a value + entity + strategy.
@@ -326,9 +322,7 @@ fn text_output(value: &str, entity: &Entity, strategy: &TextStrategy) -> TextOut
         }
         TextStrategy::Remove => TextOutput::Remove,
         TextStrategy::Hash => TextOutput::replace(hash_value(value)),
-        TextStrategy::Pseudonymize => {
-            TextOutput::replace(pseudonymize(&entity.entity_kind, value))
-        }
+        TextStrategy::Pseudonymize => TextOutput::replace(pseudonymize(&entity.entity_kind, value)),
         TextStrategy::Encrypt { .. } => {
             // TODO: real encryption — placeholder until the key vault is wired.
             TextOutput::replace(format!("[ENC:{}]", entity.entity_kind))
@@ -358,12 +352,16 @@ fn text_output(value: &str, entity: &Entity, strategy: &TextStrategy) -> TextOut
 /// Returns `None` when the strategy has no defined codec output.
 fn image_output(strategy: &ImageStrategy) -> Option<(ImageOutput, String)> {
     match strategy {
-        ImageStrategy::Blur { sigma } => {
-            Some((ImageOutput::Blur { sigma: *sigma }, format!("[IMAGE_BLUR:{sigma}]")))
-        }
+        ImageStrategy::Blur { sigma } => Some((
+            ImageOutput::Blur { sigma: *sigma },
+            format!("[IMAGE_BLUR:{sigma}]"),
+        )),
         ImageStrategy::Block { color } => Some((
             ImageOutput::Block { color: *color },
-            format!("[IMAGE_BLOCK:#{:02x}{:02x}{:02x}]", color.r, color.g, color.b),
+            format!(
+                "[IMAGE_BLOCK:#{:02x}{:02x}{:02x}]",
+                color.r, color.g, color.b
+            ),
         )),
         ImageStrategy::Pixelate { block_size } => Some((
             ImageOutput::Pixelate {
@@ -408,22 +406,12 @@ fn pseudonymize(entity_kind: &EntityKind, value: &str) -> String {
     format!("{entity_kind}_{id}")
 }
 
-fn log_modality_mismatch(entity_id: Uuid, location_modality: &str, strategy: &Strategy) {
-    tracing::trace!(
-        target: TARGET,
-        %entity_id,
-        location_modality,
-        strategy = ?strategy,
-        "strategy modality does not match entity location, skipping",
-    );
-}
-
 #[cfg(test)]
 mod tests {
     use nvisy_codec::ContentHandle;
     use nvisy_core::content::{Content, ContentData, ContentMetadata, ContentSource};
     use nvisy_ontology::entity::{Entities, Entity, EntityKind, Location, TabularLocation};
-    use nvisy_ontology::policy::ImageStrategy;
+    use nvisy_ontology::policy::{ImageStrategy, Strategy};
     use nvisy_ontology::provenance::{AuditEntry, RedactionMapping};
 
     use super::*;
@@ -455,11 +443,7 @@ mod tests {
         envelope_with(csv, "text/csv", entities).await
     }
 
-    async fn envelope_with(
-        body: &str,
-        content_type: &str,
-        entities: Entities,
-    ) -> DocumentEnvelope {
+    async fn envelope_with(body: &str, content_type: &str, entities: Entities) -> DocumentEnvelope {
         let data = ContentData::from_text(ContentSource::new(), body);
         let content =
             Content::with_metadata(data, ContentMetadata::new().with_content_type(content_type));
@@ -472,9 +456,14 @@ mod tests {
         envelope
     }
 
-    fn test_record(entity_id: Uuid, strategy: Strategy, original: &str) -> AuditEntry {
+    fn test_record(
+        entity_id: Uuid,
+        strategy: Strategy,
+        original: &str,
+        location: &Location,
+    ) -> AuditEntry {
         AuditEntry::builder()
-            .for_entity(entity_id, strategy, original)
+            .for_entity(entity_id, strategy, original, location)
             .build()
             .unwrap()
     }
@@ -492,10 +481,12 @@ mod tests {
     async fn mask_applies_and_records_replacement() {
         let entity = text_entity(6, 10);
         let entity_id = entity.id;
+        let location = entity.location.clone();
         let record = test_record(
             entity_id,
-            Strategy::Text(TextStrategy::Mask { mask_char: '*' }),
+            Strategy::text(TextStrategy::Mask { mask_char: '*' }),
             "John",
+            &location,
         );
 
         let entities: Entities = vec![entity].into();
@@ -517,7 +508,13 @@ mod tests {
     async fn remove_leaves_replacement_none() {
         let entity = text_entity(6, 10);
         let entity_id = entity.id;
-        let record = test_record(entity_id, Strategy::Text(TextStrategy::Remove), "John");
+        let location = entity.location.clone();
+        let record = test_record(
+            entity_id,
+            Strategy::text(TextStrategy::Remove),
+            "John",
+            &location,
+        );
 
         let entities: Entities = vec![entity].into();
         let mut envelope = test_envelope(entities).await;
@@ -532,12 +529,17 @@ mod tests {
     }
 
     #[tokio::test]
-    async fn skips_image_strategy_for_text_entity() {
+    async fn image_only_strategy_on_text_entity_uses_text_default() {
+        // A rule that only specified an image strategy now resolves to
+        // TextStrategy::default() on a text entity — no mismatch, just
+        // the fundamental default.
         let entity = text_entity(0, 4);
+        let location = entity.location.clone();
         let record = test_record(
             entity.id,
-            Strategy::Image(ImageStrategy::Blur { sigma: 15.0 }),
-            "face",
+            Strategy::image(ImageStrategy::Blur { sigma: 15.0 }),
+            "Hell",
+            &location,
         );
 
         let entities: Entities = vec![entity].into();
@@ -548,6 +550,13 @@ mod tests {
             .apply()
             .await
             .unwrap();
+
+        // TextStrategy::default() is Replace { placeholder: "" } — engine
+        // fills in [ENTITY_KIND]. PersonName from test_builder.
+        assert_eq!(
+            envelope.audit.entries[0].value.replacement.as_deref(),
+            Some("[PERSON_NAME]"),
+        );
     }
 
     #[test]
@@ -566,41 +575,40 @@ mod tests {
         assert!(a.contains('_'));
     }
 
-    // -- Tabular end-to-end tests --
-
     #[tokio::test]
     async fn tabular_full_cell_mask() {
-        // row 1, col 1 = "123-45-6789" (11 chars)
         let entity = tabular_entity(1, 1, 0, 11);
         let entity_id = entity.id;
+        let location = entity.location.clone();
         let record = test_record(
             entity_id,
-            Strategy::Text(TextStrategy::Mask { mask_char: '*' }),
+            Strategy::text(TextStrategy::Mask { mask_char: '*' }),
             "123-45-6789",
+            &location,
         );
 
         let entities: Entities = vec![entity.clone()].into();
-        let mut envelope =
-            test_envelope_csv(entities, "name,ssn\nAlice,123-45-6789\n").await;
+        let mut envelope = test_envelope_csv(entities, "name,ssn\nAlice,123-45-6789\n").await;
         envelope.audit.entries.push(record);
-        envelope
-            .redaction_map
-            .entries
-            .push(test_mapping(entity_id, entity.location.clone(), "123-45-6789"));
+        envelope.redaction_map.entries.push(test_mapping(
+            entity_id,
+            entity.location.clone(),
+            "123-45-6789",
+        ));
 
-        RedactionApplicator::new(&mut envelope).apply().await.unwrap();
+        RedactionApplicator::new(&mut envelope)
+            .apply()
+            .await
+            .unwrap();
 
-        // 11 chars -> 11 asterisks
         assert_eq!(
             envelope.audit.entries[0].value.replacement.as_deref(),
             Some("***********"),
         );
-        // Mapping was updated too.
         assert_eq!(
             envelope.redaction_map.entries[0].replacement.as_deref(),
             Some("***********"),
         );
-        // Document content was actually mutated.
         let value = envelope
             .document
             .read_tabular(entity.location.as_tabular().unwrap())
@@ -611,23 +619,26 @@ mod tests {
 
     #[tokio::test]
     async fn tabular_partial_cell_replace() {
-        // row 1, col 0 = "Alice Smith" — redact "Alice" (0..5)
         let entity = tabular_entity(1, 0, 0, 5);
         let entity_id = entity.id;
+        let location = entity.location.clone();
         let record = test_record(
             entity_id,
-            Strategy::Text(TextStrategy::Replace {
+            Strategy::text(TextStrategy::Replace {
                 placeholder: "[NAME]".to_owned(),
             }),
             "Alice",
+            &location,
         );
 
         let entities: Entities = vec![entity.clone()].into();
-        let mut envelope =
-            test_envelope_csv(entities, "name,ssn\nAlice Smith,123-45-6789\n").await;
+        let mut envelope = test_envelope_csv(entities, "name,ssn\nAlice Smith,123-45-6789\n").await;
         envelope.audit.entries.push(record);
 
-        RedactionApplicator::new(&mut envelope).apply().await.unwrap();
+        RedactionApplicator::new(&mut envelope)
+            .apply()
+            .await
+            .unwrap();
 
         let value = envelope
             .document
@@ -641,18 +652,22 @@ mod tests {
     async fn tabular_remove_leaves_empty_cell() {
         let entity = tabular_entity(1, 1, 0, 11);
         let entity_id = entity.id;
+        let location = entity.location.clone();
         let record = test_record(
             entity_id,
-            Strategy::Text(TextStrategy::Remove),
+            Strategy::text(TextStrategy::Remove),
             "123-45-6789",
+            &location,
         );
 
         let entities: Entities = vec![entity.clone()].into();
-        let mut envelope =
-            test_envelope_csv(entities, "name,ssn\nAlice,123-45-6789\n").await;
+        let mut envelope = test_envelope_csv(entities, "name,ssn\nAlice,123-45-6789\n").await;
         envelope.audit.entries.push(record);
 
-        RedactionApplicator::new(&mut envelope).apply().await.unwrap();
+        RedactionApplicator::new(&mut envelope)
+            .apply()
+            .await
+            .unwrap();
 
         let value = envelope
             .document
@@ -661,25 +676,4 @@ mod tests {
             .map(|d| d.into_inner());
         assert_eq!(value.as_deref(), Some(""));
     }
-
-    #[tokio::test]
-    async fn tabular_image_strategy_for_tabular_entity_skipped() {
-        // Mismatched modality: tabular location with image strategy.
-        // The applicator should skip it without erroring.
-        let entity = tabular_entity(1, 0, 0, 5);
-        let record = test_record(
-            entity.id,
-            Strategy::Image(ImageStrategy::Blur { sigma: 15.0 }),
-            "Alice",
-        );
-
-        let entities: Entities = vec![entity].into();
-        let mut envelope =
-            test_envelope_csv(entities, "name,ssn\nAlice,123\n").await;
-        envelope.audit.entries.push(record);
-
-        // No error, but no replacement either.
-        RedactionApplicator::new(&mut envelope).apply().await.unwrap();
-        assert!(envelope.audit.entries[0].value.replacement.is_none());
-    }
 }
diff --git a/crates/nvisy-engine/src/operation/redaction/evaluate.rs b/crates/nvisy-engine/src/operation/redaction/evaluate.rs
index 00d1b5c8..6d491e33 100644
--- a/crates/nvisy-engine/src/operation/redaction/evaluate.rs
+++ b/crates/nvisy-engine/src/operation/redaction/evaluate.rs
@@ -10,7 +10,7 @@
 use nvisy_core::Result;
 use nvisy_core::content::ContentMetadata;
 use nvisy_ontology::entity::{Entities, Entity};
-use nvisy_ontology::policy::{Action, Condition, DefaultStrategy, StrategyPolicy};
+use nvisy_ontology::policy::{Action, Condition, Strategy, StrategyPolicy};
 use nvisy_ontology::provenance::{AuditEntry, RedactionMapping};
 use nvisy_ontology::workflow::Redaction;
 use uuid::Uuid;
@@ -73,10 +73,16 @@ impl Operation for RedactionOp {
 
 /// Evaluate strategy policies against entities, producing audit entries
 /// and redaction mappings.
+///
+/// Each entity either matches a rule (in which case the rule's
+/// [`Strategy`] is merged with `defaults` before storage) or falls
+/// back to `defaults` outright once it clears the confidence
+/// threshold. Every entry stores a complete `Strategy`; at apply time
+/// the per-modality method is resolved via [`Strategy::for_location`].
 async fn evaluate(
     entities: &Entities,
     strategies: &[(Uuid, &StrategyPolicy)],
-    defaults: &DefaultStrategy,
+    defaults: &Strategy,
     default_threshold: f64,
     document_labels: &[&str],
     metadata: &ContentMetadata,
@@ -88,15 +94,15 @@ async fn evaluate(
     for entity in entities {
         let matched = find_matching_strategy(strategies, entity, document_labels, metadata);
 
-        let (spec, policy_id) = match matched {
-            Some((policy_id, strategy)) => match &strategy.action {
+        let (mut strategy, policy_id) = match matched {
+            Some((policy_id, rule)) => match &rule.action {
                 Action::Redact { strategy } => (strategy.clone(), Some(policy_id)),
                 _ => {
                     tracing::debug!(
                         target: TARGET,
                         entity_id = %entity.id,
                         %policy_id,
-                        action = ?strategy.action,
+                        action = ?rule.action,
                         "non-redact policy action",
                     );
                     continue;
@@ -106,20 +112,28 @@ async fn evaluate(
                 if entity.confidence < default_threshold {
                     continue;
                 }
-                let Some(spec) = defaults.for_location(&entity.location) else {
-                    continue;
-                };
-                (spec, None)
+                (Strategy::default(), None)
             }
         };
 
+        // Fold defaults under the rule-level strategy: rule fields win,
+        // unset fields fall back to the policy-set defaults, and any
+        // still-unset modalities resolve to their per-modality Default
+        // when the applicator calls Strategy::for_location.
+        strategy.merge(defaults);
+
         let entity_id = entity.id;
         let original_value = document
             .value_at(&entity.location)
             .await
             .unwrap_or_else(|| format!("[{}]", entity.location));
 
-        let mut builder = AuditEntry::builder().for_entity(entity_id, spec, original_value.clone());
+        let mut builder = AuditEntry::builder().for_entity(
+            entity_id,
+            strategy,
+            original_value.clone(),
+            &entity.location,
+        );
         if let Some(id) = policy_id {
             builder = builder.with_policy_id(id);
         }
@@ -205,7 +219,7 @@ impl ConditionExt for Condition {
 #[cfg(test)]
 mod tests {
     use nvisy_ontology::entity::Entity;
-    use nvisy_ontology::policy::{Strategy, TextStrategy};
+    use nvisy_ontology::policy::TextStrategy;
 
     use super::*;
     use crate::operation::Document;
@@ -216,11 +230,8 @@ mod tests {
             .test_build()
     }
 
-    fn defaults() -> DefaultStrategy {
-        DefaultStrategy {
-            text: Some(TextStrategy::Mask { mask_char: '*' }),
-            ..Default::default()
-        }
+    fn defaults() -> Strategy {
+        Strategy::text(TextStrategy::Mask { mask_char: '*' })
     }
 
     #[tokio::test]
@@ -261,10 +272,7 @@ mod tests {
     #[tokio::test]
     async fn uses_default_strategy_when_no_rules() {
         let doc = Document::from_text("secret").await;
-        let defaults = DefaultStrategy {
-            text: Some(TextStrategy::Remove),
-            ..Default::default()
-        };
+        let defaults = Strategy::text(TextStrategy::Remove);
         let entities: Entities = vec![test_entity("secret", 0.9)].into();
         let (entries, _mappings) = evaluate(
             &entities,
@@ -277,32 +285,11 @@ mod tests {
         )
         .await;
         assert_eq!(
-            entries[0].redaction.strategy,
-            Strategy::Text(TextStrategy::Remove)
+            entries[0].redaction.strategy.text.as_ref(),
+            Some(&TextStrategy::Remove),
         );
     }
 
-    #[tokio::test]
-    async fn skips_entity_without_matching_modality_default() {
-        let doc = Document::from_text("text-entity").await;
-        let defaults = DefaultStrategy {
-            image: Some(nvisy_ontology::policy::ImageStrategy::Blur { sigma: 15.0 }),
-            ..Default::default()
-        };
-        let entities: Entities = vec![test_entity("text-entity", 0.9)].into();
-        let (entries, _mappings) = evaluate(
-            &entities,
-            &[],
-            &defaults,
-            0.0,
-            &[],
-            &ContentMetadata::new(),
-            &doc,
-        )
-        .await;
-        assert!(entries.is_empty());
-    }
-
     #[tokio::test]
     async fn captures_original_value() {
         let doc = Document::from_text("secret-value").await;
diff --git a/crates/nvisy-engine/src/pipeline/default.rs b/crates/nvisy-engine/src/pipeline/default.rs
index edacf38e..b48801cc 100644
--- a/crates/nvisy-engine/src/pipeline/default.rs
+++ b/crates/nvisy-engine/src/pipeline/default.rs
@@ -192,10 +192,6 @@ impl Engine {
         self.inner.registry.base_dir()
     }
 
-    // ------------------------------------------------------------------
-    // Pipeline execution
-    // ------------------------------------------------------------------
-
     /// Create a new [`Pipeline`] bound to this engine's shared state.
     fn pipeline(&self) -> Pipeline {
         Pipeline::new(
@@ -260,10 +256,6 @@ impl Engine {
         Ok(run_id)
     }
 
-    // ------------------------------------------------------------------
-    // Run management
-    // ------------------------------------------------------------------
-
     /// Get a full [`RunSnapshot`] including per-node status for a single run.
     ///
     /// For completed runs (`Succeeded`/`PartialFailure`), audit trails are
diff --git a/crates/nvisy-ontology/src/artifacts/audio.rs b/crates/nvisy-ontology/src/artifacts/audio.rs
index 886b8779..9a0f4f06 100644
--- a/crates/nvisy-ontology/src/artifacts/audio.rs
+++ b/crates/nvisy-ontology/src/artifacts/audio.rs
@@ -121,5 +121,4 @@ mod tests {
         };
         assert!(t.time_span().is_none());
     }
-
 }
diff --git a/crates/nvisy-ontology/src/context/mod.rs b/crates/nvisy-ontology/src/context/mod.rs
index 1a378a6a..b5a3151a 100644
--- a/crates/nvisy-ontology/src/context/mod.rs
+++ b/crates/nvisy-ontology/src/context/mod.rs
@@ -53,7 +53,6 @@ mod tests {
         ctx.push(id);
         assert_eq!(ctx.len(), 1);
     }
-
 }
 
 /// A persistent, reusable collection of reference data for detection.
diff --git a/crates/nvisy-ontology/src/context/reference/credential.rs b/crates/nvisy-ontology/src/context/reference/credential.rs
index 9127d59b..eb4c63b9 100644
--- a/crates/nvisy-ontology/src/context/reference/credential.rs
+++ b/crates/nvisy-ontology/src/context/reference/credential.rs
@@ -74,5 +74,4 @@ mod tests {
         let back: CredentialData = serde_json::from_str(&json).unwrap();
         assert_eq!(back.value, "");
     }
-
 }
diff --git a/crates/nvisy-ontology/src/entity/annotation.rs b/crates/nvisy-ontology/src/entity/annotation.rs
index eef867a4..33c27079 100644
--- a/crates/nvisy-ontology/src/entity/annotation.rs
+++ b/crates/nvisy-ontology/src/entity/annotation.rs
@@ -321,5 +321,4 @@ mod tests {
         let labels = annotations.document_labels();
         assert_eq!(labels, vec!["medical", "gdpr"]);
     }
-
 }
diff --git a/crates/nvisy-ontology/src/entity/kind.rs b/crates/nvisy-ontology/src/entity/kind.rs
index 55eab964..49d6b4fe 100644
--- a/crates/nvisy-ontology/src/entity/kind.rs
+++ b/crates/nvisy-ontology/src/entity/kind.rs
@@ -472,5 +472,4 @@ mod tests {
             EntitySensitivity::Low
         );
     }
-
 }
diff --git a/crates/nvisy-ontology/src/entity/location/text.rs b/crates/nvisy-ontology/src/entity/location/text.rs
index 3ab8d83d..609b1f2d 100644
--- a/crates/nvisy-ontology/src/entity/location/text.rs
+++ b/crates/nvisy-ontology/src/entity/location/text.rs
@@ -99,5 +99,4 @@ mod tests {
     fn no_overlap_disjoint() {
         assert!(!loc(0, 5).overlaps(&loc(10, 15)));
     }
-
 }
diff --git a/crates/nvisy-ontology/src/policy/mod.rs b/crates/nvisy-ontology/src/policy/mod.rs
index 85462cd4..33e2bc3c 100644
--- a/crates/nvisy-ontology/src/policy/mod.rs
+++ b/crates/nvisy-ontology/src/policy/mod.rs
@@ -20,7 +20,7 @@ pub use self::condition::Condition;
 pub use self::retention::{Retention, RetentionPolicy, RetentionScope};
 pub use self::selector::EntitySelector;
 pub use self::strategy::{
-    Action, AudioStrategy, DefaultStrategy, ImageStrategy, Strategy, StrategyPolicy, TextStrategy,
+    Action, AudioStrategy, ImageStrategy, Strategy, StrategyPolicy, TextStrategy,
 };
 
 /// A named, versioned governance policy.
@@ -45,9 +45,14 @@ pub struct Policy {
     #[serde(skip_serializing_if = "Option::is_none")]
     pub description: Option<String>,
     /// Per-modality fallback strategies for unmatched entities.
+    ///
+    /// Combined into a single effective default across all policies in
+    /// the run via [`Policies::default_strategy`]; the applicator then
+    /// merges any rule-level [`Strategy`] with this default so every
+    /// modality always resolves to a method.
     #[builder(default, setter(into = false))]
-    #[serde(default, skip_serializing_if = "DefaultStrategy::is_empty")]
-    pub default_strategy: DefaultStrategy,
+    #[serde(default, skip_serializing_if = "Strategy::is_empty")]
+    pub default_strategy: Strategy,
     /// Entity redaction strategies.
     #[builder(default)]
     #[serde(default, skip_serializing_if = "Vec::is_empty")]
@@ -103,8 +108,8 @@ impl Policies {
     /// Earlier policies take precedence per-modality: if policy A sets
     /// a text default and policy B sets text + image defaults, the result
     /// uses A's text and B's image.
-    pub fn default_strategy(&self) -> DefaultStrategy {
-        let mut merged = DefaultStrategy::default();
+    pub fn default_strategy(&self) -> Strategy {
+        let mut merged = Strategy::default();
         for policy in &self.policies {
             merged.merge(&policy.default_strategy);
         }
diff --git a/crates/nvisy-ontology/src/policy/strategy/audio.rs b/crates/nvisy-ontology/src/policy/strategy/audio.rs
index 3adeee1c..53bb0cf6 100644
--- a/crates/nvisy-ontology/src/policy/strategy/audio.rs
+++ b/crates/nvisy-ontology/src/policy/strategy/audio.rs
@@ -4,12 +4,18 @@ use schemars::JsonSchema;
 use serde::{Deserialize, Serialize};
 
 /// Audio redaction strategy.
-#[derive(Debug, Clone, PartialEq)]
+///
+/// The [`Default`] impl returns [`Silence`] — preserves duration while
+/// removing the audible content.
+///
+/// [`Silence`]: AudioStrategy::Silence
+#[derive(Debug, Clone, Default, PartialEq)]
 #[derive(Serialize, Deserialize, JsonSchema)]
 #[serde(tag = "method", rename_all = "snake_case")]
 #[non_exhaustive]
 pub enum AudioStrategy {
     /// Replace with silence.
+    #[default]
     Silence,
     /// Remove the segment entirely.
     Remove,
diff --git a/crates/nvisy-ontology/src/policy/strategy/image.rs b/crates/nvisy-ontology/src/policy/strategy/image.rs
index 4ec26745..e315fe46 100644
--- a/crates/nvisy-ontology/src/policy/strategy/image.rs
+++ b/crates/nvisy-ontology/src/policy/strategy/image.rs
@@ -16,6 +16,12 @@ fn default_block_size() -> u32 {
 }
 
 /// Image redaction strategy with method-specific configuration.
+///
+/// The [`Default`] impl returns an opaque [`Block`] in [`Color::default`]
+/// (black) — the most-destructive option short of removing the region.
+///
+/// [`Block`]: ImageStrategy::Block
+/// [`Color::default`]: crate::primitive::Color::default
 #[derive(Debug, Clone, PartialEq)]
 #[derive(Serialize, Deserialize, JsonSchema)]
 #[serde(tag = "method", rename_all = "snake_case")]
@@ -40,3 +46,11 @@ pub enum ImageStrategy {
         block_size: u32,
     },
 }
+
+impl Default for ImageStrategy {
+    fn default() -> Self {
+        Self::Block {
+            color: Color::default(),
+        }
+    }
+}
diff --git a/crates/nvisy-ontology/src/policy/strategy/mod.rs b/crates/nvisy-ontology/src/policy/strategy/mod.rs
index 96b64a2e..767041df 100644
--- a/crates/nvisy-ontology/src/policy/strategy/mod.rs
+++ b/crates/nvisy-ontology/src/policy/strategy/mod.rs
@@ -2,14 +2,21 @@
 //!
 //! Each per-modality strategy ([`TextStrategy`], [`ImageStrategy`],
 //! [`AudioStrategy`]) pairs a redaction method with its configuration
-//! parameters. [`Strategy`] unifies them under a single tagged enum for
-//! policy rules and pipeline decisions.
+//! parameters. [`Strategy`] composes them: it carries an optional
+//! per-modality strategy for each of text/image/audio, falling back to
+//! that modality's [`Default`] when unset.
+//!
+//! A single [`Strategy`] value can be used both as a per-rule directive
+//! ("when this rule matches, use these methods") and as a per-policy
+//! default ("for any modality not specified by a matching rule, use
+//! these methods"). The applicator looks up the appropriate modality
+//! at runtime and never needs to dispatch on a strategy-vs-location
+//! modality mismatch — every modality always resolves to something.
 
 mod audio;
 mod image;
 mod text;
 
-use derive_more::From;
 use schemars::JsonSchema;
 use serde::{Deserialize, Serialize};
 
@@ -20,68 +27,73 @@ use super::condition::Condition;
 use super::selector::EntitySelector;
 use crate::entity::Location;
 
-/// Unified redaction strategy across all modalities.
+/// A composed redaction strategy across all modalities.
 ///
-/// Wraps a per-modality strategy variant carrying the method and its
-/// configuration parameters.
-#[derive(Debug, Clone, PartialEq)]
-#[derive(From, Serialize, Deserialize, JsonSchema)]
-#[serde(rename_all = "snake_case")]
-#[non_exhaustive]
-pub enum Strategy {
-    /// Text/tabular redaction strategy.
-    Text(TextStrategy),
-    /// Image redaction strategy.
-    Image(ImageStrategy),
-    /// Audio redaction strategy.
-    Audio(AudioStrategy),
-}
-
-impl Strategy {
-    /// Whether the redaction is reversible (the original value can be
-    /// recovered from the redacted output).
-    ///
-    /// Only [`TextStrategy::Encrypt`] and [`TextStrategy::Tokenize`]
-    /// are reversible: Encrypt uses key-based decryption, Tokenize
-    /// uses vault-based detokenization. All other strategies are
-    /// destructive.
-    pub fn is_reversible(&self) -> bool {
-        matches!(
-            self,
-            Self::Text(TextStrategy::Encrypt { .. } | TextStrategy::Tokenize { .. })
-        )
-    }
-}
-
-/// Per-modality fallback strategies for entities that match no explicit rule.
+/// Each field is optional: an unset field means "use the modality's
+/// own [`Default`]" when the strategy is applied. The per-modality
+/// accessors ([`text_or_default`], [`image_or_default`],
+/// [`audio_or_default`]) resolve to a concrete strategy without ever
+/// failing.
 ///
-/// Each field is optional: `None` means no default for that modality
-/// (unmatched entities in that modality are left unredacted). When
-/// multiple policies are combined, earlier policies take precedence
-/// per-modality via [`DefaultStrategy::merge`].
-#[derive(Debug, Clone, Default, Serialize, Deserialize, JsonSchema)]
+/// [`text_or_default`]: Strategy::text_or_default
+/// [`image_or_default`]: Strategy::image_or_default
+/// [`audio_or_default`]: Strategy::audio_or_default
+#[derive(Debug, Clone, Default, PartialEq)]
+#[derive(Serialize, Deserialize, JsonSchema)]
 #[serde(rename_all = "camelCase")]
-pub struct DefaultStrategy {
-    /// Fallback strategy for text entities.
+pub struct Strategy {
+    /// Override for text entities (and the text view of tabular entities).
     #[serde(default, skip_serializing_if = "Option::is_none")]
     pub text: Option<TextStrategy>,
-    /// Fallback strategy for image entities.
+    /// Override for image entities.
     #[serde(default, skip_serializing_if = "Option::is_none")]
     pub image: Option<ImageStrategy>,
-    /// Fallback strategy for audio entities.
+    /// Override for audio entities.
     #[serde(default, skip_serializing_if = "Option::is_none")]
     pub audio: Option<AudioStrategy>,
 }
 
-impl DefaultStrategy {
-    /// Returns `true` if no default strategy is set for any modality.
+impl Strategy {
+    /// Construct from a single text strategy.
+    pub fn text(strategy: TextStrategy) -> Self {
+        Self {
+            text: Some(strategy),
+            ..Self::default()
+        }
+    }
+
+    /// Construct from a single image strategy.
+    pub fn image(strategy: ImageStrategy) -> Self {
+        Self {
+            image: Some(strategy),
+            ..Self::default()
+        }
+    }
+
+    /// Construct from a single audio strategy.
+    pub fn audio(strategy: AudioStrategy) -> Self {
+        Self {
+            audio: Some(strategy),
+            ..Self::default()
+        }
+    }
+
+    /// `true` if no per-modality strategy is set.
+    ///
+    /// An empty strategy is valid at apply time (every modality falls
+    /// back to its default) but a rule with [`Action::Redact`] and an
+    /// empty strategy is a configuration smell — the validator emits
+    /// a warning.
     pub fn is_empty(&self) -> bool {
         self.text.is_none() && self.image.is_none() && self.audio.is_none()
     }
 
-    /// Merge `other` into `self`, filling in gaps without overriding
-    /// already-set modalities. Earlier policies take precedence.
-    pub fn merge(&mut self, other: &DefaultStrategy) {
+    /// Merge `other` into `self`, filling in modality slots that
+    /// `self` does not already set.
+    ///
+    /// Self's values take precedence per-modality. Used to compose a
+    /// rule-level strategy with the policy-level default strategy.
+    pub fn merge(&mut self, other: &Strategy) {
         if self.text.is_none() {
             self.text = other.text.clone();
         }
@@ -93,12 +105,38 @@ impl DefaultStrategy {
         }
     }
 
-    /// Look up the default strategy for a given entity location.
-    pub fn for_location(&self, location: &Location) -> Option<Strategy> {
+    /// Concrete [`TextStrategy`] to apply, falling back to
+    /// [`TextStrategy::default`] when no override is set.
+    pub fn text_or_default(&self) -> TextStrategy {
+        self.text.clone().unwrap_or_default()
+    }
+
+    /// Concrete [`ImageStrategy`] to apply, falling back to
+    /// [`ImageStrategy::default`] when no override is set.
+    pub fn image_or_default(&self) -> ImageStrategy {
+        self.image.clone().unwrap_or_default()
+    }
+
+    /// Concrete [`AudioStrategy`] to apply, falling back to
+    /// [`AudioStrategy::default`] when no override is set.
+    pub fn audio_or_default(&self) -> AudioStrategy {
+        self.audio.clone().unwrap_or_default()
+    }
+
+    /// Whether the redaction at `location` is reversible (the original
+    /// value can be recovered from the redacted output).
+    ///
+    /// Only [`TextStrategy::Encrypt`] and [`TextStrategy::Tokenize`]
+    /// are reversible: Encrypt uses key-based decryption, Tokenize
+    /// uses vault-based detokenization. All other strategies are
+    /// destructive.
+    pub fn is_reversible_for(&self, location: &Location) -> bool {
         match location {
-            Location::Text(_) | Location::Tabular(_) => self.text.clone().map(Strategy::Text),
-            Location::Image(_) => self.image.clone().map(Strategy::Image),
-            Location::Audio(_) => self.audio.clone().map(Strategy::Audio),
+            Location::Text(_) | Location::Tabular(_) => matches!(
+                self.text_or_default(),
+                TextStrategy::Encrypt { .. } | TextStrategy::Tokenize { .. },
+            ),
+            Location::Image(_) | Location::Audio(_) => false,
         }
     }
 }
diff --git a/crates/nvisy-ontology/src/policy/strategy/text.rs b/crates/nvisy-ontology/src/policy/strategy/text.rs
index b86f7662..20ca0f16 100644
--- a/crates/nvisy-ontology/src/policy/strategy/text.rs
+++ b/crates/nvisy-ontology/src/policy/strategy/text.rs
@@ -10,6 +10,12 @@ fn default_mask_char() -> char {
 }
 
 /// Text redaction strategy with method-specific configuration.
+///
+/// The [`Default`] impl returns [`Replace`] with an empty placeholder;
+/// the engine fills in `[ENTITY_KIND]` when the placeholder is empty,
+/// producing a neutral marker so users see something was redacted.
+///
+/// [`Replace`]: TextStrategy::Replace
 #[derive(Debug, Clone, PartialEq)]
 #[derive(Serialize, Deserialize, JsonSchema)]
 #[serde(tag = "method", rename_all = "snake_case")]
@@ -45,3 +51,11 @@ pub enum TextStrategy {
         vault_id: Option<String>,
     },
 }
+
+impl Default for TextStrategy {
+    fn default() -> Self {
+        Self::Replace {
+            placeholder: String::new(),
+        }
+    }
+}
diff --git a/crates/nvisy-ontology/src/provenance/entry.rs b/crates/nvisy-ontology/src/provenance/entry.rs
index 4a48f525..2355f057 100644
--- a/crates/nvisy-ontology/src/provenance/entry.rs
+++ b/crates/nvisy-ontology/src/provenance/entry.rs
@@ -8,6 +8,7 @@ use strum::{Display, EnumString};
 use uuid::Uuid;
 
 use super::review::ReviewDecision;
+use crate::entity::Location;
 use crate::policy::Strategy;
 
 /// Outcome status of a redaction operation.
@@ -113,14 +114,16 @@ impl AuditEntry {
 impl AuditEntryBuilder {
     /// Set the entity ID, strategy, and original value in one call.
     ///
-    /// `reversible` is derived from the strategy.
+    /// `reversible` is derived from the strategy resolved against
+    /// `location`'s modality.
     pub fn for_entity(
         self,
         entity_id: Uuid,
         strategy: Strategy,
         original: impl Into<String>,
+        location: &Location,
     ) -> Self {
-        let reversible = strategy.is_reversible();
+        let reversible = strategy.is_reversible_for(location);
         self.with_entity_id(entity_id)
             .with_redaction(RedactionSpec {
                 strategy,
diff --git a/crates/nvisy-provider/src/http/mod.rs b/crates/nvisy-provider/src/http/mod.rs
index 1d68656a..0462ce19 100644
--- a/crates/nvisy-provider/src/http/mod.rs
+++ b/crates/nvisy-provider/src/http/mod.rs
@@ -48,11 +48,7 @@ impl HttpClient {
             .pool_idle_timeout(Duration::from_secs(config.idle_timeout_secs))
             .build()
             .map_err(|e| {
-                Error::runtime(
-                    format!("failed to build HTTP client: {e}"),
-                    "http",
-                    false,
-                )
+                Error::runtime(format!("failed to build HTTP client: {e}"), "http", false)
             })?;
 
         Ok(Self(
@@ -98,10 +94,7 @@ pub trait RequestBuilderExt {
 }
 
 impl RequestBuilderExt for RequestBuilder {
-    async fn send_and_check(
-        self,
-        provider: &str,
-    ) -> Result<reqwest_middleware::reqwest::Response> {
+    async fn send_and_check(self, provider: &str) -> Result<reqwest_middleware::reqwest::Response> {
         let resp = self
             .send()
             .await
@@ -119,10 +112,7 @@ impl RequestBuilderExt for RequestBuilder {
         ))
     }
 
-    async fn send_and_parse<T: serde::de::DeserializeOwned>(
-        self,
-        provider: &str,
-    ) -> Result<T> {
+    async fn send_and_parse<T: serde::de::DeserializeOwned>(self, provider: &str) -> Result<T> {
         let resp = self.send_and_check(provider).await?;
         resp.json().await.map_err(|e| {
             Error::runtime(format!("{provider} JSON parse error: {e}"), provider, false)