docs: add comprehensive doc comments to all Rust source files

Document every public function, struct, field, constant, and non-trivial private function across idfoto-core and idfoto-cli. Module-level docs explain each module's role in the architecture. Comments explain the "why" (crypto choices, algorithm design, data model rationale) not just the "what". Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
2026-04-12 09:01:48 -04:00
parent 0d374f3faf
commit 847051216d
7 changed files with 823 additions and 38 deletions
--- a/crates/idfoto-core/src/crypto.rs
+++ b/crates/idfoto-core/src/crypto.rs
@@ -1,3 +1,48 @@
+//! Argon2id key derivation and XChaCha20-Poly1305 authenticated encryption.
+//!
+//! This module implements the low-level "encrypt bytes / decrypt bytes" layer.
+//! Higher-level typed wrappers (encrypt_entry, encrypt_manifest) live in [`crate::vault`].
+//!
+//! ## Why XChaCha20-Poly1305 over AES-GCM
+//!
+//! - **192-bit nonce** (vs. 96-bit for AES-GCM): eliminates nonce collision risk
+//!   even with random nonces across billions of encryptions. With AES-GCM's 96-bit
+//!   nonce, birthday-bound collisions become probable around 2^48 messages under
+//!   the same key -- a real concern for a long-lived vault.
+//! - **Fast on WASM and ARM without AES-NI**: ChaCha20 is a pure arithmetic cipher
+//!   (add/rotate/XOR) with no dependency on hardware AES acceleration. AES-GCM is
+//!   fast *only* with AES-NI; without it, software AES is both slow and vulnerable
+//!   to cache-timing side channels.
+//!
+//! ## Binary ciphertext format
+//!
+//! Every encrypted blob produced by [`encrypt`] has this layout:
+//!
+//! ```text
+//! [version: 1 byte] [nonce: 24 bytes] [ciphertext + Poly1305 tag: variable]
+//! ```
+//!
+//! - **Version byte** (`0x01`): allows future format changes without ambiguity.
+//!   Decryption rejects any version it does not recognize.
+//! - **Nonce** (24 bytes): randomly generated per encryption via [`OsRng`].
+//!   Stored alongside the ciphertext so the decryptor does not need out-of-band
+//!   nonce management.
+//! - **Ciphertext + tag**: the AEAD output. The Poly1305 tag (16 bytes) is
+//!   appended by the cipher implementation; we do not separate it.
+//!
+//! ## KDF pipeline
+//!
+//! [`derive_master_key`] concatenates the passphrase and image_secret as a single
+//! password input to Argon2id:
+//!
+//! ```text
+//! password = passphrase_bytes || image_secret (32 bytes)
+//! master_key = Argon2id(password, salt, params) -> 32 bytes
+//! ```
+//!
+//! Both factors contribute to the derived key -- compromising one without the
+//! other is insufficient. The salt is vault-specific and stored in `.idfoto/salt`.
+
 use argon2::{Algorithm, Argon2, Params, Version};
 use chacha20poly1305::{
    aead::{Aead, KeyInit},
@@ -8,14 +53,35 @@ use serde::{Deserialize, Serialize};

 use crate::error::{IdfotoError, Result};

+/// Current binary format version. Increment this if the ciphertext layout changes.
 const VERSION_BYTE: u8 = 0x01;
+
+/// XChaCha20-Poly1305 nonce length: 192 bits = 24 bytes.
 const NONCE_LEN: usize = 24;
+
+/// Poly1305 authentication tag length: 128 bits = 16 bytes.
+/// Used only for minimum-length validation during decryption.
 const TAG_LEN: usize = 16;
+
+/// Total header size: version byte + nonce. The ciphertext (including tag)
+/// follows immediately after the header.
 const HEADER_LEN: usize = 1 + NONCE_LEN; // version + nonce

+/// Encrypt arbitrary plaintext bytes under a 256-bit key using XChaCha20-Poly1305.
+///
+/// Returns the binary blob in the format: `version(1) || nonce(24) || ciphertext+tag`.
+/// A fresh random nonce is generated for each call via the OS CSPRNG.
+///
+/// # Errors
+///
+/// Returns [`IdfotoError::Encrypt`] if the underlying AEAD operation fails
+/// (extremely unlikely in practice).
 pub fn encrypt(key: &[u8; 32], plaintext: &[u8]) -> Result<Vec<u8>> {
    let cipher = XChaCha20Poly1305::new(key.into());

+    // Generate a fresh random 24-byte nonce for every encryption.
+    // With 192 bits of randomness, nonce reuse probability is negligible
+    // even across billions of encryptions under the same key.
    let mut nonce_bytes = [0u8; NONCE_LEN];
    OsRng.fill_bytes(&mut nonce_bytes);
    let nonce = XNonce::from(nonce_bytes);
@@ -33,7 +99,22 @@ pub fn encrypt(key: &[u8; 32], plaintext: &[u8]) -> Result<Vec<u8>> {
    Ok(output)
 }

+/// Decrypt a blob produced by [`encrypt`], returning the original plaintext.
+///
+/// Validates the version byte and minimum blob length before attempting
+/// authenticated decryption. If the key is wrong or the data has been
+/// tampered with, the Poly1305 tag verification fails and [`IdfotoError::Decrypt`]
+/// is returned -- with no information about which bytes were wrong (preventing
+/// padding oracle / chosen-ciphertext attacks).
+///
+/// # Errors
+///
+/// - [`IdfotoError::Format`] if the data is too short or has an unknown version byte.
+/// - [`IdfotoError::Decrypt`] if the AEAD tag verification fails (wrong key or
+///   tampered data).
 pub fn decrypt(key: &[u8; 32], data: &[u8]) -> Result<Vec<u8>> {
+    // Minimum valid blob: 1 (version) + 24 (nonce) + 16 (tag) = 41 bytes.
+    // A zero-length plaintext produces exactly 41 bytes of output.
    if data.len() < HEADER_LEN + TAG_LEN {
        return Err(IdfotoError::Format(
            "data too short to be valid ciphertext".into(),
@@ -59,13 +140,36 @@ pub fn decrypt(key: &[u8; 32], data: &[u8]) -> Result<Vec<u8>> {
    Ok(plaintext)
 }

+/// Tunable parameters for the Argon2id key derivation function.
+///
+/// These are stored in the vault's `.idfoto/params.json` so that every client
+/// derives the same master key from the same inputs. Making them configurable
+/// lets tests use fast params (m=256, t=1, p=1) while production uses strong
+/// params (m=64MiB, t=3, p=4).
+///
+/// The parameters follow Argon2id naming conventions:
+/// - `argon2_m`: memory cost in KiB
+/// - `argon2_t`: time cost (number of iterations)
+/// - `argon2_p`: parallelism degree (number of lanes)
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct KdfParams {
+    /// Memory cost in KiB. Default is 65536 (64 MiB), which makes GPU/ASIC
+    /// brute-force attacks expensive. Tests use 256 KiB for speed.
    pub argon2_m: u32,
+    /// Time cost (iteration count). Default is 3. Higher values increase CPU
+    /// time linearly. Combined with high memory cost, this makes each key
+    /// derivation take ~1 second on modern hardware.
    pub argon2_t: u32,
+    /// Parallelism degree. Default is 4. Sets the number of independent lanes
+    /// in the Argon2id memory-hard computation.
    pub argon2_p: u32,
 }

+/// Production-strength default parameters: 64 MiB memory, 3 iterations, 4 lanes.
+///
+/// These are calibrated to take roughly 0.5-1 second on a modern desktop CPU,
+/// making brute-force attacks impractical while keeping interactive unlock fast
+/// enough for daily use.
 impl Default for KdfParams {
    fn default() -> Self {
        Self {
@@ -76,6 +180,28 @@ impl Default for KdfParams {
    }
 }

+/// Derive a 256-bit master key from the user's passphrase and reference image secret.
+///
+/// The two factors (passphrase + image_secret) are concatenated into a single
+/// password input to Argon2id. This means both factors contribute entropy to
+/// the derived key -- compromising one factor alone is insufficient.
+///
+/// # Arguments
+///
+/// - `passphrase`: the user's passphrase as raw UTF-8 bytes.
+/// - `image_secret`: the 32-byte secret extracted from the reference JPEG via
+///   [`crate::imgsecret::extract`].
+/// - `salt`: a 32-byte vault-specific salt (stored in `.idfoto/salt`).
+/// - `params`: the Argon2id tuning parameters (stored in `.idfoto/params.json`).
+///
+/// # Returns
+///
+/// A 32-byte master key suitable for use with [`encrypt`] and [`decrypt`].
+///
+/// # Errors
+///
+/// Returns [`IdfotoError::Kdf`] if the Argon2id parameters are invalid (e.g.,
+/// memory cost below the library's minimum).
 pub fn derive_master_key(
    passphrase: &[u8],
    image_secret: &[u8; 32],
@@ -92,7 +218,10 @@ pub fn derive_master_key(

    let argon2 = Argon2::new(Algorithm::Argon2id, Version::V0x13, argon2_params);

-    // Concatenate passphrase + image_secret as the password input
+    // Concatenate passphrase + image_secret as the password input.
+    // This ensures both factors contribute to the derived key: knowing only
+    // the passphrase (without the reference image) or only the image secret
+    // (without the passphrase) is insufficient to derive the correct master key.
    let mut password = Vec::with_capacity(passphrase.len() + 32);
    password.extend_from_slice(passphrase);
    password.extend_from_slice(image_secret);
--- a/crates/idfoto-core/src/entry.rs
+++ b/crates/idfoto-core/src/entry.rs
@@ -1,8 +1,48 @@
+//! Vault data model: entries, manifest entries, and the manifest index.
+//!
+//! The vault stores credentials in two tiers:
+//!
+//! 1. **Individual entries** (`entries/<id>.enc`): each file contains a single
+//!    [`Entry`] encrypted with the master key. Only decrypted when the user
+//!    needs to read or edit a specific credential.
+//!
+//! 2. **Manifest** (`manifest.enc`): a single encrypted file containing a
+//!    [`Manifest`] -- a map from entry IDs to [`ManifestEntry`] summaries.
+//!    This lets the CLI list and search entries by decrypting only one file,
+//!    rather than decrypting every entry in the vault.
+//!
+//! ## Entry IDs
+//!
+//! Entry IDs are random 8-character lowercase hex strings (4 bytes of entropy,
+//! ~4 billion possible values). This is sufficient for family-scale vaults while
+//! keeping filenames short and filesystem-friendly.
+//!
+//! ## Serialization strategy
+//!
+//! All structs derive `Serialize`/`Deserialize` for JSON encoding. Optional fields
+//! use `#[serde(skip_serializing_if = "Option::is_none")]` to keep the JSON compact
+//! -- omitting null fields reduces ciphertext size and avoids leaking structural
+//! information about which optional fields a credential uses.
+
 use rand::Rng;
 use serde::{Deserialize, Serialize};
 use std::collections::HashMap;

-/// A single password entry (stored encrypted in entries/<id>.enc).
+/// A full credential entry stored encrypted in `entries/<id>.enc`.
+///
+/// Contains all sensitive data for a single credential. Each entry is encrypted
+/// independently, so accessing one entry does not require decrypting others.
+///
+/// ## Fields
+///
+/// - `name`: human-readable label (e.g., "GitHub", "Work Email"). Required.
+/// - `url`: the login URL. Optional; used for autofill matching in the browser extension.
+/// - `username`: the account username or email. Optional.
+/// - `password`: the credential password. Required (this is the core secret).
+/// - `notes`: free-form text (e.g., security questions, recovery codes). Optional.
+/// - `totp_secret`: base32-encoded TOTP secret for 2FA. Optional.
+/// - `created_at`: ISO 8601 timestamp (or Unix seconds) when the entry was created.
+/// - `updated_at`: ISO 8601 timestamp (or Unix seconds) of the last modification.
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct Entry {
    pub name: String,
@@ -19,25 +59,46 @@ pub struct Entry {
    pub updated_at: String,
 }

-/// Summary info about an entry (stored in the manifest).
+/// Summary metadata for a single entry, stored in the manifest.
+///
+/// This is a lightweight projection of [`Entry`] that contains only the
+/// non-sensitive fields needed for listing and searching. The password,
+/// notes, and TOTP secret are intentionally excluded so that listing
+/// entries requires decrypting only the manifest, not every individual entry.
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct ManifestEntry {
+    /// Human-readable label for display and search matching.
    pub name: String,
+    /// Login URL for search matching and browser extension autofill.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub url: Option<String>,
+    /// Account username for display in entry listings.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub username: Option<String>,
+    /// Timestamp of last modification, used for sorting and display.
    pub updated_at: String,
 }

-/// The vault manifest — maps entry IDs to their metadata.
+/// The vault manifest -- an encrypted index mapping entry IDs to their metadata.
+///
+/// The manifest serves two purposes:
+///
+/// 1. **Efficient listing**: decrypting the single manifest file is enough to show
+///    all entry names, URLs, and usernames without touching individual entry files.
+/// 2. **Search**: the [`search`](Manifest::search) method performs case-insensitive
+///    substring matching against entry names and URLs.
+///
+/// The `version` field allows future schema migrations if the manifest format evolves.
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct Manifest {
+    /// Map from entry ID (8-char hex string) to entry metadata.
    pub entries: HashMap<String, ManifestEntry>,
+    /// Schema version. Currently always `1`.
    pub version: u32,
 }

 impl Manifest {
+    /// Create a new empty manifest with version 1.
    pub fn new() -> Self {
        Manifest {
            entries: HashMap::new(),
@@ -45,14 +106,23 @@ impl Manifest {
        }
    }

+    /// Insert or update an entry in the manifest.
+    ///
+    /// If an entry with the same ID already exists, it is overwritten.
+    /// This is used both for `add` (new entry) and `edit` (update existing).
    pub fn add_entry(&mut self, id: String, entry: ManifestEntry) {
        self.entries.insert(id, entry);
    }

+    /// Remove an entry from the manifest by ID, returning its metadata if it existed.
    pub fn remove_entry(&mut self, id: &str) -> Option<ManifestEntry> {
        self.entries.remove(id)
    }

+    /// Search entries by case-insensitive substring match against name and URL.
+    ///
+    /// Returns a vector of `(id, entry)` pairs for all matching entries. An entry
+    /// matches if the query appears in its name or URL (case-insensitive).
    pub fn search(&self, query: &str) -> Vec<(&String, &ManifestEntry)> {
        let q = query.to_lowercase();
        self.entries
@@ -75,6 +145,10 @@ impl Default for Manifest {
 }

 /// Generate a random 8-character hex string to use as an entry ID.
+///
+/// Uses 4 random bytes (32 bits of entropy), producing IDs like `"a1b2c3d4"`.
+/// This gives ~4 billion possible values, which is more than sufficient for
+/// a family-scale vault (typically < 1000 entries).
 pub fn generate_entry_id() -> String {
    let mut rng = rand::thread_rng();
    let bytes: [u8; 4] = rng.gen();
--- a/crates/idfoto-core/src/error.rs
+++ b/crates/idfoto-core/src/error.rs
@@ -1,25 +1,59 @@
+//! Unified error type for the idfoto-core crate.
+//!
+//! Every fallible function in this crate returns [`Result<T>`], which is an alias
+//! for `std::result::Result<T, IdfotoError>`. Using a single error enum keeps the
+//! public API surface predictable and makes error handling in callers (CLI, WASM
+//! bindings, mobile FFI) straightforward.
+
 use thiserror::Error;

+/// All errors that can originate from idfoto-core operations.
+///
+/// Variants are ordered roughly by the pipeline stage where they occur:
+/// KDF -> encryption -> decryption -> format parsing -> entry lookup -> image
+/// steganography -> serialization -> device keys.
 #[derive(Debug, Error)]
 pub enum IdfotoError {
+    /// The Argon2id key derivation failed. This typically means invalid KDF
+    /// parameters were supplied (e.g., memory cost below Argon2's minimum).
    #[error("key derivation failed: {0}")]
    Kdf(String),

+    /// XChaCha20-Poly1305 encryption failed. In practice this is extremely rare
+    /// -- the only realistic cause is an internal library error, since the cipher
+    /// accepts arbitrary-length plaintext.
    #[error("encryption failed: {0}")]
    Encrypt(String),

+    /// Authenticated decryption failed. This means either the wrong master key
+    /// was used (wrong passphrase or wrong reference image) or the ciphertext
+    /// was tampered with / corrupted in transit or at rest. The error message is
+    /// intentionally vague to avoid leaking information about which factor was
+    /// wrong (passphrase vs. image).
    #[error("decryption failed: wrong key or corrupted data")]
    Decrypt,

+    /// The binary ciphertext blob does not match the expected format (e.g.,
+    /// too short to contain the version byte + nonce + tag, or an unrecognized
+    /// version byte). This usually indicates file corruption or a version
+    /// mismatch between the writer and reader.
    #[error("invalid vault format: {0}")]
    Format(String),

+    /// A vault entry was looked up by ID but does not exist in the manifest.
+    /// The string payload is the missing entry ID.
    #[error("entry not found: {0}")]
    EntryNotFound(String),

+    /// A general error from the image steganography subsystem (imgsecret).
+    /// Covers issues like failing to decode the carrier JPEG or failing to
+    /// encode the output JPEG after modification.
    #[error("imgsecret: {0}")]
    ImgSecret(String),

+    /// The carrier image is too small to hold the embedded secret with
+    /// sufficient redundancy. The embed region (central 70% of the image)
+    /// must contain at least `BLOCKS_PER_COPY * MIN_COPIES` 8x8 blocks.
    #[error("image too small: need at least {min_width}x{min_height}, got {actual_width}x{actual_height}")]
    ImageTooSmall {
        min_width: u32,
@@ -28,14 +62,25 @@ pub enum IdfotoError {
        actual_height: u32,
    },

+    /// Secret extraction from a JPEG failed. This can mean:
+    /// - The image never had a secret embedded in it.
+    /// - The image was recompressed below Q85, destroying the QIM watermarks.
+    /// - The image was cropped beyond the 15% crumple zone.
+    /// - Majority-vote confidence fell below the 60% threshold on one or more bits.
    #[error("extraction failed: no valid secret found in image")]
    ExtractionFailed,

+    /// JSON serialization or deserialization of an entry or manifest failed.
+    /// Wraps [`serde_json::Error`] transparently via `#[from]`.
    #[error("json error: {0}")]
    Json(#[from] serde_json::Error),

+    /// An error related to device ed25519 key operations. Device keys are
+    /// separate from the vault KDF -- revoking a device does not require
+    /// rotating the passphrase or reference image.
    #[error("device key error: {0}")]
    DeviceKey(String),
 }

+/// Crate-wide result alias, reducing boilerplate in function signatures.
 pub type Result<T> = std::result::Result<T, IdfotoError>;
--- a/crates/idfoto-core/src/imgsecret.rs
+++ b/crates/idfoto-core/src/imgsecret.rs
@@ -1,7 +1,43 @@
-//! DCT-based secret embedding that survives JPEG re-encoding and mild cropping.
+//! DCT-based steganographic embedding of a 256-bit secret in JPEG images.
 //!
-//! Hides a 256-bit secret in the mid-frequency DCT coefficients of the luminance
-//! channel using Quantization Index Modulation (QIM) with majority voting.
+//! This is the novel component of idfoto. It hides a 32-byte secret inside a
+//! JPEG image's luminance channel using Quantization Index Modulation (QIM) on
+//! mid-frequency DCT coefficients, with majority voting across multiple redundant
+//! copies for robustness.
+//!
+//! ## High-level algorithm
+//!
+//! ### Embedding (`embed`)
+//!
+//! 1. Decode the carrier JPEG and extract the luminance (Y) channel.
+//! 2. Compute the "embed region" -- the central 70% of the image (15% margin
+//!    on each side acts as a crumple zone for mild cropping).
+//! 3. Divide the embed region into 8x8 pixel blocks and select evenly-spaced
+//!    blocks for embedding.
+//! 4. For each copy of the secret (5-50 copies depending on image size):
+//!    - For each of the 22 blocks needed to hold 256 bits (12 bits per block):
+//!      - Apply the 2D DCT to the 8x8 block.
+//!      - Embed bits into 12 mid-frequency DCT coefficients using QIM.
+//!      - Apply the inverse DCT to write the modified block back.
+//! 5. Reconstruct the JPEG by replacing only the Y channel and re-encoding.
+//!
+//! ### Extraction (`extract`)
+//!
+//! 1. Decode the JPEG and extract the Y channel.
+//! 2. Try the canonical extraction (assuming the image is uncropped).
+//! 3. If that fails, try crop-recovery: search for plausible original dimensions
+//!    and pixel offsets, reconstructing the block grid accordingly.
+//! 4. For each copy of the secret, extract bits from DCT coefficients via QIM.
+//! 5. Majority-vote each bit position across all copies. Require >= 60% confidence.
+//!
+//! ## Robustness
+//!
+//! The combination of QIM with a high quantization step (50.0), mid-frequency
+//! coefficient placement, and majority voting across many copies makes the
+//! watermark survive:
+//! - JPEG recompression down to quality ~85
+//! - Mild cropping (up to ~10% from edges, within the 15% crumple zone)
+//! - Color space conversions (embedding is in luminance only)

 use crate::error::{IdfotoError, Result};
 use image::codecs::jpeg::JpegEncoder;
@@ -12,15 +48,55 @@ use std::io::Cursor;

 // ─── Constants ───────────────────────────────────────────────────────────────

+/// DCT block size. JPEG uses 8x8 blocks, so we match that to minimize
+/// interference with the JPEG codec's own quantization.
 const BLOCK_SIZE: usize = 8;
+
+/// QIM quantization step. Higher values make the watermark more robust to
+/// recompression but introduce more visible artifacts. A value of 50.0 is
+/// higher than the typical academic value of 25 -- this is intentional because
+/// we need to survive JPEG recompression at Q85 and below, which applies
+/// aggressive quantization to mid-frequency coefficients. The trade-off is
+/// acceptable because the reference image is a personal photo, not a
+/// publication-quality image.
 const QUANT_STEP: f64 = 50.0;
+
+/// Minimum image dimension (width or height) in pixels. Images smaller than
+/// this cannot hold enough 8x8 blocks for reliable embedding.
 const MIN_DIMENSION: u32 = 100;
+
+/// Number of secret bits to embed: 256 bits = 32 bytes.
 const SECRET_BITS: usize = 256;
+
+/// Minimum number of redundant copies of the secret. More copies improve
+/// extraction reliability via majority voting, but require more blocks.
 const MIN_COPIES: usize = 5;
+
+/// Number of mid-frequency DCT positions used per block. Each block carries
+/// 12 bits of the secret. This matches `EMBED_POSITIONS.len()`.
 const BITS_PER_BLOCK: usize = 12; // EMBED_POSITIONS.len()
+
+/// Number of 8x8 blocks needed to hold one complete copy of the 256-bit secret.
+/// ceil(256 / 12) = 22 blocks per copy.
 const BLOCKS_PER_COPY: usize = (SECRET_BITS + BITS_PER_BLOCK - 1) / BITS_PER_BLOCK; // 22

-/// Mid-frequency DCT positions (zig-zag positions 4–15)
+/// Mid-frequency DCT coefficient positions for embedding, specified as
+/// (row, col) indices into the 8x8 DCT coefficient matrix.
+///
+/// These correspond to zig-zag scan positions 4 through 15 -- the "sweet spot"
+/// between low-frequency coefficients (which carry visible image structure and
+/// are heavily quantized by JPEG) and high-frequency coefficients (which carry
+/// noise/detail and are aggressively zeroed by JPEG compression).
+///
+/// Mid-frequency coefficients survive JPEG recompression better than high-frequency
+/// ones, while causing less visible distortion than modifying low-frequency ones.
+///
+/// The zig-zag ordering is the standard JPEG scan order:
+/// ```text
+/// Zig-zag positions 4-7:   (0,3) (1,2) (2,1) (3,0)
+/// Zig-zag positions 8-11:  (0,4) (1,3) (2,2) (3,1)
+/// Zig-zag positions 12-15: (4,0) (0,5) (1,4) (2,3)
+/// ```
 const EMBED_POSITIONS: [(usize, usize); 12] = [
    (0, 3),
    (1, 2),
@@ -38,17 +114,31 @@ const EMBED_POSITIONS: [(usize, usize); 12] = [

 // ─── YChannel ────────────────────────────────────────────────────────────────

+/// The luminance (Y) channel of an image, stored as a flat array of f64 values.
+///
+/// We embed exclusively in the luminance channel because:
+/// - Human vision is more sensitive to luminance than chrominance, so the
+///   luminance channel has more "room" for watermarking in the frequency domain.
+/// - JPEG compresses chrominance channels more aggressively (typically 4:2:0
+///   subsampling), which would destroy embedded data.
+/// - Working with a single channel keeps the DCT operations simple and fast.
 struct YChannel {
+    /// Row-major luminance values. `data[y * width + x]` gives the luminance
+    /// at pixel (x, y). Values are in the range [0, 255] after extraction
+    /// from RGB, but may temporarily go slightly outside this range during
+    /// DCT manipulation.
    data: Vec<f64>,
    width: usize,
    height: usize,
 }

 impl YChannel {
+    /// Get the luminance value at pixel (x, y).
    fn get(&self, x: usize, y: usize) -> f64 {
        self.data[y * self.width + x]
    }

+    /// Set the luminance value at pixel (x, y).
    fn set(&mut self, x: usize, y: usize, val: f64) {
        self.data[y * self.width + x] = val;
    }
@@ -56,19 +146,36 @@ impl YChannel {

 // ─── EmbedRegion ─────────────────────────────────────────────────────────────

+/// Defines the central region of the image where embedding occurs.
+///
+/// The embed region is the central 70% of the image -- a 15% margin is excluded
+/// on each side. This margin acts as a "crumple zone": if the image is mildly
+/// cropped (e.g., a social media platform trims edges), the embedded data in the
+/// center remains intact. The 15% margin is sufficient to tolerate up to ~10%
+/// cropping from any single edge.
 struct EmbedRegion {
+    /// Pixel offset from the left edge to the start of the embed region.
    x_offset: usize,
+    /// Pixel offset from the top edge to the start of the embed region.
    y_offset: usize,
+    /// Width of the embed region in pixels.
    #[allow(dead_code)]
    region_width: usize,
+    /// Height of the embed region in pixels.
    #[allow(dead_code)]
    region_height: usize,
+    /// Number of complete 8x8 blocks that fit horizontally in the embed region.
    blocks_x: usize,
+    /// Number of complete 8x8 blocks that fit vertically in the embed region.
    blocks_y: usize,
 }

 // ─── Helper functions ────────────────────────────────────────────────────────

+/// Decode a JPEG from raw bytes and extract the luminance (Y) channel.
+///
+/// Converts each RGB pixel to luminance using the ITU-R BT.601 formula:
+/// `Y = 0.299*R + 0.587*G + 0.114*B`
 fn extract_y_channel(jpeg_bytes: &[u8]) -> Result<YChannel> {
    let reader = ImageReader::new(Cursor::new(jpeg_bytes))
        .with_guessed_format()
@@ -82,6 +189,7 @@ fn extract_y_channel(jpeg_bytes: &[u8]) -> Result<YChannel> {
    for y in 0..height {
        for x in 0..width {
            let p = rgb.get_pixel(x as u32, y as u32);
+            // ITU-R BT.601 luma coefficients
            let luma = 0.299 * p[0] as f64 + 0.587 * p[1] as f64 + 0.114 * p[2] as f64;
            data.push(luma);
        }
@@ -93,10 +201,15 @@ fn extract_y_channel(jpeg_bytes: &[u8]) -> Result<YChannel> {
    })
 }

+/// Compute the embed region for a YChannel (convenience wrapper).
 fn central_region(y: &YChannel) -> EmbedRegion {
    compute_region(y.width, y.height)
 }

+/// Compute the central embed region for given image dimensions.
+///
+/// The region excludes a 15% margin on each side, leaving the central 70%.
+/// The margin acts as a crumple zone for crop tolerance.
 fn compute_region(width: usize, height: usize) -> EmbedRegion {
    let margin_x = (width as f64 * 0.15) as usize;
    let margin_y = (height as f64 * 0.15) as usize;
@@ -116,6 +229,11 @@ fn compute_region(width: usize, height: usize) -> EmbedRegion {
    }
 }

+/// Read an 8x8 pixel block from the Y channel at absolute pixel coordinates.
+///
+/// Returns `None` if the block would extend beyond the image boundaries
+/// (used during crop-recovery extraction where some blocks may have been
+/// cropped away).
 fn read_block_abs(y: &YChannel, px: usize, py: usize) -> Option<[[f64; 8]; 8]> {
    if px + 8 > y.width || py + 8 > y.height {
        return None;
@@ -129,12 +247,16 @@ fn read_block_abs(y: &YChannel, px: usize, py: usize) -> Option<[[f64; 8]; 8]> {
    Some(block)
 }

+/// Read an 8x8 block from the Y channel using block coordinates relative to
+/// the embed region.
 fn read_block(y: &YChannel, bx: usize, by: usize, region: &EmbedRegion) -> [[f64; 8]; 8] {
    let start_x = region.x_offset + bx * BLOCK_SIZE;
    let start_y = region.y_offset + by * BLOCK_SIZE;
    read_block_abs(y, start_x, start_y).unwrap()
 }

+/// Write an 8x8 block back to the Y channel using block coordinates relative
+/// to the embed region.
 fn write_block(y: &mut YChannel, bx: usize, by: usize, region: &EmbedRegion, block: &[[f64; 8]; 8]) {
    let start_x = region.x_offset + bx * BLOCK_SIZE;
    let start_y = region.y_offset + by * BLOCK_SIZE;
@@ -146,7 +268,22 @@ fn write_block(y: &mut YChannel, bx: usize, by: usize, region: &EmbedRegion, blo
 }

 // ─── DCT ─────────────────────────────────────────────────────────────────────
+//
+// The Discrete Cosine Transform (DCT) converts a spatial-domain signal (pixel
+// values) into a frequency-domain representation (coefficients). JPEG compression
+// itself uses the 8x8 Type-II DCT, so working in the same domain lets us embed
+// data where JPEG's own quantization is least destructive.
+//
+// We implement the DCT from scratch (rather than depending on a library) to keep
+// the crate dependency-light and WASM-friendly. The 8x8 size is small enough
+// that the naive O(N^2) computation is fast.

+/// 1D Type-II DCT of an 8-element signal.
+///
+/// Applies the orthonormal DCT-II:
+///   X[k] = c(k) * sum_{i=0}^{7} x[i] * cos((2i+1)*k*pi/16)
+///
+/// where c(0) = sqrt(1/8) and c(k) = sqrt(2/8) for k > 0.
 fn dct1d(input: &[f64; 8]) -> [f64; 8] {
    let mut output = [0.0f64; 8];
    for k in 0..8 {
@@ -164,6 +301,10 @@ fn dct1d(input: &[f64; 8]) -> [f64; 8] {
    output
 }

+/// 1D Type-III DCT (inverse DCT) of an 8-element signal.
+///
+/// Reconstructs the spatial-domain signal from DCT coefficients:
+///   x[i] = sum_{k=0}^{7} c(k) * X[k] * cos((2i+1)*k*pi/16)
 fn idct1d(input: &[f64; 8]) -> [f64; 8] {
    let mut output = [0.0f64; 8];
    for i in 0..8 {
@@ -181,11 +322,18 @@ fn idct1d(input: &[f64; 8]) -> [f64; 8] {
    output
 }

+/// 2D DCT of an 8x8 block, computed as separable 1D DCTs.
+///
+/// First applies the 1D DCT to each row, then to each column of the result.
+/// This is mathematically equivalent to the full 2D DCT but faster (O(N^3)
+/// instead of O(N^4) for the naive 2D formulation).
 fn dct2_8x8(block: &[[f64; 8]; 8]) -> [[f64; 8]; 8] {
+    // Step 1: DCT along rows
    let mut temp = [[0.0f64; 8]; 8];
    for row in 0..8 {
        temp[row] = dct1d(&block[row]);
    }
+    // Step 2: DCT along columns
    let mut result = [[0.0f64; 8]; 8];
    for col in 0..8 {
        let mut column = [0.0f64; 8];
@@ -200,7 +348,12 @@ fn dct2_8x8(block: &[[f64; 8]; 8]) -> [[f64; 8]; 8] {
    result
 }

+/// 2D inverse DCT of an 8x8 block, computed as separable 1D inverse DCTs.
+///
+/// Reverses the 2D DCT: first applies IDCT along columns, then along rows.
+/// (The order is reversed compared to the forward transform.)
 fn idct2_8x8(block: &[[f64; 8]; 8]) -> [[f64; 8]; 8] {
+    // Step 1: IDCT along columns
    let mut temp = [[0.0f64; 8]; 8];
    for col in 0..8 {
        let mut column = [0.0f64; 8];
@@ -212,6 +365,7 @@ fn idct2_8x8(block: &[[f64; 8]; 8]) -> [[f64; 8]; 8] {
            temp[row][col] = transformed[row];
        }
    }
+    // Step 2: IDCT along rows
    let mut result = [[0.0f64; 8]; 8];
    for row in 0..8 {
        result[row] = idct1d(&temp[row]);
@@ -220,7 +374,28 @@ fn idct2_8x8(block: &[[f64; 8]; 8]) -> [[f64; 8]; 8] {
 }

 // ─── QIM ─────────────────────────────────────────────────────────────────────
+//
+// Quantization Index Modulation (QIM) is the core technique for encoding bits
+// into DCT coefficients. It works by quantizing each coefficient to one of two
+// interleaved grids, where the grid selection encodes the bit value.
+//
+// For bit 0: quantize to the nearest multiple of Q  (grid: ..., -Q, 0, Q, 2Q, ...)
+// For bit 1: quantize to the nearest multiple of Q, offset by Q/2  (grid: ..., -Q/2, Q/2, 3Q/2, ...)
+//
+// Extraction simply measures which grid the coefficient is closest to.
+//
+// QIM is preferred over spread-spectrum or LSB methods because it is:
+// - Robust to recompression (the quantization step is larger than JPEG's own)
+// - Simple to implement and analyze
+// - Deterministic (no pseudo-random spreading sequence to synchronize)

+/// Embed a single bit into a DCT coefficient using QIM.
+///
+/// Quantizes the coefficient to the nearest point on the grid selected by `bit`:
+/// - `bit=0`: grid at multiples of `q` (i.e., 0, q, 2q, ...)
+/// - `bit=1`: grid at multiples of `q` offset by `q/2` (i.e., q/2, 3q/2, ...)
+///
+/// The returned value is the modified coefficient.
 fn qim_embed(coef: f64, bit: u8, q: f64) -> f64 {
    let offset = if bit == 1 { q / 2.0 } else { 0.0 };
    let shifted = coef - offset;
@@ -228,8 +403,15 @@ fn qim_embed(coef: f64, bit: u8, q: f64) -> f64 {
    quantized + offset
 }

+/// Extract a single bit from a DCT coefficient using QIM.
+///
+/// Computes the distance from the coefficient to each grid (bit-0 grid and
+/// bit-1 grid) and returns whichever grid is closer. This is the ML (maximum
+/// likelihood) decoder for QIM under additive noise.
 fn qim_extract(coef: f64, q: f64) -> u8 {
+    // Distance to the nearest bit-0 grid point
    let d0 = (coef - (coef / q).round() * q).abs();
+    // Distance to the nearest bit-1 grid point (offset by q/2)
    let offset = q / 2.0;
    let shifted = coef - offset;
    let d1 = (shifted - (shifted / q).round() * q).abs();
@@ -238,6 +420,10 @@ fn qim_extract(coef: f64, q: f64) -> u8 {

 // ─── Bit conversion ──────────────────────────────────────────────────────────

+/// Convert a byte slice to a vector of individual bits (MSB first).
+///
+/// Each byte is expanded to 8 bits, with bit 7 (MSB) first.
+/// Example: `[0xCA]` -> `[1, 1, 0, 0, 1, 0, 1, 0]`
 fn bytes_to_bits(bytes: &[u8]) -> Vec<u8> {
    let mut bits = Vec::with_capacity(bytes.len() * 8);
    for &byte in bytes {
@@ -248,6 +434,9 @@ fn bytes_to_bits(bytes: &[u8]) -> Vec<u8> {
    bits
 }

+/// Convert a vector of individual bits (MSB first) back to bytes.
+///
+/// Pads the last byte with zeros if the bit count is not a multiple of 8.
 fn bits_to_bytes(bits: &[u8]) -> Vec<u8> {
    let mut bytes = Vec::with_capacity((bits.len() + 7) / 8);
    for chunk in bits.chunks(8) {
@@ -263,7 +452,18 @@ fn bits_to_bytes(bits: &[u8]) -> Vec<u8> {
 // ─── Block selection ─────────────────────────────────────────────────────────

 /// Compute the absolute pixel positions of embed blocks for a given image size.
-/// Returns Vec<(px, py)> — top-left corners of 8×8 blocks.
+///
+/// This function deterministically maps image dimensions to a list of block
+/// positions. Both the embedder and extractor call this function with the same
+/// dimensions to agree on where blocks are. During crop recovery, the extractor
+/// tries different assumed original dimensions to find the correct grid.
+///
+/// Returns `Vec<(px, py)>` -- top-left corners of 8x8 blocks in pixel coordinates.
+/// Returns an empty vec if the image is too small to embed.
+///
+/// Blocks are selected with even spacing (stride) across the embed region to
+/// spread the watermark uniformly, making it more resilient to localized damage.
+/// The number of copies is capped at 50 to avoid diminishing returns.
 fn compute_embed_positions(img_width: usize, img_height: usize) -> Vec<(usize, usize)> {
    let region = compute_region(img_width, img_height);
    let total_blocks = region.blocks_x * region.blocks_y;
@@ -273,6 +473,7 @@ fn compute_embed_positions(img_width: usize, img_height: usize) -> Vec<(usize, u
    let num_copies = (total_blocks / BLOCKS_PER_COPY).min(50);
    let target_count = num_copies * BLOCKS_PER_COPY;

+    // Stride ensures blocks are evenly distributed across the embed region
    let stride = (total_blocks / target_count).max(1);
    let mut positions = Vec::with_capacity(target_count);
    let mut idx = 0;
@@ -287,11 +488,17 @@ fn compute_embed_positions(img_width: usize, img_height: usize) -> Vec<(usize, u
    positions
 }

+/// Select embed blocks using block-coordinate indices relative to the embed region.
+///
+/// Similar to [`compute_embed_positions`] but returns `(bx, by)` block indices
+/// rather than absolute pixel positions. Used during embedding where block
+/// coordinates are more convenient for the read_block/write_block API.
 fn select_embed_blocks(region: &EmbedRegion, target_count: usize) -> Vec<(usize, usize)> {
    let total_blocks = region.blocks_x * region.blocks_y;
    if total_blocks == 0 || target_count == 0 {
        return Vec::new();
    }
+    // Even stride distributes blocks uniformly across the region
    let stride = (total_blocks / target_count).max(1);
    let mut blocks = Vec::with_capacity(target_count);
    let mut idx = 0;
@@ -306,6 +513,17 @@ fn select_embed_blocks(region: &EmbedRegion, target_count: usize) -> Vec<(usize,

 // ─── Reconstruct JPEG ────────────────────────────────────────────────────────

+/// Reconstruct a JPEG image after modifying its luminance channel.
+///
+/// This function takes the original JPEG (for its Cb/Cr chrominance data) and
+/// the modified Y channel, then:
+///
+/// 1. Decodes the original JPEG to get per-pixel Cb and Cr values.
+/// 2. For each pixel, combines the modified Y with the original Cb/Cr.
+/// 3. Converts YCbCr back to RGB using the ITU-R BT.601 inverse formula.
+/// 4. Re-encodes as JPEG at quality 92 (high enough to preserve the watermark).
+///
+/// Only the luminance changes; chrominance is preserved from the original.
 fn reconstruct_jpeg(original_jpeg: &[u8], y_modified: &YChannel) -> Result<Vec<u8>> {
    let reader = ImageReader::new(Cursor::new(original_jpeg))
        .with_guessed_format()
@@ -325,12 +543,15 @@ fn reconstruct_jpeg(original_jpeg: &[u8], y_modified: &YChannel) -> Result<Vec<u
            let g = orig[1] as f64;
            let b = orig[2] as f64;

+            // Extract Cb and Cr from the original pixel (we only modify Y)
            let _y_orig = 0.299 * r + 0.587 * g + 0.114 * b;
            let cb = -0.168736 * r - 0.331264 * g + 0.5 * b + 128.0;
            let cr = 0.5 * r - 0.418688 * g - 0.081312 * b + 128.0;

+            // Use the modified Y value from our watermarked luminance channel
            let y_new = y_modified.get(px as usize, py as usize);

+            // Convert YCbCr -> RGB using ITU-R BT.601 inverse
            let r_new = y_new + 1.402 * (cr - 128.0);
            let g_new = y_new - 0.344136 * (cb - 128.0) - 0.714136 * (cr - 128.0);
            let b_new = y_new + 1.772 * (cb - 128.0);
@@ -357,7 +578,28 @@ fn reconstruct_jpeg(original_jpeg: &[u8], y_modified: &YChannel) -> Result<Vec<u

 // ─── Public API ──────────────────────────────────────────────────────────────

-/// Embed a 256-bit secret into a carrier JPEG. Returns modified JPEG bytes.
+/// Embed a 256-bit secret into a carrier JPEG image.
+///
+/// Returns the modified JPEG bytes with the secret hidden in the luminance
+/// channel's mid-frequency DCT coefficients.
+///
+/// ## Pipeline
+///
+/// 1. Decode the carrier and extract the Y (luminance) channel.
+/// 2. Validate that the image is large enough (>= 100x100 pixels, and enough
+///    blocks in the central region for at least 5 redundant copies).
+/// 3. Compute how many copies fit (up to 50) and select evenly-spaced blocks.
+/// 4. For each copy, iterate through the 22 blocks that hold 256 bits:
+///    - Forward DCT the 8x8 block.
+///    - Embed 12 bits per block into the mid-frequency coefficients via QIM.
+///    - Inverse DCT to write the modified spatial-domain values back.
+/// 5. Reconstruct the JPEG with the modified Y channel and original Cb/Cr.
+///
+/// # Errors
+///
+/// - [`IdfotoError::ImageTooSmall`] if the image is below minimum dimensions
+///   or does not have enough blocks for reliable embedding.
+/// - [`IdfotoError::ImgSecret`] if the image cannot be decoded or re-encoded.
 pub fn embed(carrier_jpeg: &[u8], secret: &[u8; 32]) -> Result<Vec<u8>> {
    let mut y = extract_y_channel(carrier_jpeg)?;

@@ -382,12 +624,15 @@ pub fn embed(carrier_jpeg: &[u8], secret: &[u8; 32]) -> Result<Vec<u8>> {
        });
    }

+    // Cap at 50 copies -- beyond that, additional redundancy has diminishing
+    // returns and the image modification becomes more visible.
    let num_copies = (total_blocks / BLOCKS_PER_COPY).min(50);
    let bits = bytes_to_bits(secret);

    let blocks_needed = num_copies * BLOCKS_PER_COPY;
    let embed_blocks = select_embed_blocks(&region, blocks_needed);

+    // Embed each copy of the secret into its assigned blocks
    for copy in 0..num_copies {
        for block_idx in 0..BLOCKS_PER_COPY {
            let global_idx = copy * BLOCKS_PER_COPY + block_idx;
@@ -398,6 +643,8 @@ pub fn embed(carrier_jpeg: &[u8], secret: &[u8; 32]) -> Result<Vec<u8>> {
            let mut block = read_block(&y, bx, by, &region);
            let mut dct = dct2_8x8(&block);

+            // Embed up to 12 bits (BITS_PER_BLOCK) in this block's
+            // mid-frequency DCT coefficients
            for (pos_idx, &(row, col)) in EMBED_POSITIONS.iter().enumerate() {
                let bit_idx = block_idx * BITS_PER_BLOCK + pos_idx;
                if bit_idx >= SECRET_BITS {
@@ -414,14 +661,31 @@ pub fn embed(carrier_jpeg: &[u8], secret: &[u8; 32]) -> Result<Vec<u8>> {
    reconstruct_jpeg(carrier_jpeg, &y)
 }

-/// Extract a 256-bit secret from a (possibly re-encoded/cropped) JPEG.
+/// Extract a 256-bit secret from a (possibly re-encoded or mildly cropped) JPEG.
+///
+/// Delegates to [`extract_with_crop_recovery`] which first tries canonical
+/// extraction (assuming the image has its original dimensions), then falls back
+/// to searching for plausible original dimensions if the image was cropped.
+///
+/// # Errors
+///
+/// - [`IdfotoError::ExtractionFailed`] if no valid secret could be recovered
+///   (image was never watermarked, or was too heavily recompressed/cropped).
 pub fn extract(jpeg_bytes: &[u8]) -> Result<[u8; 32]> {
    extract_with_crop_recovery(jpeg_bytes)
 }

-/// Try to extract using a specific assumed original image size and pixel offset.
-/// `orig_w`/`orig_h` determine the block layout (which blocks, how many copies).
-/// `dx`/`dy` shift all block positions when reading from the actual image.
+/// Attempt to extract the secret assuming specific original image dimensions
+/// and a pixel offset (for crop recovery).
+///
+/// The block grid is computed based on `orig_w`/`orig_h` (the assumed original
+/// dimensions), and then each block position is shifted by `dx`/`dy` when
+/// reading from the actual (possibly cropped) image.
+///
+/// Uses majority voting across all copies: for each of the 256 bit positions,
+/// the extracted bit from every copy votes, and the majority wins. A minimum
+/// confidence threshold of 60% is required -- below that, the extraction is
+/// considered unreliable and fails.
 fn try_extract_with_layout(
    y: &YChannel,
    orig_w: usize,
@@ -438,6 +702,7 @@ fn try_extract_with_layout(
    let total_blocks = region.blocks_x * region.blocks_y;
    let num_copies = (total_blocks / BLOCKS_PER_COPY).min(50);

+    // Accumulate votes for each bit position across all copies
    let mut votes_one = vec![0usize; SECRET_BITS];
    let mut votes_total = vec![0usize; SECRET_BITS];

@@ -447,6 +712,8 @@ fn try_extract_with_layout(
            if global_idx >= positions.len() {
                break;
            }
+            // Apply crop offset to find the actual block position in the
+            // (possibly cropped) image
            let (orig_px, orig_py) = positions[global_idx];
            let actual_px = orig_px as isize + dx;
            let actual_py = orig_py as isize + dy;
@@ -462,6 +729,7 @@ fn try_extract_with_layout(
            };
            let dct = dct2_8x8(&block);

+            // Extract bits from mid-frequency coefficients and tally votes
            for (pos_idx, &(row, col)) in EMBED_POSITIONS.iter().enumerate() {
                let bit_idx = block_idx * BITS_PER_BLOCK + pos_idx;
                if bit_idx >= SECRET_BITS {
@@ -476,7 +744,9 @@ fn try_extract_with_layout(
        }
    }

-    // Majority vote with confidence check
+    // Majority vote with confidence check: each bit must have >= 60% agreement
+    // across copies. Below that threshold, the watermark is considered too
+    // degraded for reliable extraction.
    let mut result_bits = vec![0u8; SECRET_BITS];
    for i in 0..SECRET_BITS {
        if votes_total[i] == 0 {
@@ -498,6 +768,19 @@ fn try_extract_with_layout(
    Ok(secret)
 }

+/// Extract with automatic crop recovery.
+///
+/// Tries extraction in order of decreasing likelihood:
+///
+/// 1. **Uncropped**: assume the image has its original dimensions (most common case).
+/// 2. **Width-only crop (8-pixel aligned)**: try original widths from current up to
+///    +20%, stepping by 8 pixels (JPEG block alignment). Assumes right-side crop
+///    (left edge unchanged, dx=0).
+/// 3. **Height-only crop (8-pixel aligned)**: same strategy for vertical crops.
+/// 4. **Width crop (non-aligned)**: finer 1-pixel step for non-block-aligned crops.
+///
+/// The search space is limited to 20% expansion in each dimension, which covers
+/// the 15% crumple zone plus some margin for measurement error.
 fn extract_with_crop_recovery(jpeg_bytes: &[u8]) -> Result<[u8; 32]> {
    let y = extract_y_channel(jpeg_bytes)?;

@@ -505,7 +788,7 @@ fn extract_with_crop_recovery(jpeg_bytes: &[u8]) -> Result<[u8; 32]> {
        return Err(IdfotoError::ExtractionFailed);
    }

-    // Try assuming the image is uncropped (original size = current size)
+    // Try 1: assume the image is uncropped (original size = current size)
    if let Ok(secret) = try_extract_with_layout(&y, y.width, y.height, 0, 0) {
        return Ok(secret);
    }
@@ -522,7 +805,7 @@ fn extract_with_crop_recovery(jpeg_bytes: &[u8]) -> Result<[u8; 32]> {
    let max_orig_w = (y.width as f64 * 1.20) as usize;
    let max_orig_h = (y.height as f64 * 1.20) as usize;

-    // Try width-only crops first (most common: crop from one side)
+    // Try 2: width-only crops, block-aligned steps (most common crop scenario)
    for orig_w in (y.width..=max_orig_w).step_by(BLOCK_SIZE) {
        // Right-side crop: dx = 0 (left edge unchanged)
        if let Ok(secret) = try_extract_with_layout(&y, orig_w, y.height, 0, 0) {
@@ -530,17 +813,17 @@ fn extract_with_crop_recovery(jpeg_bytes: &[u8]) -> Result<[u8; 32]> {
        }
    }

-    // Try height-only crops
+    // Try 3: height-only crops, block-aligned steps
    for orig_h in (y.height..=max_orig_h).step_by(BLOCK_SIZE) {
        if let Ok(secret) = try_extract_with_layout(&y, y.width, orig_h, 0, 0) {
            return Ok(secret);
        }
    }

-    // Try width crops with finer step (non-8-aligned crops)
+    // Try 4: width crops with finer step (non-8-aligned crops are rarer but possible)
    for orig_w in (y.width..=max_orig_w).step_by(1) {
        if orig_w % BLOCK_SIZE == 0 {
-            continue; // already tried
+            continue; // already tried in step 2
        }
        if let Ok(secret) = try_extract_with_layout(&y, orig_w, y.height, 0, 0) {
            return Ok(secret);
--- a/crates/idfoto-core/src/lib.rs
+++ b/crates/idfoto-core/src/lib.rs
@@ -1,3 +1,37 @@
+//! # idfoto-core
+//!
+//! Platform-agnostic core library for the idfoto password manager.
+//!
+//! This crate is intentionally **bytes-in/bytes-out** -- it performs no filesystem
+//! access, no network I/O, and no git operations. All inputs arrive as byte slices
+//! or typed structs, and all outputs are returned as byte vectors or typed structs.
+//! This design makes the crate portable to WASM, Android (via JNI/UniFFI), and iOS
+//! without any conditional compilation or platform shims.
+//!
+//! ## Modules
+//!
+//! - [`error`] -- The unified error type ([`IdfotoError`]) used across the crate.
+//! - [`crypto`] -- Argon2id key derivation and XChaCha20-Poly1305 authenticated
+//!   encryption. This is the low-level "encrypt bytes / decrypt bytes" layer.
+//! - [`entry`] -- The vault data model: [`Entry`] (full credential),
+//!   [`ManifestEntry`] (searchable index metadata), and [`Manifest`] (the entry
+//!   index that lets you list/search without decrypting every entry).
+//! - [`vault`] -- Typed wrappers around [`crypto`] that serialize structs to JSON
+//!   before encrypting, and deserialize after decrypting.
+//! - [`imgsecret`] -- DCT-based steganography for embedding and extracting a
+//!   256-bit secret in a JPEG image. This is the novel component that provides the
+//!   second authentication factor.
+//!
+//! ## Crypto pipeline
+//!
+//! ```text
+//! passphrase (UTF-8 bytes) || image_secret (32 bytes from reference JPEG)
+//!   -> Argon2id(salt=vault_salt, m=64MiB, t=3, p=4)
+//!   -> master_key (32 bytes)
+//!   -> XChaCha20-Poly1305(nonce=random 24 bytes)
+//!   -> encrypted entry/manifest
+//! ```
+
 pub mod error;
 pub use error::{IdfotoError, Result};

--- a/crates/idfoto-core/src/vault.rs
+++ b/crates/idfoto-core/src/vault.rs
@@ -1,23 +1,72 @@
+//! Typed encryption/decryption wrappers for vault entries and manifests.
+//!
+//! This module bridges the gap between the raw bytes-in/bytes-out layer in
+//! [`crate::crypto`] and the typed data model in [`crate::entry`]. Each function
+//! follows the same pattern:
+//!
+//! - **Encrypt**: serialize the struct to JSON via serde, then encrypt the JSON
+//!   bytes with [`crate::crypto::encrypt`].
+//! - **Decrypt**: decrypt the ciphertext with [`crate::crypto::decrypt`], then
+//!   deserialize the resulting JSON bytes back into the typed struct.
+//!
+//! ## Why a single master key
+//!
+//! All entries and the manifest are encrypted under the same `master_key`. This is
+//! simpler than a per-entry subkey hierarchy and sufficient for family-scale vaults
+//! (typically < 1000 entries). The security properties are equivalent: an attacker
+//! who compromises the master key can decrypt everything regardless of whether
+//! subkeys exist, and the vault's threat model already assumes the master key is
+//! the single point of trust (protected by the two-factor KDF).
+
 use crate::crypto;
 use crate::entry::{Entry, Manifest};
 use crate::error::Result;

+/// Serialize an [`Entry`] to JSON and encrypt it under the master key.
+///
+/// The resulting bytes are written to `entries/<id>.enc` by the CLI.
+///
+/// # Errors
+///
+/// - [`crate::IdfotoError::Json`] if JSON serialization fails (should not happen
+///   with well-formed Entry structs).
+/// - [`crate::IdfotoError::Encrypt`] if the underlying AEAD operation fails.
 pub fn encrypt_entry(master_key: &[u8; 32], entry: &Entry) -> Result<Vec<u8>> {
    let json = serde_json::to_vec(entry)?;
    crypto::encrypt(master_key, &json)
 }

+/// Decrypt an entry blob and deserialize it back into an [`Entry`].
+///
+/// # Errors
+///
+/// - [`crate::IdfotoError::Decrypt`] if the master key is wrong or the data is
+///   tampered.
+/// - [`crate::IdfotoError::Format`] if the ciphertext blob has an invalid header.
+/// - [`crate::IdfotoError::Json`] if the decrypted JSON is malformed.
 pub fn decrypt_entry(master_key: &[u8; 32], data: &[u8]) -> Result<Entry> {
    let json = crypto::decrypt(master_key, data)?;
    let entry: Entry = serde_json::from_slice(&json)?;
    Ok(entry)
 }

+/// Serialize a [`Manifest`] to JSON and encrypt it under the master key.
+///
+/// The resulting bytes are written to `manifest.enc` by the CLI.
+///
+/// # Errors
+///
+/// Same as [`encrypt_entry`].
 pub fn encrypt_manifest(master_key: &[u8; 32], manifest: &Manifest) -> Result<Vec<u8>> {
    let json = serde_json::to_vec(manifest)?;
    crypto::encrypt(master_key, &json)
 }

+/// Decrypt a manifest blob and deserialize it back into a [`Manifest`].
+///
+/// # Errors
+///
+/// Same as [`decrypt_entry`].
 pub fn decrypt_manifest(master_key: &[u8; 32], data: &[u8]) -> Result<Manifest> {
    let json = crypto::decrypt(master_key, data)?;
    let manifest: Manifest = serde_json::from_slice(&json)?;