diff --git a/docs/dev/adrs/accepted/crysview-structure-visualization.md b/docs/dev/adrs/accepted/crysview-structure-visualization.md
index c6dd4c154..b5fc2281a 100644
--- a/docs/dev/adrs/accepted/crysview-structure-visualization.md
+++ b/docs/dev/adrs/accepted/crysview-structure-visualization.md
@@ -22,8 +22,8 @@ parameters a refinement is adjusting.
 
 A working prototype establishes the target experience and the data it
 needs. It lives at
-[`crysview-threejs-demo.html`](crysview-threejs-demo.html) and
-demonstrates, against a non-orthogonal unit cell:
+[`crysview-threejs-demo.html`](crysview-structure-visualization/crysview-threejs-demo.html)
+and demonstrates, against a non-orthogonal unit cell:
 
 - atoms as spheres with element radius and colour;
 - anisotropic ADP ellipsoids (semi-axis lengths plus orientation);
diff --git a/docs/dev/adrs/accepted/crysview-threejs-demo.html b/docs/dev/adrs/accepted/crysview-structure-visualization/crysview-threejs-demo.html
similarity index 100%
rename from docs/dev/adrs/accepted/crysview-threejs-demo.html
rename to docs/dev/adrs/accepted/crysview-structure-visualization/crysview-threejs-demo.html
diff --git a/docs/dev/adrs/index.md b/docs/dev/adrs/index.md
index 9a04a6a6c..fe759d3ee 100644
--- a/docs/dev/adrs/index.md
+++ b/docs/dev/adrs/index.md
@@ -13,43 +13,46 @@ folders.
 
 ## ADR Index
 
-| Group                | Status     | Title                                     | Short description                                                                                                     | Link                                                                                        |
-| -------------------- | ---------- | ----------------------------------------- | --------------------------------------------------------------------------------------------------------------------- | ------------------------------------------------------------------------------------------- |
-| Analysis and fitting | Accepted   | Fit Mode Categories and Fit Execution API | Splits fitting configuration from execution and defines active sibling fit-mode categories.                           | [`fit-mode-categories.md`](accepted/fit-mode-categories.md)                                 |
-| Analysis and fitting | Accepted   | Runtime Fit Results                       | Keeps full fit outputs runtime-only in the current design unless a narrower persistence ADR is accepted.              | [`runtime-fit-results.md`](accepted/runtime-fit-results.md)                                 |
-| Analysis and fitting | Accepted   | Analysis CIF Fit State                    | Defines the persisted fit-state projection in `analysis/analysis.cif` and `analysis/results.h5`.                      | [`analysis-cif-fit-state.md`](accepted/analysis-cif-fit-state.md)                           |
-| Analysis and fitting | Accepted   | Parameter Correlation Persistence         | Persists deterministic and posterior correlation summaries in `_fit_parameter_correlation`                            | [`parameter-correlation-persistence.md`](accepted/parameter-correlation-persistence.md)     |
-| Analysis and fitting | Suggestion | Fit Output Files and Data Exports         | Narrows remaining archive/export questions after adopting `results.csv` and `results.h5`.                             | [`fit-output-files-and-data-exports.md`](suggestions/fit-output-files-and-data-exports.md)  |
-| Analysis and fitting | Accepted   | Minimizer Category Consolidation          | Collapses the seven Bayesian categories into one owner-level switchable `minimizer` category with HDF5 sidecar.       | [`minimizer-category-consolidation.md`](accepted/minimizer-category-consolidation.md)       |
-| Analysis and fitting | Accepted   | Minimizer Input/Output Split              | Keeps `analysis.minimizer` input-only and moves scalar fit outputs to paired `analysis.fit_result` classes.           | [`minimizer-input-output-split.md`](accepted/minimizer-input-output-split.md)               |
-| Analysis and fitting | Superseded | Parameter-Level Posterior Projection      | Superseded by minimizer-category consolidation; kept as historical context for `parameter.posterior`.                 | [`parameter-posterior-summary.md`](suggestions/parameter-posterior-summary.md)              |
-| Analysis and fitting | Accepted   | Undo Fit                                  | Builds rollback semantics and CLI behavior on already-persisted pre-fit scalar snapshots.                             | [`undo-fit.md`](accepted/undo-fit.md)                                                       |
-| Core model           | Accepted   | Category Owners and Real Datablocks       | Introduces `CategoryOwner` so singleton sections do not pretend to be real CIF datablocks.                            | [`category-owner-sections.md`](accepted/category-owner-sections.md)                         |
-| Core model           | Accepted   | Enum-Backed Closed Value Sets             | Requires finite option sets to use `(str, Enum)` classes for validation and dispatch.                                 | [`enum-backed-closed-values.md`](accepted/enum-backed-closed-values.md)                     |
-| Core model           | Accepted   | Guarded Public Properties                 | Uses property setters as the public writability contract for guarded objects.                                         | [`guarded-public-properties.md`](accepted/guarded-public-properties.md)                     |
-| Core model           | Accepted   | Two-Level Category Parameter Access       | Keeps parameter access to `datablock.category.parameter` or `datablock.collection[id].parameter`.                     | [`category-parameter-access.md`](accepted/category-parameter-access.md)                     |
-| Documentation        | Accepted   | Descriptor Property Docstring Template    | Makes descriptor metadata the source of truth for public property docstrings and annotations.                         | [`property-docstring-template.md`](accepted/property-docstring-template.md)                 |
-| Documentation        | Accepted   | Development Documentation Structure       | Defines the `docs/dev` layout for ADRs, issues, plans, package structure, and roadmap.                                | [`development-docs-structure.md`](accepted/development-docs-structure.md)                   |
-| Documentation        | Accepted   | Help Method Discoverability               | Requires primary public objects and facades to expose consistent `help()` output.                                     | [`help-discoverability.md`](accepted/help-discoverability.md)                               |
-| Documentation        | Accepted   | Notebook Generation Source of Truth       | Treats tutorial `.py` files as editable sources and notebooks as generated artifacts.                                 | [`notebook-generation.md`](accepted/notebook-generation.md)                                 |
-| Documentation        | Suggestion | Documentation CI and Build Verification   | Proposes strict MkDocs builds, API-derived docs, snippet smoke tests, link checks, and prose/spelling checks.         | [`documentation-ci-build.md`](suggestions/documentation-ci-build.md)                        |
-| Experiment model     | Accepted   | Immutable Experiment Type                 | Makes experiment type axes creation-time state rather than mutable runtime state.                                     | [`immutable-experiment-type.md`](accepted/immutable-experiment-type.md)                     |
-| Factories            | Accepted   | Factory Contracts and Metadata            | Standardizes factory construction, metadata, compatibility, and registration behavior.                                | [`factory-contracts.md`](accepted/factory-contracts.md)                                     |
-| Naming               | Accepted   | Factory Tag Naming                        | Defines canonical factory tag style and standard abbreviations.                                                       | [`factory-tag-naming.md`](accepted/factory-tag-naming.md)                                   |
-| Persistence          | Accepted   | Free-Flag CIF Encoding                    | Encodes fit free/fixed state through CIF uncertainty syntax instead of a separate free list.                          | [`free-flag-cif-encoding.md`](accepted/free-flag-cif-encoding.md)                           |
-| Persistence          | Accepted   | Loop Category Keys and Identity Naming    | Documents loop collection keys and naming rules aligned with CIF category keys.                                       | [`loop-category-key-identity.md`](accepted/loop-category-key-identity.md)                   |
-| Persistence          | Accepted   | Project Facade and Persistence Layout     | Documents the current `Project` facade and saved directory layout.                                                    | [`project-facade-and-persistence.md`](accepted/project-facade-and-persistence.md)           |
-| Persistence          | Accepted   | IUCr CIF Tag Alignment                    | Aligns default CIF tags with IUCr dictionaries and adds a clean IUCr-aligned report export.                           | [`iucr-cif-tag-alignment.md`](accepted/iucr-cif-tag-alignment.md)                           |
-| Persistence          | Accepted   | Python and CIF Category Correspondence    | Compares current Python paths and CIF tags, then records scoped one-to-one mapping for project-level categories.      | [`python-cif-category-correspondence.md`](accepted/python-cif-category-correspondence.md)   |
-| Quality              | Accepted   | Lint Complexity Thresholds                | Treats ruff PLR complexity limits as design guardrails that should not be bypassed.                                   | [`lint-complexity-thresholds.md`](accepted/lint-complexity-thresholds.md)                   |
-| Quality              | Accepted   | Test Strategy                             | Defines layered unit, functional, integration, script, and notebook testing.                                          | [`test-strategy.md`](accepted/test-strategy.md)                                             |
-| Structure model      | Accepted   | Type-Neutral ADP Parameters               | Keeps ADP parameter object identities stable across B/U and iso/ani switches.                                         | [`type-neutral-adp-parameters.md`](accepted/type-neutral-adp-parameters.md)                 |
-| User-facing API      | Accepted   | Crystal Structure 3D Visualization        | Adds a renderer-neutral scene model drawn by ASCII and interactive Three.js engines for viewing crystal structures.   | [`crysview-structure-visualization.md`](accepted/crysview-structure-visualization.md)       |
-| User-facing API      | Accepted   | Display UX Facade                         | Defines `project.display` and `project.rendering` responsibilities and display method names.                          | [`display-ux.md`](accepted/display-ux.md)                                                   |
-| User-facing API      | Accepted   | Fit Results Display Naming                | Short, IUCr/GUM-aligned column headers (`s.u.`, `value`, `95% CI`) with a footnote glossary on every fit table.       | [`fit-results-display-naming.md`](accepted/fit-results-display-naming.md)                   |
-| User-facing API      | Accepted   | Project Summary Rendering                 | Defines project report configuration plus terminal, HTML, TeX, PDF, and clean report-CIF metadata policy.             | [`project-summary-rendering.md`](accepted/project-summary-rendering.md)                     |
-| User-facing API      | Accepted   | Selector Families                         | Distinguishes backend selectors, switchable-category selectors, and active-sibling selectors.                         | [`selector-families.md`](accepted/selector-families.md)                                     |
-| User-facing API      | Accepted   | String Paths and Live Descriptors         | Separates persisted field selectors from references to live model parameters.                                         | [`string-paths-and-live-descriptors.md`](accepted/string-paths-and-live-descriptors.md)     |
-| User-facing API      | Accepted   | Switchable Category API                   | Places multi-type category selectors on the owner and omits public selectors for fixed or single-type categories.     | [`switchable-category-api.md`](accepted/switchable-category-api.md)                         |
-| User-facing API      | Accepted   | Switchable Category Owned Selectors       | Moves the writable `type` selector and `show_supported()` onto the category itself; collapses the CIF duplication.    | [`switchable-category-owned-selectors.md`](accepted/switchable-category-owned-selectors.md) |
-| User-facing API      | Accepted   | Value-Selector Discovery                  | Gives enumerated value fields a per-descriptor `show_supported()`, beside the three category-level selector families. | [`value-selector-discovery.md`](accepted/value-selector-discovery.md)                       |
+| Group                | Status     | Title                                        | Short description                                                                                                     | Link                                                                                        |
+| -------------------- | ---------- | -------------------------------------------- | --------------------------------------------------------------------------------------------------------------------- | ------------------------------------------------------------------------------------------- |
+| Analysis and fitting | Accepted   | Fit Mode Categories and Fit Execution API    | Splits fitting configuration from execution and defines active sibling fit-mode categories.                           | [`fit-mode-categories.md`](accepted/fit-mode-categories.md)                                 |
+| Analysis and fitting | Accepted   | Runtime Fit Results                          | Keeps full fit outputs runtime-only in the current design unless a narrower persistence ADR is accepted.              | [`runtime-fit-results.md`](accepted/runtime-fit-results.md)                                 |
+| Analysis and fitting | Accepted   | Analysis CIF Fit State                       | Defines the persisted fit-state projection in `analysis/analysis.cif` and `analysis/results.h5`.                      | [`analysis-cif-fit-state.md`](accepted/analysis-cif-fit-state.md)                           |
+| Analysis and fitting | Accepted   | Parameter Correlation Persistence            | Persists deterministic and posterior correlation summaries in `_fit_parameter_correlation`.                           | [`parameter-correlation-persistence.md`](accepted/parameter-correlation-persistence.md)     |
+| Analysis and fitting | Suggestion | Fit Output Files and Data Exports            | Narrows remaining archive/export questions after adopting `results.csv` and `results.h5`.                             | [`fit-output-files-and-data-exports.md`](suggestions/fit-output-files-and-data-exports.md)  |
+| Analysis and fitting | Accepted   | Minimizer Category Consolidation             | Collapses the seven Bayesian categories into one owner-level switchable `minimizer` category with HDF5 sidecar.       | [`minimizer-category-consolidation.md`](accepted/minimizer-category-consolidation.md)       |
+| Analysis and fitting | Accepted   | Minimizer Input/Output Split                 | Keeps `analysis.minimizer` input-only and moves scalar fit outputs to paired `analysis.fit_result` classes.           | [`minimizer-input-output-split.md`](accepted/minimizer-input-output-split.md)               |
+| Analysis and fitting | Superseded | Parameter-Level Posterior Projection         | Superseded by minimizer-category consolidation; kept as historical context for `parameter.posterior`.                 | [`parameter-posterior-summary.md`](suggestions/parameter-posterior-summary.md)              |
+| Analysis and fitting | Accepted   | Undo Fit                                     | Builds rollback semantics and CLI behavior on already-persisted pre-fit scalar snapshots.                             | [`undo-fit.md`](accepted/undo-fit.md)                                                       |
+| Core model           | Accepted   | Category Owners and Real Datablocks          | Introduces `CategoryOwner` so singleton sections do not pretend to be real CIF datablocks.                            | [`category-owner-sections.md`](accepted/category-owner-sections.md)                         |
+| Core model           | Accepted   | Enum-Backed Closed Value Sets                | Requires finite option sets to use `(str, Enum)` classes for validation and dispatch.                                 | [`enum-backed-closed-values.md`](accepted/enum-backed-closed-values.md)                     |
+| Core model           | Accepted   | Guarded Public Properties                    | Uses property setters as the public writability contract for guarded objects.                                         | [`guarded-public-properties.md`](accepted/guarded-public-properties.md)                     |
+| Core model           | Accepted   | Two-Level Category Parameter Access          | Keeps parameter access to `datablock.category.parameter` or `datablock.collection[id].parameter`.                     | [`category-parameter-access.md`](accepted/category-parameter-access.md)                     |
+| Documentation        | Accepted   | Descriptor Property Docstring Template       | Makes descriptor metadata the source of truth for public property docstrings and annotations.                         | [`property-docstring-template.md`](accepted/property-docstring-template.md)                 |
+| Documentation        | Accepted   | Development Documentation Structure          | Defines the `docs/dev` layout for ADRs, issues, plans, package structure, and roadmap.                                | [`development-docs-structure.md`](accepted/development-docs-structure.md)                   |
+| Documentation        | Accepted   | Help Method Discoverability                  | Requires primary public objects and facades to expose consistent `help()` output.                                     | [`help-discoverability.md`](accepted/help-discoverability.md)                               |
+| Documentation        | Accepted   | Notebook Generation Source of Truth          | Treats tutorial `.py` files as editable sources and notebooks as generated artifacts.                                 | [`notebook-generation.md`](accepted/notebook-generation.md)                                 |
+| Documentation        | Suggestion | Documentation CI and Build Verification      | Proposes strict MkDocs builds, API-derived docs, snippet smoke tests, link checks, and prose/spelling checks.         | [`documentation-ci-build.md`](suggestions/documentation-ci-build.md)                        |
+| Experiment model     | Accepted   | Immutable Experiment Type                    | Makes experiment type axes creation-time state rather than mutable runtime state.                                     | [`immutable-experiment-type.md`](accepted/immutable-experiment-type.md)                     |
+| Experiment model     | Suggestion | Automatic Line-Segment Background Estimation | Detects line-segment background control points from the measured pattern, peak-insensitive and editable.              | [`background-auto-estimate.md`](suggestions/background-auto-estimate.md)                    |
+| Factories            | Accepted   | Factory Contracts and Metadata               | Standardizes factory construction, metadata, compatibility, and registration behavior.                                | [`factory-contracts.md`](accepted/factory-contracts.md)                                     |
+| Naming               | Accepted   | Factory Tag Naming                           | Defines canonical factory tag style and standard abbreviations.                                                       | [`factory-tag-naming.md`](accepted/factory-tag-naming.md)                                   |
+| Persistence          | Accepted   | Free-Flag CIF Encoding                       | Encodes fit free/fixed state through CIF uncertainty syntax instead of a separate free list.                          | [`free-flag-cif-encoding.md`](accepted/free-flag-cif-encoding.md)                           |
+| Persistence          | Accepted   | Loop Category Keys and Identity Naming       | Documents loop collection keys and naming rules aligned with CIF category keys.                                       | [`loop-category-key-identity.md`](accepted/loop-category-key-identity.md)                   |
+| Persistence          | Accepted   | Project Facade and Persistence Layout        | Documents the current `Project` facade and saved directory layout.                                                    | [`project-facade-and-persistence.md`](accepted/project-facade-and-persistence.md)           |
+| Persistence          | Accepted   | IUCr CIF Tag Alignment                       | Aligns default CIF tags with IUCr dictionaries and adds a clean IUCr-aligned report export.                           | [`iucr-cif-tag-alignment.md`](accepted/iucr-cif-tag-alignment.md)                           |
+| Persistence          | Accepted   | Python and CIF Category Correspondence       | Compares current Python paths and CIF tags, then records scoped one-to-one mapping for project-level categories.      | [`python-cif-category-correspondence.md`](accepted/python-cif-category-correspondence.md)   |
+| Quality              | Accepted   | Lint Complexity Thresholds                   | Treats ruff PLR complexity limits as design guardrails that should not be bypassed.                                   | [`lint-complexity-thresholds.md`](accepted/lint-complexity-thresholds.md)                   |
+| Quality              | Accepted   | Test Strategy                                | Defines layered unit, functional, integration, script, and notebook testing.                                          | [`test-strategy.md`](accepted/test-strategy.md)                                             |
+| Structure model      | Accepted   | Type-Neutral ADP Parameters                  | Keeps ADP parameter object identities stable across B/U and iso/ani switches.                                         | [`type-neutral-adp-parameters.md`](accepted/type-neutral-adp-parameters.md)                 |
+| Structure model      | Suggestion | Automatic Wyckoff Position Detection         | Detects Wyckoff letter, multiplicity, and site symmetry from space group and coordinates; calculators consume them.   | [`wyckoff-letter-detection.md`](suggestions/wyckoff-letter-detection.md)                    |
+| Structure model      | Suggestion | Complete Space-Group Reference Database      | One-time build of a complete `space_groups.json.gz` (all 230 groups) from cctbx, verified against multiple sources.   | [`space-group-database.md`](suggestions/space-group-database.md)                            |
+| User-facing API      | Accepted   | Crystal Structure 3D Visualization           | Adds a renderer-neutral scene model drawn by ASCII and interactive Three.js engines for viewing crystal structures.   | [`crysview-structure-visualization.md`](accepted/crysview-structure-visualization.md)       |
+| User-facing API      | Accepted   | Display UX Facade                            | Defines `project.display` and `project.rendering` responsibilities and display method names.                          | [`display-ux.md`](accepted/display-ux.md)                                                   |
+| User-facing API      | Accepted   | Fit Results Display Naming                   | Short, IUCr/GUM-aligned column headers (`s.u.`, `value`, `95% CI`) with a footnote glossary on every fit table.       | [`fit-results-display-naming.md`](accepted/fit-results-display-naming.md)                   |
+| User-facing API      | Accepted   | Project Summary Rendering                    | Defines project report configuration plus terminal, HTML, TeX, PDF, and clean report-CIF metadata policy.             | [`project-summary-rendering.md`](accepted/project-summary-rendering.md)                     |
+| User-facing API      | Accepted   | Selector Families                            | Distinguishes backend selectors, switchable-category selectors, and active-sibling selectors.                         | [`selector-families.md`](accepted/selector-families.md)                                     |
+| User-facing API      | Accepted   | String Paths and Live Descriptors            | Separates persisted field selectors from references to live model parameters.                                         | [`string-paths-and-live-descriptors.md`](accepted/string-paths-and-live-descriptors.md)     |
+| User-facing API      | Accepted   | Switchable Category API                      | Places multi-type category selectors on the owner and omits public selectors for fixed or single-type categories.     | [`switchable-category-api.md`](accepted/switchable-category-api.md)                         |
+| User-facing API      | Accepted   | Switchable Category Owned Selectors          | Moves the writable `type` selector and `show_supported()` onto the category itself; collapses the CIF duplication.    | [`switchable-category-owned-selectors.md`](accepted/switchable-category-owned-selectors.md) |
+| User-facing API      | Accepted   | Value-Selector Discovery                     | Gives enumerated value fields a per-descriptor `show_supported()`, beside the three category-level selector families. | [`value-selector-discovery.md`](accepted/value-selector-discovery.md)                       |
diff --git a/docs/dev/adrs/suggestions/background-auto-estimate.md b/docs/dev/adrs/suggestions/background-auto-estimate.md
new file mode 100644
index 000000000..1baca4e89
--- /dev/null
+++ b/docs/dev/adrs/suggestions/background-auto-estimate.md
@@ -0,0 +1,532 @@
+# ADR: Automatic Line-Segment Background Estimation
+
+**Status:** Proposed **Date:** 2026-06-01
+
+## Group
+
+Experiment model.
+
+> This ADR follows [`AGENTS.md`](../../../../AGENTS.md). It adds one new
+> dependency, `pybaselines` (§4). The user approved it directly in the
+> drafting conversation, which is the explicit approval
+> [`AGENTS.md`](../../../../AGENTS.md) → **Architecture** requires. The
+> implementation plan must still **name `pybaselines` explicitly** in
+> its dependency-changing step (for example a
+> `P1.x — Add pybaselines dependency` line): `/draft-impl-1` and
+> `/draft-impl-2` are authorized to edit `pyproject.toml`, `pixi.toml`,
+> and `pixi.lock` only by the accepted plan text naming the package, not
+> by this drafting thread's approval alone. No other deliberate
+> exception to those instructions is taken.
+
+## Context
+
+A line-segment background is a set of `(x, intensity)` control points
+that are linearly interpolated across the pattern
+([`line_segment.py:147`](../../../../src/easydiffraction/datablocks/experiment/categories/background/line_segment.py)).
+Today the user must supply every point by hand —
+`experiment.background.create(id='1', x=12.0, y=85.0)` in Python, or a
+`_pd_background.*` loop in CIF. With no points, the model evaluates to
+zero
+([`line_segment.py:175`](../../../../src/easydiffraction/datablocks/experiment/categories/background/line_segment.py)).
+There is no automatic estimation anywhere in the library.
+
+Hand-placing points well is tedious and easy to get wrong, and the
+audience is scientists who are often not programmers. Two rules make it
+genuinely hard:
+
+1. **Points must flank peaks, not sit on them.** A point placed on a
+   peak shoulder pulls the interpolated background up _into_ the peak
+   and steals intensity from the very quantity being refined.
+2. **In strongly overlapped regions there is no true background point.**
+   The pattern never returns to baseline between dense reflections, so
+   the valley floor sits _above_ the real background. Naively picking
+   local minima there inflates the background and biases integrated
+   intensities low.
+
+A third complication is specific to constant-wavelength (CWL) data and
+to _when_ an automatic background is typically wanted. CWL peak width is
+**not constant** — FWHM grows with angle (the Caglioti
+`U·tan²θ + V·tanθ + W` trend) — so a single "peak width" is already an
+approximation across the pattern. Worse, an automatic background is
+usually reached for at the very **first** modelling step, when the
+peak-profile parameters (`U`, `V`, `W` on `self._parent.peak`) are only
+roughly set. Any width taken from that unrefined resolution model would
+be badly wrong exactly when the feature is first used.
+
+The resolution of that timing problem is to never derive the width from
+the _model_: the **measured pattern already contains the true peak
+widths**, and those are independent of how well the profile parameters
+are set. Measuring the width directly from `data.intensity_meas` is
+therefore reliable from step one. It also reframes the iterative
+workflow the user described — _estimate a background, refine the rest of
+the model, then re-estimate_ — correctly: re-running does **not**
+improve the measured peak widths (the data does not change). What it
+gains is the **fitted model**. After at least one calculation,
+`data.intensity_calc` (the total model) and `data.intensity_bkg` are
+populated
+([`bragg_pd.py:574`](../../../../src/easydiffraction/datablocks/experiment/categories/data/bragg_pd.py),
+[`bragg_pd.py:582`](../../../../src/easydiffraction/datablocks/experiment/categories/data/bragg_pd.py)),
+so the peak-only model `intensity_calc − intensity_bkg` becomes
+available. Subtracting it from the measured pattern removes the fitted
+peaks while keeping the background, giving a peak-subtracted pattern on
+which a second pass estimates the absolute background and places better
+anchors — especially across overlapped clusters the data alone cannot
+resolve. (§5 gives the exact array and shows why the emitted heights are
+absolute background values, not residual corrections.) So re-estimation
+is a first-class workflow, not just a convenience.
+
+This is a well-studied problem in powder diffraction. The classic
+peak-clipping methods (Sonneveld & Visser, 1975; Brückner, 2000) and the
+SNIP algorithm estimate a smooth background _underneath_ the peaks, even
+where the data never reaches it. The de-facto Python library is
+`pybaselines` (50+ algorithms; its `classification` family also returns
+a boolean mask of which points are baseline); notably, **GSAS-II's
+automatic fixed-point background (`autoBkgCalc`) is a thin wrapper
+around `pybaselines`** feeding exactly this fixed-point model.
+
+Everything an estimator needs is already reachable from the category.
+The existing `_update()` reads the live pattern through the parent
+([`line_segment.py:172`](../../../../src/easydiffraction/datablocks/experiment/categories/background/line_segment.py)):
+`self._parent.data` exposes `data.x`, `data.intensity_meas`,
+`data.intensity_calc`, and `data.intensity_bkg` as NumPy arrays over the
+**active** points — excluded regions are already filtered out
+([`bragg_pd.py:539`](../../../../src/easydiffraction/datablocks/experiment/categories/data/bragg_pd.py),
+[`bragg_pd.py:679`](../../../../src/easydiffraction/datablocks/experiment/categories/data/bragg_pd.py)).
+The parent also carries the experiment-type axes
+(`self._parent.type.beam_mode.value`).
+
+The produced points are first-class and need no new persistence: each
+point's `intensity` is a `Parameter` with a `free` flag
+([`variable.py:447`](../../../../src/easydiffraction/core/variable.py))
+persisted through the existing free/fixed CIF encoding
+([`free-flag-cif-encoding.md`](../accepted/free-flag-cif-encoding.md)),
+and the `_pd_background.*` loop already round-trips them. So an
+auto-estimator's only job is to compute good `(x, intensity)` values and
+write them into the collection; the user then reviews them and chooses,
+per point, fixed or refinable.
+
+`background` is a Family-A switchable category
+([`switchable-category-owned-selectors.md`](../accepted/switchable-category-owned-selectors.md));
+`LineSegmentBackground` is the default type
+([`factory.py`](../../../../src/easydiffraction/datablocks/experiment/categories/background/factory.py)).
+Point-based estimation is specific to the line-segment model
+(`ChebyshevPolynomialBackground` has coefficients, not points), so the
+new behaviour attaches to the concrete line-segment class, not to the
+shared switchable surface.
+
+## Decision
+
+### 1. A user-invoked `auto_estimate()`, never automatic
+
+Add a public method to `LineSegmentBackground`:
+
+```python
+def auto_estimate(
+    self,
+    *,
+    method: str = 'auto',
+    width: float | None = None,
+    smoothness: float | None = None,
+    n_points: int | None = None,
+    use_model: bool = True,
+) -> None:
+    """Detect background control points from the measured pattern."""
+```
+
+A bare `experiment.background.auto_estimate()` must work — no required
+arguments, no manual tuning (§3 makes that real). It reads
+`self._parent.data`, computes points, and writes them into the
+collection. It is the seed of the iterative loop in §5, not a one-shot.
+It returns `None` (it fills the collection, like other category
+mutators) and logs a one-line summary — chosen method, width, and point
+count — for the review step.
+
+It is **explicitly on-demand**, never run inside `_update()` or at
+calculation time. The library does not silently estimate or re-estimate
+its own background while fitting — that would contradict the project's
+"no runtime self-validation of generated output" stance and would
+surprise a user who has hand-tuned points.
+
+The method is discoverable via the category's `help()` per
+[`help-discoverability.md`](../accepted/help-discoverability.md).
+`method` is a keyword argument validated against a closed
+`BackgroundEstimatorMethodEnum` with exactly four Phase-1 members —
+`auto`, `snip`, `arpls`, `fabc` — per
+[`enum-backed-closed-values.md`](../accepted/enum-backed-closed-values.md).
+`auto` is the default and a stable alias for "let the library choose";
+in Phase 1 it resolves to the single default method, `arpls` (§3). The
+argument selects an algorithm for _this call only_ — it is not a
+persisted descriptor and appears in no CIF block; the generated points
+are the sole persisted output. The remaining overrides are continuous
+numbers or booleans. No `**kwargs` (per
+[`AGENTS.md`](../../../../AGENTS.md) → **Code Style**).
+
+### 2. Two-stage algorithm: estimate the curve, then place sparse anchors
+
+The hard problem (overlap) and the easy problem (anchor placement) are
+decoupled.
+
+**Stage 1 — a peak-insensitive background curve `B(x)`.** Estimate a
+smooth background over the whole grid using a method that reconstructs
+the curve _under_ the peaks (peak-clipping / penalised least squares),
+not the raw valley floor. This is what makes overlap regions correct:
+even where the data never returns to baseline, `B(x)` is extrapolated
+from the surrounding clipped trend.
+
+**Stage 2 — thin `B(x)` to a minimal set of line segments.** Reduce the
+dense curve to a sparse `(x, intensity)` set with
+Ramer–Douglas–Peucker-style polyline simplification: many anchors where
+the background curves, few on flat stretches, with the first and last
+grid points always kept so interpolation covers the full range.
+Optionally cap the count at `n_points`.
+
+Two invariants protect peak intensities:
+
+- **Anchor heights come from `B(x)`, never from the raw data.** This is
+  the single most important rule against intensity inflation: even when
+  an anchor lands in a shallow valley whose floor is above the true
+  background, its height is the de-peaked `B(x)` value.
+- **Each anchor's height is clipped to
+  `0 ≤ intensity ≤ intensity_meas`** — always against the original
+  measured intensities, in both the data-only and model-guided paths
+  (never against the peak-subtracted array). A background cannot exceed
+  the observation, and (for these probes) cannot be negative.
+
+**Overlap is handled by abstention, stated honestly.** Inside a dense
+multiplet there is no information to place a true background point from
+the data alone, so the estimator deliberately does **not** force one
+there — one segment spans the cluster, interpolating across it using the
+de-peaked `B(x)` at the cluster's flanks. (A model-guided re-run, §5,
+can do better because it knows where the peaks are.)
+
+### 3. Auto-parameterization: adapt to the dataset and the experiment type
+
+Every algorithm in Stage 1 keys off one length scale — the peak width in
+data points. A fixed default (e.g. a 50-point window) is right for one
+dataset and wrong for the next, because CWL 2θ steps, TOF time bins, lab
+vs synchrotron resolution, and neutron vs X-ray all differ.
+`auto_estimate()` therefore derives its parameters at call time:
+
+- **Peak width `W` (in points) is measured from the data, not the
+  model.** `scipy.signal.find_peaks` locates the most prominent peaks
+  and `scipy.signal.peak_widths` measures their widths. (This `W` is a
+  width in data points, not the Caglioti `W` coefficient.) Because CWL
+  FWHM grows with angle (§Context), `W` is taken as a robust **upper**
+  estimate (a high percentile of the measured widths), so the Stage-1
+  window/smoothness is large enough to clear the broadest peaks; mildly
+  over-smoothing the background under the sharp low-angle peaks is
+  harmless, since the background is smooth there anyway. The
+  peak/resolution model (`self._parent.peak`) is **not** used by default
+  — at the typical first-use moment its `U/V/W` are unrefined and would
+  mislead. A future opt-in could consult it once refined, but the
+  data-derived width is correct from step one and is the default.
+- **Noise σ** — a robust estimate from the median absolute deviation of
+  the second difference of the intensities (insensitive to peaks). Feeds
+  the classification threshold and the RDP tolerance (`c · σ`), so the
+  number of anchors follows the real background curvature rather than a
+  magic count.
+- **Window / smoothness / threshold** — derived from `W`, σ, and the
+  point count `N`, then handed to the backend (§4).
+- **Algorithm choice** — one method everywhere to start. A single robust
+  penalised-least-squares default (proposed `arpls`, whose one global
+  smoothness parameter handles both the CWL angular width spread and TOF
+  curvature) is used for every experiment, with all per-dataset
+  adaptation coming from the auto-derived width, noise, and tolerance
+  above; `method=` selects a specific algorithm explicitly. A
+  `beam_mode`- or `radiation_probe`-specific policy is **not**
+  introduced on speculation — the single default and the exact constants
+  are confirmed by benchmarking against the tutorial corpus (§Testing),
+  and a per-type policy is added only if that corpus shows one method is
+  not enough (§Deferred Work).
+
+The whole path is deterministic (no RNG), so reruns on the same inputs
+yield identical points. When width or peak detection degenerates (too
+few points, no detectable peaks), the estimator falls back to a
+conservative metadata-derived width and emits **one** clear
+`log.warning` telling the user to inspect and adjust — it does not
+silently emit a bad background.
+
+### 4. Backend: `pybaselines` (approved dependency) plus an in-house layer
+
+`pybaselines` is added as a project dependency (BSD-3; runtime deps
+NumPy and SciPy, both already required) and supplies **Stage 1**: the
+peak-insensitive curve `B(x)` (`snip`, `arpls`) and, for its
+classification methods (`fabc`, `fastchrom`, `dietrich`; only `fabc` is
+exposed in Phase 1, §1), a boolean baseline `mask`. The mask's
+`min_length` guard makes it a natural pool of candidate anchors that
+abstains in overlapped regions. This is the same library GSAS-II's
+`autoBkgCalc` delegates to.
+
+The in-house layer owns everything `pybaselines` cannot know about a
+diffraction pattern: the §3 auto-parameterization (data-derived width,
+noise, and resolving `method='auto'` to the single default), the Stage-2
+thinning and `[0, measured]` clipping, the model-guided re-estimation
+(§5), and the point lifecycle. `pybaselines`' library defaults are
+deliberately generic and would be wrong per-dataset, so the value is in
+feeding it the right parameters, not in calling it raw.
+
+### 5. Re-estimation is a first-class workflow
+
+The intended usage is a loop, and the API supports it directly:
+
+1. `auto_estimate()` early, from the measured data alone (no model yet)
+   — a fixed starting background.
+2. Refine the rest of the model (cell, scale, peak profile, …), with the
+   background fixed or, point-by-point, freed.
+3. `auto_estimate()` **again**. Now `data.intensity_calc` is populated,
+   so with `use_model=True` (default) the estimator forms the peak-only
+   model array `intensity_calc − intensity_bkg` and passes the Stage-1
+   helper the **peak-subtracted measured intensities**
+
+   `y = intensity_meas − (intensity_calc − intensity_bkg)`
+
+   — the measured pattern with the fitted peaks removed, **not** the fit
+   residual `intensity_meas − intensity_calc`. Because only the
+   peak-only model is subtracted (the current background stays in `y`),
+   the baseline `B(x)` estimated from `y` is the **absolute**
+   background, so the emitted control points are absolute
+   `_pd_background` heights and no add-back of `intensity_bkg` is
+   needed. The same peak-only model array also yields the model's peak
+   positions (the existing `find_peaks` pass, run on it rather than on
+   the raw data), which place anchors at better **x positions** — in
+   genuine inter-peak gaps, including across overlapped clusters the
+   data alone could not resolve. Everything comes only from the
+   backend-independent `data.intensity_meas` / `data.intensity_calc` /
+   `data.intensity_bkg` arrays, so the improvement is identical for
+   every calculator (Cryspy, CrysFML); it does **not** read
+   `experiment.refln` reflection metadata, which is calculator-specific
+   and may be absent or cleared. The data-only path — no calculation yet
+   (`intensity_calc` all zero), or `use_model=False` — passes
+   `y = intensity_meas` instead; both paths estimate an absolute
+   background and clip heights to the original measured intensities
+   (§2).
+
+**Every call overwrites and re-fixes.** `auto_estimate()` always clears
+the collection and rebuilds it — there is no append mode — and the
+rebuilt points are **fixed** (`free=False`) regardless of whether the
+previous points had been freed during refinement. A second call is
+therefore a fresh fixed seed, not a merge: calling it again overwrites
+the points and re-fixes them even if they were free. This keeps the loop
+predictable (each pass starts from a clean, fixed background) and
+idempotent (same inputs → same points). Clearing everything — including
+any hand-added points — is the deliberate "overwrite" contract;
+preserving manual points is deferred. When the collection is non-empty,
+the call logs a one-line notice that it is replacing the existing
+points, so a user who hand-tuned a background is not surprised; the
+first call, with nothing to replace, is silent.
+
+**Always fixed; no `free` argument.** Generated points are always
+created fixed (`point.y.free = False`) — there is no caller-selectable
+free option, so the "always re-fixes" contract above holds without
+exception. The user reviews the points and flips individual ones — or
+all — to refinable (`point.y.free = True`) afterward. This matches
+fixed-point background practice and the stated review-then-refine
+workflow.
+
+**Mechanics.** Points get sequential string ids (`'1', '2', …`)
+consistent with the existing `LineSegment.id` descriptor and its CIF
+tag. Excluded regions are honoured for free, since the `data.*` arrays
+cover active points only.
+
+### 6. Where the code lives
+
+A backend-agnostic estimator helper —
+`estimate_background_curve(x, y, *, beam_mode, peaks=None, width=None, ...) -> (curve, anchors)`
+— lives in a new small module in the background package (e.g.
+`datablocks/experiment/categories/background/estimate.py`). It is pure
+array-in/array-out (the optional `peaks` argument carries model peak
+positions detected from the peak-only model array per §5 — not
+reflection metadata), holds no model state, wraps `pybaselines` for
+Stage 1, and keeps the §3 parameterization and Stage-2 thinning in-house
+— so it stays unit-testable in isolation and pulls no domain logic into
+`core/`. `LineSegmentBackground.auto_estimate()` is a thin adapter: read
+the pattern (and model, if present), call the helper, clip, and
+`create()` the points. Helpers are extracted as needed to stay under the
+lint complexity thresholds
+([`lint-complexity-thresholds.md`](../accepted/lint-complexity-thresholds.md))
+rather than raising them.
+
+The same helper can later serve `ChebyshevPolynomialBackground` (fit its
+coefficients to `B(x)`), but that is **not** built now — see _Deferred
+Work_ — to avoid an abstraction before its second concrete use.
+
+## Open Questions
+
+The four design questions raised in review are resolved: noise-relative
+Stage-2 thinning (§3), always-overwrite with a replace notice (§5), a
+single Stage-1 method for now (§3), and a void method that logs a
+one-line summary (§1). What remains is empirical calibration, done
+against the tutorial corpus during implementation:
+
+- The exact Stage-2 tolerance multiplier (`c · σ`, proposed `c ≈ 2`) and
+  the width percentile (proposed ~75th) need tuning against real
+  datasets.
+- Whether the single Stage-1 method holds across the whole corpus
+  (CWL/TOF, neutron/X-ray) or a `beam_mode`/`radiation_probe` policy is
+  eventually needed (see §Deferred Work).
+
+## Consequences
+
+### Positive
+
+- One call, no arguments, gives scientists a sensible, reviewable
+  starting background — including in overlap regions, where heights come
+  from the de-peaked curve.
+- Robust across datasets _and_ experiment types because the length scale
+  is measured from the data per call (§3) rather than hardcoded — and
+  reliable at the first modelling step, when the resolution model is
+  not.
+- Supports the natural estimate → refine → re-estimate loop (§5): a
+  later pass uses the fitted model to improve anchor placement, and
+  re-running is safe, idempotent, and re-fixes the points.
+- Output is ordinary line-segment points: editable, individually
+  fixable/refinable, and already CIF-persisted — **no new CIF tags or
+  serialization work**.
+- Reuses the same backend (`pybaselines`) the GSAS-II fixed-point
+  background relies on.
+
+### Trade-offs
+
+- Adds one dependency, `pybaselines` (approved; BSD-3,
+  NumPy/SciPy-only).
+- Not infallible with zero user input: amorphous/diffuse humps and
+  pathological overlap can still bias the first (data-only) pass. The
+  honest contract is "a good starting estimate you then refine,"
+  surfaced by a warning when the estimate is unreliable — not a
+  guarantee of correctness.
+- Adds an estimator module and a new public method to maintain.
+
+### Compatibility Outcomes
+
+- Purely additive: the manual `create()` workflow, existing projects,
+  and the default background type are all unchanged. Nothing auto-runs.
+- A project saved after `auto_estimate()` is an ordinary line-segment
+  background; it reloads with no new fields.
+
+## Alternatives Considered
+
+- **Call `pybaselines` with its library defaults.** Rejected: its
+  generic defaults (a one-size `lam`, an untuned SNIP window) are wrong
+  per-dataset, so the §3 auto-parameterization layer is needed
+  regardless. `pybaselines` supplies the curve; the diffraction-aware
+  parameters come from us.
+- **Derive the peak width from the resolution model (`U/V/W`).**
+  Rejected as the default: the model is unrefined at the typical
+  first-use moment and would give a badly wrong width — the user's own
+  observation. The measured pattern carries the true widths and is
+  model-independent.
+- **Ship a built-in estimator and make `pybaselines` optional.**
+  Rejected now that the dependency is approved: a single hard backend
+  removes import-availability branching and two divergent code paths,
+  and gives the better algorithms (`arpls`, `fabc`, the classification
+  mask) unconditionally.
+- **Naive valley / local-minima picking on the raw data.** Rejected: it
+  inflates the background in overlapped regions — the exact problem in
+  §Context.
+- **Run estimation automatically at calculation time** (fill if empty).
+  Rejected: hides a modelling choice, fights hand-tuned points, and
+  re-validates generated output at runtime — all against project
+  principles.
+- **Merge or append, rather than overwrite, on re-run** (keep
+  freed/refined points; an earlier draft exposed a `replace=False`
+  append mode). Rejected: it makes the loop unpredictable and lets a
+  stale point survive a better estimate, and no real use case justified
+  the second mode. Every call overwrites and re-fixes — one predictable
+  behaviour.
+- **Generalise `auto_estimate()` onto `BackgroundBase` now** so
+  Chebyshev shares it. Deferred: the shared _estimator helper_ (§6)
+  already captures the reusable core; a base-level method awaits the
+  second implementation.
+
+## Testing
+
+Per [`test-strategy.md`](../accepted/test-strategy.md), unit-level tests
+(no calculation engine, no network, no sleeping) on the pure estimator
+helper:
+
+- **Synthetic patterns with a known analytic background** (flat, linear
+  slope, smooth curve, TOF-like decay) plus planted Gaussian peaks,
+  including a deliberately overlapped multiplet. Assert the recovered
+  points reproduce the true background within tolerance, that **no
+  anchor lands on a planted peak**, and that none exceeds the local
+  data.
+- **CWL angular broadening**: peaks whose FWHM grows with x. Assert the
+  upper-percentile width keeps the background from being pulled up under
+  the broad high-angle peaks.
+- **Model-guided re-run**: with a supplied peak-only model over an
+  overlapped cluster, assert better anchor placement (in true gaps) than
+  the data-only pass on the same pattern, **and** that the emitted
+  control-point heights are absolute background values matching the
+  synthetic pattern's known background — not residual corrections around
+  the input background.
+- **Re-estimation lifecycle**: a second `auto_estimate()` clears prior
+  points and produces **fixed** points even when the previous ones were
+  freed; ids stay sequential.
+- **Determinism**: identical inputs → identical points.
+- **Graceful degradation**: a peakless or near-empty pattern triggers
+  the single fallback warning rather than an exception or a garbage
+  background.
+
+**Tutorial corpus as real-world reference.** The ~25 tutorial scripts in
+`docs/docs/tutorials/*.py` already build real experiments with
+well-defined backgrounds across both beam modes and both probes — CWL
+(e.g. the sloping background in
+[`ed-17.py`](../../../../docs/docs/tutorials/ed-17.py) and
+[`ed-2.py`](../../../../docs/docs/tutorials/ed-2.py)) and TOF (e.g.
+[`ed-13.py`](../../../../docs/docs/tutorials/ed-13.py),
+[`ed-16.py`](../../../../docs/docs/tutorials/ed-16.py)). Their
+hand-placed line-segment points are ground truth: stripping them and
+re-running `auto_estimate()` should reproduce a comparable background
+curve within tolerance. This gives broad, real coverage across space
+groups, beam modes, and probes at almost no authoring cost, and is the
+reference set used to calibrate the default constants and confirm the
+single Stage-1 method. These corpus checks run at the functional /
+script level where the tutorial experiments are already loaded, not at
+unit level.
+
+The estimator module mirrors into
+`tests/unit/easydiffraction/datablocks/experiment/categories/background/`
+per the test-structure mirror rule.
+
+## Deferred Work
+
+- A spatially-varying / per-region Stage-1 window that follows the CWL
+  angular broadening exactly (the upper-percentile single window is the
+  adequate first cut).
+- Beam-mode- and radiation-probe-specific Stage-1 method/parameter
+  defaults, if benchmarking the single default against the tutorial
+  corpus (CWL/TOF, neutron/X-ray) shows one method is not enough.
+- `ChebyshevPolynomialBackground.auto_estimate()` fitting coefficients
+  to the same `B(x)`, promoting the method to `BackgroundBase` once a
+  second implementation exists.
+- An opt-in path that consults the peak/resolution model for the width
+  _once it is refined_, as a cross-check on the data-derived width.
+- Using `experiment.refln` calculated reflection positions (when a
+  calculator provides them) as an alternative or cross-check to the peak
+  positions detected from the peak-only model array — deferred to keep
+  the model-guided path backend-independent.
+- A plot/diagnostic preview of the chosen curve and points via the
+  display layer ([`display-ux.md`](../accepted/display-ux.md)).
+- Tagging auto-generated points so a re-run can preserve hand-added
+  ones.
+- Total-scattering backgrounds (`pdffit2`) are out of scope — the
+  line-segment model does not apply there.
+
+## Related ADRs
+
+- [`switchable-category-owned-selectors.md`](../accepted/switchable-category-owned-selectors.md)
+  — `background` is a Family-A switchable category; `auto_estimate()` is
+  a type-specific method on `LineSegmentBackground`, not part of the
+  selector surface.
+- [`free-flag-cif-encoding.md`](../accepted/free-flag-cif-encoding.md) —
+  generated points carry a fixed/fittable `free` flag persisted through
+  CIF uncertainty syntax; no new tags.
+- [`guarded-public-properties.md`](../accepted/guarded-public-properties.md)
+  — each point's `intensity` is an editable `Parameter`.
+- [`enum-backed-closed-values.md`](../accepted/enum-backed-closed-values.md)
+  — the `method` argument is an enum-backed closed value set.
+- [`help-discoverability.md`](../accepted/help-discoverability.md) —
+  `auto_estimate()` is surfaced in the category's `help()`.
+- [`lint-complexity-thresholds.md`](../accepted/lint-complexity-thresholds.md)
+  — the estimator stays within complexity guardrails via extracted
+  helpers.
+- [`test-strategy.md`](../accepted/test-strategy.md) — layered tests,
+  mirror rule, no engines at unit level.
diff --git a/docs/dev/adrs/suggestions/plotting-docs-performance.md b/docs/dev/adrs/suggestions/plotting-docs-performance.md
new file mode 100644
index 000000000..99d2cf528
--- /dev/null
+++ b/docs/dev/adrs/suggestions/plotting-docs-performance.md
@@ -0,0 +1,434 @@
+# ADR: Plotting & Docs Performance for Interactive Figures
+
+**Status:** Proposed **Date:** 2026-06-02
+
+## Group
+
+Documentation.
+
+> This ADR follows [`AGENTS.md`](../../../../AGENTS.md). It spans the
+> documentation build (MkDocs) and the display serialization contract,
+> so it also relates to the User-facing API ADRs
+> [`display-ux.md`](../accepted/display-ux.md) and
+> [`crysview-structure-visualization.md`](../accepted/crysview-structure-visualization.md).
+> No public Python API change is intended; the change is in how figure
+> HTML and its JavaScript runtime are delivered.
+
+## Context
+
+### Symptom
+
+Generated tutorial pages that contain many interactive figures (mostly
+Plotly, plus the occasional Three.js crystal-structure view) can take
+from several to a few dozen seconds before the page becomes responsive.
+The plots are valuable and should stay interactive; the goal is to keep
+interactivity while making the page usable immediately and letting plots
+appear progressively.
+
+### How figures reach a docs page today
+
+1. Tutorial sources are `docs/docs/tutorials/ed-*.py`; notebooks are
+   generated artifacts (per
+   [`notebook-generation.md`](../accepted/notebook-generation.md)) and
+   are committed with **outputs stripped** (`notebook-strip`).
+2. The docs CI
+   ([`.github/workflows/docs.yml`](../../../../.github/workflows/docs.yml))
+   runs `notebook-exec-ci` to **execute** every notebook, baking the
+   rendered cell outputs into the `.ipynb`; `mkdocs build`, with
+   `mkdocs-jupyter` configured `execute: false`, then simply embeds
+   those pre-rendered outputs into the HTML.
+3. Each Plotly figure is emitted by `PlotlyPlotter._show_figure`
+   ([`src/easydiffraction/display/plotters/plotly.py`](../../../../src/easydiffraction/display/plotters/plotly.py))
+   as a `text/html` output via
+   `serialize_html(fig, include_plotlyjs='cdn')` wrapped in
+   `IPython.display.HTML`. The resulting HTML, **per figure**, carries:
+   - a `<div>` plus an inline `<script>` calling `Plotly.newPlot(...)`
+     with the full trace JSON,
+   - a `<script src="https://cdn.plot.ly/plotly-*.min.js">` tag (from
+     `include_plotlyjs='cdn'`),
+   - roughly 15 KB of post-scripts (theme-sync + resize + legend toggle)
+     **duplicated in every figure**.
+4. `mkdocs.yml` additionally loads **RequireJS from a second CDN**
+   (`include_requirejs: true`, commented "Required for Plotly").
+5. Three.js structure views are produced by
+   `ThreeJsStructureRenderer.render`
+   ([`src/easydiffraction/display/structure/renderers/threejs.py`](../../../../src/easydiffraction/display/structure/renderers/threejs.py))
+   with `offline=True` by default, which **base64-inlines the entire
+   Three.js module set (~1.5 MB) into the HTML of every scene** and
+   injects a per-scene `<script type="importmap">`.
+
+### Why it is slow — two independent bottlenecks
+
+- **Network / cold start.** A plot-heavy page depends on up to three
+  external CDNs at view time: `cdn.plot.ly` (full Plotly bundle, ~3–4 MB
+  minified, ~1 MB gzipped), `cdnjs` (RequireJS), and `jsdelivr`
+  (Three.js, when not offline). For a scientific audience often behind
+  slow or filtered institutional networks, this alone produces the
+  multi-second-to-stall behavior. The Plotly bundle is fetched once and
+  cached, but the page still blocks on it.
+- **CPU / eager render.** Every `Plotly.newPlot` runs **synchronously as
+  the page parses**. Fifteen to twenty figures means fifteen to twenty
+  back-to-back layout+draw passes on the main thread before the page is
+  interactive, regardless of whether a figure is on screen.
+
+### Blast radius: one serializer, three delivery targets
+
+The same serialization paths feed three contexts with **conflicting**
+runtime needs, which is the crux of any robust fix:
+
+| Target                | Who                                                                                         | Runtime requirement                                                                                                                                                                                                          |
+| --------------------- | ------------------------------------------------------------------------------------------- | ---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| **Live notebook**     | `_show_figure` in Jupyter                                                                   | Runtime must be reachable from the running kernel/browser (today: Plotly via CDN; Three.js inlined).                                                                                                                         |
+| **MkDocs site**       | executed-notebook HTML embedded by `mkdocs-jupyter`                                         | Wants the runtime loaded **once per page** and figures rendered **lazily**.                                                                                                                                                  |
+| **Standalone report** | `report/html_renderer.py` → `PlotlyPlotter.serialize_html` / Three.js `render(offline=...)` | Delivery set by the existing `offline` flag — embedded/self-contained when `offline=True`, CDN when `offline=False` (default). Authoritative per [`project-summary-rendering.md`](../accepted/project-summary-rendering.md). |
+
+A useful precedent already lives in the report renderer
+([`src/easydiffraction/report/html_renderer.py`](../../../../src/easydiffraction/report/html_renderer.py)):
+it embeds Plotly in the **first** figure and then passes
+`include_plotlyjs=False` for the rest, so a multi-figure report ships
+the runtime once. Docs do not get this because each notebook cell is
+serialized independently with `'cdn'`. The robust direction is to
+**generalize that "load once, reference after" idea across a whole docs
+page**, and add lazy activation on top.
+
+### Long-term-support constraint: versioned docs outlive CDNs
+
+Docs are published with `mike` (versioned). A page built today that
+links a moving CDN URL can silently break years later when the CDN drops
+or changes that asset, leaving **old, frozen doc versions** unable to
+render their figures. Pinning and self-hosting the runtime **per doc
+version** makes each published version self-consistent and archival — a
+strong reason to prefer self-hosting over any CDN for the long term.
+
+### Known latent bug surfaced while investigating
+
+Each Three.js scene injects its own `<script type="importmap">`. A page
+with **two** structure views therefore emits two importmaps; multiple
+importmaps are not reliably supported across browsers, so a second
+structure view on one page can fail to load its modules. Hoisting a
+single page-level importmap on docs pages (Decision 6) also fixes this;
+standalone reports that render multiple scenes share the same latent bug
+and are noted in **Deferred work**.
+
+## Decision
+
+Adopt **Option B: a shared, self-hosted figure runtime with lazy,
+progressive activation**, driven by an explicit _embedding mode_ on the
+serialization path. The following sub-choices were selected in
+discussion on 2026-06-02 (see **Resolved decisions** below): a themed
+"Loading…" **skeleton** placeholder (not static-image-first);
+**committed canonical vendored snapshots** — only the Three.js
+docs-serving copy is generated at build, while Plotly's docs-only
+partial bundle is committed (Decision 1); and **Plotly and Three.js
+delivered together** in one change. Concretely:
+
+1. **Self-host pinned runtimes, no runtime CDN; committed canonical
+   snapshots with an explicit docs-sync contract.** Each vendored
+   runtime is a committed snapshot (as `src/.../vendor/threejs` is
+   today) with exactly one canonical home, and the way it reaches the
+   served site is named, not implicit:
+   - **Three.js** — canonical at
+     `src/.../display/structure/renderers/vendor/threejs` (the installed
+     wheel needs it for offline reports and notebooks). MkDocs can only
+     serve files under `docs/docs`, so the docs **serving** copy is
+     **generated at build, not committed** (git-ignored under
+     `docs/docs/assets/javascripts/vendor/`) by a new
+     `docs-sync-vendored-js` pixi task that copies the canonical bytes.
+     Wire that task as a `depends-on` of `docs-build` and `docs-serve`,
+     and run it before `mkdocs build` in `docs.yml`, so local serve,
+     local build, and CI stay in lockstep with one source of truth.
+   - **Plotly** — a partial `plotly-cartesian` bundle (covers `Scatter`,
+     `Heatmap`, bars, error bars, shapes, annotations, text; excludes
+     unused WebGL/3D/maps). This runtime is **docs-only** — offline
+     reports embed the full Plotly bundle from the installed `plotly`
+     package, so no wheel copy exists — so its canonical home is the
+     **committed** docs vendor dir
+     `docs/docs/assets/javascripts/vendor/plotly/`, which is also where
+     MkDocs serves it (no sync step needed).
+
+   So the committed-vs-generated split is decided: vendored snapshots
+   are committed at their canonical home; only the Three.js docs
+   _serving_ copy is generated by `docs-sync-vendored-js`. Drift between
+   a canonical snapshot and its pinned version is caught by
+   `bump_vendored_js.py --check` (Decision 5), not by comparing two
+   committed copies. Each runtime loads **once per page**: Plotly and
+   the shared figure loader via `extra_javascript`, Three.js via a
+   single page-level importmap. Drop the RequireJS CDN and
+   `include_requirejs` if verification confirms it is no longer needed.
+
+2. **Introduce a figure _embedding mode_** (a `(str, Enum)` per
+   [`enum-backed-closed-values.md`](../accepted/enum-backed-closed-values.md))
+   threaded through `serialize_html` and the Three.js `render`:
+   - `INLINE` — live Jupyter: render eagerly with the runtime reachable
+     as today. **Default.**
+   - `SHARED` — docs: emit a **placeholder** (reserved aspect ratio,
+     themed "Loading…" skeleton, no layout shift) plus the figure spec
+     as a `<script type="application/json">` payload and a
+     `data-ed-figure` hook; reference the page-shared runtime. **No**
+     per-figure runtime, **no** per-figure post-scripts.
+   - `STANDALONE` — reports: render eagerly into a self-contained
+     fragment. Runtime delivery is **not** decided here but by the
+     caller's existing `offline` flag (see Decision 4).
+
+   **Mode routing (the central decision).** Tutorial figures are
+   serialized during notebook _execution_ (`notebook-exec-ci`), before
+   MkDocs sees them, and `mkdocs-jupyter` runs `execute: false` — so the
+   already-baked cell HTML must itself carry `SHARED` output; no
+   `extra_javascript` or downstream step can retrofit it. The active
+   mode is therefore resolved **centrally** from an environment variable
+   (`EASYDIFFRACTION_FIGURE_EMBED_MODE`) by one helper alongside
+   `in_jupyter`/`in_pycharm` in `utils/environment.py`, validated to the
+   enum and defaulting to `INLINE`. The docs notebook-execution tasks
+   (`notebook-exec-ci`, and `notebook-exec` for local docs preview) set
+   it to `shared`; ordinary Jupyter sessions leave it unset and stay
+   `INLINE`. Reports never consult the variable — the report API passes
+   `STANDALONE` explicitly. Because `SHARED` output is an inert
+   placeholder plus JSON, notebook execution does **not** need the
+   runtime present; MkDocs serves the runtime at view time (Decision 1).
+
+3. **One shared `ed-figures.js`, loaded once per page**, owns what is
+   currently duplicated per figure: it discovers `data-ed-figure`
+   placeholders, lazily calls `Plotly.newPlot` (and boots Three.js
+   scenes) via `IntersectionObserver` when each scrolls near the
+   viewport, and centralizes theme-sync, resize, and legend-toggle
+   logic. Eager fallback when `IntersectionObserver` is absent or when
+   printing.
+
+4. **Reports keep their existing `offline` contract, authoritative and
+   unchanged.** Per
+   [`project-summary-rendering.md`](../accepted/project-summary-rendering.md),
+   `render_html_report(offline=...)` already decides runtime delivery:
+   `offline=True` embeds a self-contained runtime; `offline=False` (the
+   default) links the CDN, embedding Plotly in the first figure and
+   referencing it thereafter. The embedding mode does **not** touch this
+   — reports render `STANDALONE` (eager, self-contained _fragment_) and
+   still pick embed-vs-CDN solely via `offline`. The `SHARED`/lazy
+   shared-runtime mechanism is **docs-only** and never applies to
+   reports. "Self-contained" is thus the `offline=True` report case, not
+   a new blanket requirement on every report.
+
+5. **A version-bump script + pixi task for the vendored runtimes.** Add
+   `tools/bump_vendored_js.py`, mirroring the existing
+   `tools/update_docs_assets.py` (same `pooch`-based fetch — `pooch` is
+   already a dependency, so **no new dependency** is introduced). It
+   reads a **single pinned table** (Plotly + Three.js versions, source
+   URLs, and expected SHA-256 hashes), fetches each file from
+   jsDelivr/npm with `pooch`'s `known_hash` integrity check, writes each
+   into its canonical vendor home (Decision 1: `src/.../vendor/threejs`
+   for Three.js, the committed docs vendor dir for Plotly), and
+   **regenerates that home's `LICENSES.md`** in the existing format
+   (`vendor/threejs/LICENSES.md`: file→source-URL table, version line,
+   license). Wire it as a pixi task alongside `docs-update-assets` (e.g.
+   `vendor-update-js`). Bumping a runtime then becomes: edit the pinned
+   version + hash, run one task, commit the refreshed snapshot and
+   regenerated license. A `--check` mode (re-hash the vendored files
+   against the pinned table without writing) can guard against drift or
+   accidental edits in CI, complementing the `pyproject.toml` exclusion
+   of vendored paths from lint/format. The pinned table is the single
+   source of truth for the versions that the Three.js renderer
+   (`_CDN`/import map) and the Plotly bundle reference, so `src` and
+   docs cannot drift.
+
+6. **Inject the page-level Three.js importmap via the Material theme
+   override.** A page may hold several structure views, but a document
+   can carry only one reliable `<script type="importmap">`, and it must
+   precede any module script — so `extra_javascript` (which links plain
+   `.js` files) cannot deliver it. Decision: emit **one** static
+   importmap from the existing `docs/overrides/main.html` by adding an
+   `{% block extrahead %}` that renders it into `<head>`, with entries
+   resolved against `{{ base_url }}` so they stay correct under `mike`'s
+   versioned subpaths:
+
+   ```jinja
+   {% block extrahead %}
+     {{ super() }}
+     <script type="importmap">
+     {"imports": {
+       "three": "{{ base_url }}/assets/javascripts/vendor/threejs/three.module.js",
+       "three/addons/controls/OrbitControls.js": "{{ base_url }}/assets/javascripts/vendor/threejs/OrbitControls.js",
+       "three/addons/renderers/CSS2DRenderer.js": "{{ base_url }}/assets/javascripts/vendor/threejs/CSS2DRenderer.js"
+     }}
+     </script>
+   {% endblock %}
+   ```
+
+   In `SHARED` mode the Three.js renderer then emits **only** the module
+   bootstrap (bare `three` / `three/addons/...` specifiers) and **no**
+   per-scene importmap, so every scene on a page resolves against this
+   single head-level map. `STANDALONE` reports are unaffected — they
+   keep their self-contained inline importmap (a standalone file has no
+   theme override). Injecting the map on every page is harmless where no
+   scene consumes it (the tiny JSON is inert), keeping the override
+   simple.
+
+This pays the network bill once per page from the same origin, removes
+the per-figure JS duplication, and turns first paint from "render every
+figure" into "render nothing until seen" — addressing both bottlenecks
+while keeping every plot fully interactive.
+
+## Options considered
+
+### Option A — Tactical: lazy activation only
+
+Keep each figure's self-contained, CDN-loaded HTML exactly as today, but
+wrap the existing per-figure post-script so `Plotly.newPlot` fires from
+an `IntersectionObserver` behind a "Loading…" placeholder.
+
+- **Pros:** smallest change; isolated to the post-script; delivers the
+  "plots appear one by one" UX the request asked for.
+- **Cons:** does **not** fix the network bottleneck (still CDN, still
+  RequireJS, Three.js still inlined per scene, importmap bug remains);
+  keeps ~15 KB × N duplicated post-scripts; leaves the long-term CDN
+  fragility for versioned docs. Robustness: low.
+
+### Option B — Shared self-hosted runtime + lazy activation _(recommended)_
+
+As in **Decision** above: self-host pinned runtimes loaded once per
+page, an explicit embedding mode, and a shared lazy loader.
+
+- **Pros:** fixes **both** bottlenecks; firewall-proof and archival
+  (versioned docs stay self-consistent); de-duplicates and centralizes
+  figure JS (maintainability); fixes the importmap bug; generalizes the
+  pattern reports already use; leaves the report `offline` contract
+  unchanged.
+- **Cons:** the most work now — touches `serialize_html`, the Three.js
+  renderer, `mkdocs.yml`, a vendoring/build step, and a new shared JS
+  asset; requires careful handling of the three delivery targets and of
+  the live-notebook experience. Robustness: high. **Matches the stated
+  preference to accept more work now for long-term robustness.**
+
+### Option C — MkDocs post-processing plugin
+
+Leave the Python serialization mostly as-is and add a custom MkDocs
+plugin (or adopt `mkdocs-plotly-plugin`, already eyed in a `docs.yml`
+comment) that post-processes built pages to strip duplicate runtimes,
+inject one shared runtime, and add the lazy loader globally.
+
+- **Pros:** centralizes behavior in the build; minimal Python display
+  changes.
+- **Cons:** adds a bespoke build dependency to maintain against MkDocs
+  and Plotly upgrades; "spooky action" in a post-build pass that is
+  harder to test than deterministic serialization;
+  `mkdocs-plotly-plugin` targets `.plotly` JSON files in Markdown, not
+  executed-notebook outputs, so it is not a drop-in. Robustness: medium,
+  but with ongoing maintenance cost and weaker testability than B.
+
+### Comparison
+
+| Concern                                     | A — tactical | B — shared+lazy | C — plugin             |
+| ------------------------------------------- | ------------ | --------------- | ---------------------- |
+| Plots appear progressively                  | ✅           | ✅              | ✅                     |
+| Removes runtime-CDN dependency              | ❌           | ✅              | ✅                     |
+| Smaller runtime (partial bundle)            | ❌           | ✅              | possible               |
+| De-duplicates per-figure JS                 | ❌           | ✅              | ✅                     |
+| Fixes Three.js importmap bug                | ❌           | ✅              | maybe                  |
+| Archival / version-frozen docs              | ❌           | ✅              | ✅                     |
+| Reports keep `offline` contract (unchanged) | ✅           | ✅              | ✅                     |
+| Implementation cost now                     | low          | high            | medium                 |
+| Long-term maintenance cost                  | low          | low             | higher (custom plugin) |
+| Testable in unit tests                      | partial      | ✅              | weak                   |
+
+## Consequences
+
+### Positive
+
+- Page is responsive immediately; figures render on demand, one by one.
+- One same-origin runtime fetch per page, cached across the site;
+  partial bundle roughly halves the Plotly download.
+- Per-figure HTML shrinks substantially (no embedded runtime, no
+  duplicated post-scripts), so executed `.ipynb` artifacts and built
+  pages are smaller.
+- Versioned docs become self-consistent and archival; no runtime CDN.
+- Theme-sync / resize / legend logic lives in one auditable place.
+- The multiple-importmap Three.js bug is fixed.
+
+### Negative / cost
+
+- Larger change across display, report (verification only), docs build,
+  and a new vendored asset + build step.
+- Vendored runtimes must be kept current, but the bump script + pixi
+  task (Decision 5) reduce this to editing a pinned version + hash and
+  running one task; licenses regenerate and an optional `--check` mode
+  guards against drift.
+- The shared loader is now load-bearing for docs rendering; it needs its
+  own tests and a no-/failed-JS fallback story.
+
+### Neutral
+
+- No intended change to public Python API or to how authors write
+  tutorials; the figures look and behave the same, only faster.
+
+## Risks and mitigations
+
+- **Live-notebook rendering.** `SHARED` placeholders need the docs
+  loader, so they must never reach a live Jupyter session. Settled by
+  the env-var routing (Decision 2): only the docs notebook-execution
+  tasks request `SHARED`; an unset variable resolves to `INLINE`. Cover
+  the resolver with a unit test asserting both the default and the
+  docs-build override.
+- **Report `offline` contract.** Keep
+  [`project-summary-rendering.md`](../accepted/project-summary-rendering.md)
+  authoritative (Decision 4); the existing `offline=True` /
+  `offline=False` report tests must stay green and gain no `SHARED`
+  behavior.
+- **Partial bundle missing a trace type.** Audit every trace/type used
+  across tutorials and reports before pinning `plotly-cartesian`; fall
+  back to the full bundle if any `scattergl`/3D/map usage exists.
+- **`IntersectionObserver` / no-JS / print.** Provide eager fallback
+  when the observer is unavailable and when `matchMedia('print')`
+  matches, plus a `<noscript>` note.
+- **RequireJS coupling.** `include_requirejs: true` exists for Plotly
+  today; only drop it after confirming the self-hosted, `SHARED`-mode
+  output renders without it under `mkdocs-jupyter`.
+
+## Resolved decisions
+
+Settled in discussion on 2026-06-02:
+
+1. **Placeholder fidelity → skeleton.** Use a themed "Loading…" skeleton
+   with the figure's reserved aspect ratio (no layout shift). A
+   static-image-first variant (kaleido/SVG pre-render upgrading to
+   interactive) is **deferred**, not adopted now.
+2. **Vendoring → committed canonical snapshots; only Three.js synced.**
+   Three.js stays canonical in `src/.../vendor/threejs`; its docs
+   _serving_ copy is generated at build by `docs-sync-vendored-js`. The
+   Plotly partial bundle is docs-only and committed at its docs vendor
+   home (offline reports use the full Plotly bundle from the `plotly`
+   package, so it needs no wheel copy). One source of truth per runtime,
+   drift-guarded by `bump_vendored_js.py --check` (Decisions 1 and 5).
+3. **Scope/sequencing → both engines together.** Plotly and Three.js are
+   delivered in one ADR/plan/change rather than staged.
+
+## Remaining open questions
+
+1. **Activation trigger.** Lazy on scroll-near only, or also a
+   click-to-activate mode for the very heaviest figures? _Lean:
+   scroll-near now; click-to-activate deferred unless a page proves
+   pathological._
+2. **RequireJS.** Remove `include_requirejs` outright, or keep it for
+   safety during migration and drop it once the `SHARED`-mode,
+   self-hosted output is confirmed to render under `mkdocs-jupyter`?
+   _Lean: keep during migration, remove in the same change after
+   verification._
+
+## Deferred work
+
+- Static-image-first placeholders (kaleido) if skeletons prove
+  insufficient on the heaviest pages.
+- Trace downsampling for very dense series in the docs view (smaller
+  payload + faster draw) — a separate, data-side optimization.
+- A docs CI budget check (page weight / figure count) to catch
+  regressions, aligning with
+  [`documentation-ci-build.md`](documentation-ci-build.md).
+- Hoist a single importmap into the **report** template `<head>` for
+  standalone reports that render multiple Three.js scenes (the same
+  per-scene-importmap bug as docs, but governed by
+  [`project-summary-rendering.md`](../accepted/project-summary-rendering.md)).
+  Out of scope here since it touches the report contract; flagged so it
+  is not lost.
+
+## Alternatives considered
+
+See **Options A and C** above; both are rejected in favor of B for
+long-term robustness, though A is a viable fast first step if a staged
+rollout is preferred (it is a strict subset of B's lazy-activation
+work).
diff --git a/docs/dev/adrs/suggestions/space-group-database.md b/docs/dev/adrs/suggestions/space-group-database.md
new file mode 100644
index 000000000..cc1cf3566
--- /dev/null
+++ b/docs/dev/adrs/suggestions/space-group-database.md
@@ -0,0 +1,515 @@
+# ADR: Complete Space-Group Reference Database
+
+**Status:** Proposed **Date:** 2026-06-01
+
+## Group
+
+Structure model.
+
+> This ADR follows [`AGENTS.md`](../../../../AGENTS.md). It is a
+> prerequisite for
+> [`wyckoff-letter-detection.md`](wyckoff-letter-detection.md): Wyckoff
+> detection can only resolve letters for space groups present in the
+> bundled table, and that table is currently incomplete.
+
+## Context
+
+The packaged space-group reference data,
+`src/easydiffraction/crystallography/space_groups.py` →
+`space_groups.pkl.gz`, is the single source the crystallography
+submodule uses for symmetry constraints (cell, atom-site coordinate, and
+ADP) and that the proposed Wyckoff-detection feature will use for
+letters, multiplicities, and site symmetries. An audit of the current
+pickle found it substantially incomplete and irregular:
+
+- **613 entries covering only 188 of 230** International Tables groups.
+- **42 groups have no entries at all** — and they are mostly the
+  _simplest primitive_ ones: tetragonal P4, P4₁, P4₂, P4₃, P-4, I-4,
+  P4/m, P4₂/m, P4/n, P4₂/n; almost the entire primitive trigonal set P3
+  … P-3c1; the whole hexagonal P6 set P6 … P6₃/m; and cubic P23, P2₁3,
+  Pm-3, Pn-3, Pa-3.
+- **18 groups are missing settings** — monoclinic IT 3–15 carry only
+  cell-choice-1; five orthorhombic groups (48, 50, 59, 68, 70) miss the
+  `1a-cb` setting; cubic 228 misses origin choice 2.
+
+Having I4 but not P4, and dropping nearly all primitive
+trigonal/hexagonal groups, is not a principled subset — it points to a
+bug in whatever generated the original pickle. The provenance and
+generation of that file are unknown and unreproducible. As a result,
+both the existing symmetry-constraint code and the planned Wyckoff
+feature silently do nothing for very common groups.
+
+Several authoritative reference sources are already gathered under
+`tmp/space-groups/`:
+
+- `data/cryspy/wyckoff.dat` — **byte-identical to cryspy's** Wyckoff
+  table (verified); complete for all 230 groups (representatives,
+  multiplicities, site symmetries).
+- `data/avogadro/spacegroupdata.h` and `data/sginfo/sginfo.dat` —
+  independently gathered setting and multiplicity references.
+- `data/cctbx/bricks.cpp` and `data/cctbx/symbols.cpp` — cctbx/sgtbx
+  source snapshots kept for provenance; installed cctbx/sgtbx is used
+  for extraction.
+- `data/raspa/raspa-space-group-information.csv` — a settings table
+  extracted from the RASPA manual appendix (IT № → Hermann-Mauguin /
+  Hall → cell choice → centring → crystal system); no Wyckoff data.
+- `data/international-tables/International-Tables-for-crystallography.pdf`
+  (Vol A) and `data/international-tables/ITC-Vol.C.pdf` — authoritative
+  manual curation sources (PDF).
+- `data/iucr/cif_core.dic` — CIF Core dictionary.
+
+One-time source-extraction and generation helpers live under
+`tmp/space-groups/helper-tools/`. They are local, ignored curation
+tooling rather than branch deliverables; the durable record is the final
+generated database, the checked-in ADR companion curation overrides, and
+the provenance recorded in this ADR.
+
+`gemmi 0.7.5` is in the environment; `cctbx` is not part of the regular
+environment (only its source snippets are present) and is installed
+temporarily for the one-time generation run (§3).
+
+The goal: a **complete, self-owned** `space_groups.json.gz` covering all
+230 groups × all standard settings plus every coordinate-code alias the
+current `SpaceGroup` category can produce × full Wyckoff orbits, built
+**once** with its software provenance recorded (§Build provenance).
+
+## Decision
+
+### 1. Scope and schema
+
+Cover **all 230 IT groups × every standard setting and public
+coordinate-code alias × every Wyckoff position**, where each position
+stores its `multiplicity`, `site_symmetry`, and the full `coords_xyz`
+orbit.
+
+The schema **extends the existing one additively**: every current key is
+preserved so consumers (`crystallography.py`, the calculators, CIF code)
+keep working, and a few **symmetry-core** metadata keys are added
+alongside. Each space-group setting carries:
+
+- the existing keys — `IT_number`, `setting`,
+  `IT_coordinate_system_code`, `name_H-M_alt`, `crystal_system`, and
+  `Wyckoff_positions`
+  (`{letter: {multiplicity, site_symmetry, coords_xyz}}`);
+- added per-setting metadata — `hall_symbol`, the full general-position
+  `symop` list, `generators`, `point_group`, `laue_class`, and
+  `centring`.
+
+Per the maintainer's scope choice this is the **symmetry core only**;
+further fields cctbx exposes are listed in Deferred Work for the future.
+
+Coordinates and operators stay **strings** (e.g. `'(x,1/2,0)'`,
+`'-x,y,-z'`) to match the existing parser (`_parse_rotation_matrix`,
+`sympify`) in `crystallography.py` and to keep the file JSON-native
+(§2). Triclinic no-setting groups keep the `None` coordinate code, as
+today (see the `''`→`None` normalisation in
+[`wyckoff-letter-detection.md`](wyckoff-letter-detection.md) §2).
+
+**Query surface preserved.** On disk the JSON is a list of setting
+records, each carrying the canonical `IT_number` and
+`IT_coordinate_system_code` fields — there is no separate `coord_code`
+storage field; that name is only the runtime variable for the tuple key.
+On load the module reconstructs the same in-memory `SPACE_GROUPS` dict
+keyed by `(IT_number, IT_coordinate_system_code)`, so every current
+lookup keeps working unchanged. Because each record also carries
+`name_H-M_alt` and `hall_symbol`, the database can rebuild an
+**H-M-short-symbol → IT_number** index equivalent to cryspy's
+`get_it_number_by_name_hm_short` (1:1 — each of the 230 groups has a
+single short symbol), with the setting selected separately per IT number
+exactly as the `SpaceGroup` category does today. A fuller "H-M symbol
+_with_ setting → specific `(IT_number, IT_coordinate_system_code)`"
+lookup is a multimap (one symbol can map to several settings/origins)
+and is out of committed scope; actually dropping the cryspy dependency
+is left to Deferred Work. The point here is only that the new database
+is **at least as queryable as today**, by both IT number +
+coordinate-system code and by Hermann-Mauguin symbol. The generated
+database therefore includes 816 records: 530 cctbx-tabulated settings,
+226 cryspy reference-settings aliases, and 60 runtime coordinate-code
+aliases, so every coordinate code the `SpaceGroup` category can produce
+— i.e. every `get_it_coordinate_system_codes_by_it_number` value — is a
+valid `SPACE_GROUPS` key.
+
+### 2. JSON storage removes the unpickle workaround
+
+The database is stored as **gzip-compressed JSON**
+(`space_groups.json.gz`), not a pickle. `space_groups.py` today loads a
+pickle through a bespoke `_RestrictedUnpickler` that permits only
+built-in types — a security workaround for a file that holds nothing but
+dicts, lists, strings, ints, and `None`. Switching to JSON **deletes
+that workaround**: the loader decompresses and `json.load`s the stream,
+then rebuilds the `(IT_number, coord_code)`-keyed dict (§1). JSON cannot
+execute code, is human-readable, diffable, and language-agnostic; the
+only constraint on the generator is to emit JSON-native types, which the
+string-based schema already satisfies.
+
+### 3. Generation sources: cryspy first, cctbx for setting metadata
+
+Build the Wyckoff-facing part of the database from **cryspy
+`wyckoff.dat`** first. It is complete for all 230 IT groups, carries the
+letters and representative coordinate orbits, and stores the dotted
+International-Tables-style site-symmetry strings that
+`wyckoff-letter-detection.md` needs. This keeps the minimum
+implementation close to the source already used by the calculator while
+moving ownership of the data into EasyDiffraction.
+
+Use **cctbx/sgtbx** for the setting-level metadata that cryspy's Wyckoff
+table does not provide in the same form: full symmetry operators,
+generators, point group, Laue class, Hall symbol candidates, and
+operation/orbit-closure checks. cctbx is a **generation-only**
+dependency: it is installed into the pixi environment **only for the
+generation run** and removed afterwards — it is never added to the
+runtime dependencies and never imported at runtime, which loads only the
+bundled JSON. Building the database is a **one-time effort**, not a
+recurring pipeline: cctbx is installed once for that build, the exact
+software versions used are recorded in §Build Provenance, and the
+install is then removed. A pinned GitHub data download was the
+considered alternative; the temporary install was chosen for the
+authoritative API and the least parsing risk.
+
+### 4. One-time local generation helper
+
+Keep the one-time generator at
+`tmp/space-groups/helper-tools/generate_space_groups.py` and run it
+**once** to emit `space_groups.json.gz`. It is intentionally not kept in
+the branch after implementation, because it is local curation tooling
+rather than runtime or routine development tooling. The future rebuild
+path is preserved by keeping the helper in the ignored
+`tmp/space-groups/` workspace and by recording its SHA-256, input
+sources, command line, software versions, and ADR companion curation
+overrides in §Build Provenance. The generated JSON is the committed
+artifact; the ADR and overrides explain how it was produced.
+
+### 5. Multi-source verification
+
+The generator verifies its output against **every** gathered source, not
+just the primary one:
+
+- cryspy `wyckoff.dat` — letters, multiplicities, site symmetries, and
+  representative coordinate orbits;
+- gemmi (already a runtime dependency, 0.7.5) — `spacegroup_table()`
+  covers all 230 groups and 564 settings with Hall symbols and full
+  symmetry operations. gemmi has **no** Wyckoff API (no letters, site
+  symmetries, or special-position enumeration), so its independent
+  contribution is precise: it validates the **set of settings** and the
+  **symmetry operations** per setting, and — given a representative
+  coordinate taken from another source — it confirms that
+  representative's **orbit and multiplicity** by applying its operations
+  (an operation-closure check). It does **not** independently produce
+  the representative coordinates, letters, or site-symmetry symbols, so
+  the disagreement report labels a gemmi orbit/multiplicity check as
+  _dependent_ on the cctbx/cryspy representative, not as an independent
+  third source for that representative;
+- Avogadro `data/avogadro/spacegroupdata.h` and SgInfo
+  `data/sginfo/sginfo.dat` — settings and multiplicities;
+- cctbx `data/cctbx/symbols.cpp` / `data/cctbx/bricks.cpp` — source
+  provenance for Hall symbols and settings;
+- RASPA `data/raspa/raspa-space-group-information.csv` — setting /
+  cell-choice enumeration;
+- International Tables Vol A — authoritative spot-checks.
+
+Verification covers presence (all 230 groups, their standard settings,
+and the public cryspy coordinate-code alias surface), per-position
+values (letter, multiplicity, site symmetry), and orbit coordinates.
+
+### 6. Disagreement report and human-in-the-loop curation
+
+Where **two or more sources disagree** on any value — a multiplicity, a
+site-symmetry symbol, a coordinate, a letter, the presence of a setting
+— the generator emits a structured **disagreement report** entry
+containing:
+
+- the case (group / setting / Wyckoff letter / field);
+- each contributing source and its value;
+- an `IT` column for later International Tables comparison;
+- an `Override` column for the final selected value and rationale.
+
+The maintainer inspects the report and **selects** the authoritative
+value per case. Selections are recorded in a checked-in **YAML overrides
+file**,
+`docs/dev/adrs/suggestions/space-group-database/space_groups_overrides.yaml`
+while the ADR is proposed. If this ADR is accepted, move that companion
+file with the ADR to the accepted ADR area. YAML lets each selection
+carry an inline comment recording its rationale. The generator consumes
+it during the build, so every non-obvious choice is explicit and
+auditable rather than baked silently into the binary. The overrides are
+deliberately not embedded in this ADR or in the implementation plan:
+those Markdown files describe the process, while the YAML file is the
+stable machine-readable input to the generator with a focused diff for
+curated values. The disagreement report itself is a local curation
+artifact under `tmp/space-groups/extracted-comparison/`. The Markdown
+report is split into one table per field, and the comparison folder also
+contains a combined CSV plus one CSV per field so each class of
+disagreement can be checked independently. Cases where all sources agree
+need no entry.
+
+### 7. Current curation baseline and deferrals
+
+The extracted comparison data is sufficient for the **minimal database
+needed by `wyckoff-letter-detection.md`**. The Phase 1 build therefore
+uses this source priority:
+
+1. Use cryspy `data/cryspy/wyckoff.dat` as the initial authority for
+   Wyckoff-facing fields: letters, multiplicities, site-symmetry
+   symbols, and representative coordinate orbits. It is complete for all
+   230 IT groups and carries the International-Tables-style
+   site-symmetry strings that the detection feature needs.
+2. Use cctbx/sgtbx as the source for setting-level symmetry metadata
+   that cryspy does not provide in the same table, especially full
+   symmetry operators, generators, point group, Laue class, Hall symbol
+   candidates, and orbit-closure checks.
+3. Use RASPA, Avogadro, SgInfo, and gemmi as cross-checks for setting
+   presence, Hermann-Mauguin / Hall symbols, centring, multiplicities,
+   and operation closure. When cryspy lacks a field or a value is
+   disputed, the maintainer should prefer the source that agrees with
+   the largest independent cluster and record the choice in the ADR
+   companion overrides file.
+
+This is intentionally a **curated seed database**, not the final
+International Tables audit. The `IT` and `Override` columns in the
+comparison reports are left for future human verification. Future
+curation should check flagged rows against International Tables Vol A
+first, and may also consult the IUCr International Tables Symmetry
+Database (`https://symmdb.iucr.org/`), Bilbao Crystallographic Server,
+and ISODISTORT as independent online references for Wyckoff-position
+data. The IUCr Symmetry Database is especially relevant where subscriber
+access is available because its Wyckoff-position program exposes
+multiplicities, letters, site-symmetry symbols, and coordinate triplets.
+Those checks are deferred so the database can unblock Wyckoff detection
+now while keeping every non-obvious choice visible for later correction.
+
+The triclinic groups do not require a special-case database model. P1
+(IT 1) has one Wyckoff position, `a`, with multiplicity 1. P-1 (IT 2)
+has the expected inversion-centre special positions plus the general
+position. The only awkwardness is representation of "no
+coordinate-system code": EasyDiffraction's `SpaceGroup` category uses
+the empty string `''`, while the table key uses `None`. The database
+keeps `(1, None)` and `(2, None)`; callers normalise `''` to `None` at
+lookup boundaries, as specified in
+[`wyckoff-letter-detection.md`](wyckoff-letter-detection.md). This is
+the least surprising solution because it keeps "no setting" distinct
+from any real coordinate-code string without inventing a sentinel value.
+
+### 8. The database file is generated, not hand-edited
+
+`space_groups.json.gz` is never edited by hand. Any correction flows
+through the curation overrides and a regeneration run, keeping the file
+and the documented decisions in sync.
+
+## Consequences
+
+### Positive
+
+- Complete coverage of the **data**: every one of the 230 groups and
+  their standard settings is present, including the currently-broken P4
+  / P3 / P6 / Pm-3 and the monoclinic alternative settings. For settings
+  with a non-`None` coordinate code the existing `(IT_number, code)`
+  lookups find the new entries immediately, with no consumer change; the
+  two triclinic `None`-code groups additionally need the companion
+  consumer-side fix (see Compatibility).
+- Documented, auditable provenance: the local generator helper SHA-256,
+  curation overrides, local disagreement report, and recorded build
+  versions show exactly how the seed database was produced and which
+  value checks remain deferred.
+- The Wyckoff-detection "unsupported group" path shrinks from "common
+  groups" to genuinely-exotic settings, simplifying that feature.
+- The 42-group gap and the missing settings are locked out by permanent
+  regression tests (see Verification).
+
+### Trade-offs
+
+- A temporary, generation-only cctbx install is needed for the one-time
+  build (never a runtime dependency).
+- Human curation of the disagreement report is deferred, so the seed
+  remains cross-checked package data rather than a database fully
+  audited against International Tables until that work is done.
+- `space_groups.json.gz` is larger than today's partial pickle (gzipped
+  JSON is less compact than gzipped pickle), though still well under
+  ~1.5 MB.
+
+### Compatibility Outcomes
+
+- The in-memory `SPACE_GROUPS` dict is unchanged (same
+  `(IT_number, coord_code)` keys; existing value keys preserved, new
+  ones added), so `crystallography.py`, the calculators, and CIF code
+  need no changes — they see complete data and ignore the new keys.
+- Only the on-disk format changes (pickle → gzipped JSON); the
+  `_RestrictedUnpickler` and the pickle dependency are **removed**, a
+  net simplification.
+- Existing projects load identically. Previously-unsupported groups with
+  a real coordinate code (P4, P3, P6, Pm-3, the monoclinic alternative
+  settings, …) gain correct symmetry behaviour immediately — the
+  existing `(IT_number, code)` lookups simply find the now-present
+  entries. The two triclinic `None`-code groups remain skipped until the
+  companion consumer-side fix lands: `_get_wyckoff_exprs()` returns
+  early when `coord_code is None` and `_get_general_position_ops()`
+  indexes the raw key, so they need the `''`→`None` normalisation
+  defined in
+  [`wyckoff-letter-detection.md`](wyckoff-letter-detection.md) §2 (which
+  also updates these call sites). This ADR delivers the data; that ADR
+  delivers the `None`-code consumer handling.
+
+## Alternatives Considered
+
+- **cryspy as the sole source.** Fastest (already present, verified
+  complete, zero new deps), but it does not provide every setting-level
+  metadata field needed for the new database and its provenance is the
+  calculator the database is meant to outgrow. Accepted as the initial
+  authority for Wyckoff-facing fields, but not as the sole authority for
+  the whole database.
+- **Parse SgInfo / cctbx C sources directly.** Most "self-owned", but
+  the highest parsing and verification burden. Used as cross-checks
+  instead of the primary generator.
+- **Generate Wyckoff orbits at runtime from symmetry operators** (no
+  bundled table). Rejected: heavy runtime cost on a hot path, and it
+  discards the established, cache-friendly table design.
+- **Keep the partial table and degrade gracefully.** Rejected: it leaves
+  common groups (P4, P3, P6) silently without symmetry information.
+
+## Verification
+
+- A regression test asserts that **all 230 groups, their standard
+  settings, and every public cryspy coordinate-code alias are present**
+  in the loaded table (guarding against the current 42-group /
+  18-setting gap).
+- A query-surface test asserts that every coordinate-system code exposed
+  by `SpaceGroup` resolves as a `(IT_number, coord_code)` key and that
+  Hermann-Mauguin symbol resolution still reaches every group.
+- Spot-check tests compare representative groups against International
+  Tables: a primitive tetragonal (P4), a trigonal (P3), a hexagonal
+  (P6), a centrosymmetric cubic (Pm-3), a monoclinic with cell choices,
+  and an origin-choice group.
+- The disagreement report is itself a verification artifact, reviewed by
+  the maintainer before the database is accepted.
+- A packaging regression check builds the wheel and inspects it directly
+  (`tools/check_packaged_db.py`), confirming the renamed
+  `space_groups.json.gz` is shipped as package data, the obsolete
+  `.pkl.gz` is gone, and the archive covers all 230 groups — catching
+  missing package-data inclusion without coupling to the package's full
+  runtime dependency tree.
+- Per the document-review rule, this ADR was written without running
+  tests, linters, or build commands.
+
+## Build Provenance
+
+The database is built once, so the exact tooling and inputs used to
+produce the committed `space_groups.json.gz` are recorded here at
+generation time. This section **is** the named, durable provenance
+artifact that makes the one-time build auditable and reconstructable
+even after cctbx is removed from the environment.
+
+Generation run:
+
+```bash
+pixi exec --spec cctbx --spec gemmi --spec sympy --spec pyyaml \
+  python tmp/space-groups/helper-tools/generate_space_groups.py \
+  --output-json src/easydiffraction/crystallography/space_groups.json.gz \
+  --write-comparison-folder tmp/space-groups/extracted-comparison \
+  --print-summary
+```
+
+Build environment:
+
+- **cctbx** from conda-forge:
+  - `cctbx 2026.4 py314he55896b_1`
+  - `cctbx-base 2026.4 py314h4545a6d_1`
+- **Helper-only packages** from conda-forge:
+  `gemmi 0.7.5 py314h2fd7851_0`, `sympy 1.14.0 pyh2585a3b_106`,
+  `pyyaml 6.0.3 py314h6e9b3f0_1`.
+- **Python and platform:** Python 3.14.5, macOS-26.2 arm64
+  (`macOS-26.2-arm64-arm-64bit-Mach-O`).
+- **Runtime cross-check versions:** cryspy 0.11.0, gemmi 0.7.5.
+
+Generated and curation artifacts:
+
+- `src/easydiffraction/crystallography/space_groups.json.gz`:
+  `30f0051c669712ab34d991e60223c5e29264fc033b2ab03392cc01465ceba926`
+- `tmp/space-groups/helper-tools/generate_space_groups.py`:
+  `bf10dcfbcf9e60485037ddabc65425e61f746ad9649cd3ccc67376dd6aae241a`
+- `docs/dev/adrs/suggestions/space-group-database/space_groups_overrides.yaml`:
+  `7077eec25d0f3b852dd7096a24dc7ac438467f9cb594f91a65ce10cda0e0722a`
+- `tmp/space-groups/extracted-comparison/disagreements.md`:
+  `dda940fbf75862516411685c9b9bdf7170fa4a116f90eeeff93bd068b8acda4c`
+- `tmp/space-groups/extracted-comparison/all-fields.csv`:
+  `4c69060514c58730d905d204144364d5696af9781d5d6132966960131ccd6b3a`
+
+Gathered input snapshots:
+
+- cctbx `symbols.cpp`, GitHub `cctbx/cctbx_project` commit
+  `9031bd719b56bc55bc5a276f407a9a64cc08c2c3`:
+  `901e038d6c060a7630c4e05f85b5c2fb6940edd9c6a2421755c146e29298b81b`
+- cctbx `bricks.cpp`, GitHub `cctbx/cctbx_project` commit
+  `9031bd719b56bc55bc5a276f407a9a64cc08c2c3`:
+  `85cfee5c215dbbfb9520730186ddc1d73b2ba93d5c94b969dc8968da6c5f2534`
+- Avogadro `spacegroupdata.h`, GitHub `OpenChemistry/avogadrolibs`
+  commit `88ff1a7af4625824b258933715d8f112bc35453e`:
+  `c5688f343ae2f37ec2e37beea2534d47f192f354bbe382bf11203c8e7b22cac9`
+- cryspy `wyckoff.dat` snapshot:
+  `ce6a576068610fb9a0d80a77f1c8957c3d1138a0e8f8fa9c248c62786dd3fb38`
+- cryspy `function_2_space_group.py` snapshot:
+  `e3cf8fd594c053068ed6f68d805ee9d216cfefa392351a2456cb3b2632bc4462`
+- SgInfo `sginfo.dat` snapshot:
+  `54591fd507aeb8cd24f9cb7e552a4b85cd6c5fd8f905782b489639f4cce51205`
+- RASPA appendix extraction `raspa-space-group-information.csv`:
+  `61258cb176cb5851efb042d0ac144f6f3ee9f730fc92564d4550acdd52dabd17`
+- RASPA manual PDF `raspa.pdf`:
+  `c5dfc865276667f787f793b7b4eacddcde268d5c7a1fa203a00db612ad7f79cf`
+- International Tables Vol A PDF:
+  `6d619f4e71754dc257cffc1fd8e92e23145e2f8511fa97ed1b5522773da3666e`
+- International Tables Vol C PDF:
+  `f095728556c0ebb05ab55ca2bbccac76c544f04f71da3a121b0477ba66699a0d`
+- IUCr CIF Core dictionary snapshot:
+  `dd7460c1ed1666adecf2f77441556920a051f076c31a6b7274d33dfbe2b6d5ad`
+
+### P1.1 extraction observations
+
+The first cctbx extraction pass enumerates 530 cctbx-tabulated setting
+records covering all 230 IT groups, with no duplicate
+`(IT_number, IT_coordinate_system_code)` keys after normalisation. This
+is not identical to the wider cryspy-style coordinate-code surface used
+by EasyDiffraction today: cryspy exposes additional repeated
+axis/cell-choice aliases for some monoclinic, orthorhombic, and trigonal
+settings. The Phase 1 database adds 226 reference-settings alias records
+and a further 60 runtime coordinate-code aliases — the redundant
+cell-choice-2/3 codes for the five primitive monoclinic groups IT
+3/4/6/10/11, which cryspy's runtime
+`get_it_coordinate_system_codes_by_it_number` exposes and which copy
+cell choice 1 verbatim — producing 816 records total, so every
+coordinate code the `SpaceGroup` category can return resolves.
+Reference-settings alias records are generated from cctbx by parsing the
+cryspy Hermann-Mauguin alias where cctbx accepts it; otherwise they copy
+the closest same-IT cctbx setting and carry the cryspy alias name.
+Detailed value verification for those alias records remains part of the
+deferred International Tables audit.
+
+## Open Questions
+
+None outstanding. Build-time specifics — the exact software versions,
+the extracted setting counts, and the candidate additional-metadata
+fields — are recorded in §Build Provenance, §P1.1 extraction
+observations, and Deferred Work respectively.
+
+## Deferred Work
+
+- Full human verification against International Tables Vol A, with the
+  IUCr International Tables Symmetry Database
+  (`https://symmdb.iucr.org/`), Bilbao Crystallographic Server, and
+  ISODISTORT as additional independent references for flagged
+  Wyckoff-position rows. Record corrections in the ADR companion
+  overrides file and regenerate the database/report.
+- **Additional metadata cctbx exposes**, deliberately deferred from the
+  symmetry-core schema (§1): asymmetric-unit definition, reflection /
+  systematic-absence conditions, centring translation vectors,
+  per-Wyckoff special-position operators, and matrix-form generators.
+  Add when a concrete consumer needs them.
+- Dropping the remaining cryspy dependency for Hermann-Mauguin →
+  IT-number resolution, using the database's own `name_H-M_alt` /
+  `hall_symbol` index (§1).
+- Re-evaluating the coordinate encoding (strings versus parsed matrices)
+  if profiling shows the string parse is a bottleneck.
+
+## Related ADRs
+
+- [`wyckoff-letter-detection.md`](wyckoff-letter-detection.md) — the
+  dependent feature; its `''`→`None` coordinate-code normalisation and
+  its "unsupported group" handling both build on this database.
+- [`iucr-cif-tag-alignment.md`](../accepted/iucr-cif-tag-alignment.md) —
+  consumes space-group and Wyckoff data on export.
diff --git a/docs/dev/adrs/suggestions/space-group-database/space_groups_overrides.yaml b/docs/dev/adrs/suggestions/space-group-database/space_groups_overrides.yaml
new file mode 100644
index 000000000..339567c7a
--- /dev/null
+++ b/docs/dev/adrs/suggestions/space-group-database/space_groups_overrides.yaml
@@ -0,0 +1,11 @@
+# Space-group database curated overrides.
+#
+# Initial minimal seed decision, 2026-06-02:
+# Use the ADR source priority without manual row-level overrides for now:
+# cryspy wyckoff.dat for Wyckoff-facing values, cctbx/sgtbx for
+# setting-level metadata, and RASPA/Avogadro/SgInfo/gemmi as cross-checks.
+#
+# Flagged rows remain visible in tmp/space-groups/extracted-comparison/
+# for future verification against International Tables Vol A, Bilbao
+# Crystallographic Server, and ISODISTORT.
+[]
diff --git a/docs/dev/adrs/suggestions/wyckoff-letter-detection.md b/docs/dev/adrs/suggestions/wyckoff-letter-detection.md
new file mode 100644
index 000000000..f5f671d33
--- /dev/null
+++ b/docs/dev/adrs/suggestions/wyckoff-letter-detection.md
@@ -0,0 +1,502 @@
+# ADR: Automatic Wyckoff Position Detection
+
+**Status:** Proposed **Date:** 2026-06-01
+
+## Group
+
+Structure model.
+
+> This ADR follows [`AGENTS.md`](../../../../AGENTS.md). No deliberate
+> exception to those instructions is taken. The slug stays
+> `wyckoff-letter-detection` for continuity with the request, but the
+> decision covers the full Wyckoff _position_ (letter, multiplicity, and
+> site symmetry), since all three come from one database entry.
+
+## Context
+
+Every `AtomSite` carries a Wyckoff letter that records the symmetry of
+the site within the space group. Today the user must supply it by hand —
+in Python (`atom_sites.create(..., wyckoff_letter='a')`) or in CIF
+(`_atom_site.Wyckoff_symbol`). Several parts of the model already depend
+on that letter:
+
+- `AtomSites._apply_atomic_coordinates_symmetry_constraints()`
+  ([`default.py:555`](../../../../src/easydiffraction/datablocks/structure/categories/atom_sites/default.py))
+  reads `atom.wyckoff_letter.value`, looks up the Wyckoff position,
+  snaps coordinates onto their special values, and flags symmetry-fixed
+  axes so they cannot be refined. Atoms with no letter are silently
+  skipped.
+- `AtomSites._apply_adp_symmetry_constraints()` uses the letter (and the
+  site coordinates) to constrain the anisotropic ADP tensor.
+- The cryspy calculator overrides its own multiplicity from the letter
+  in `_update_atom_multiplicity()`
+  ([`cryspy.py:487`](../../../../src/easydiffraction/analysis/calculators/cryspy.py)),
+  because cryspy normalizes coordinates into `[0, 1)` while parsing CIF
+  and can misclassify a special position as general.
+- The IUCr writer emits `_atom_site.Wyckoff_symbol`
+  ([`iucr_writer.py:876`](../../../../src/easydiffraction/io/cif/iucr_writer.py)).
+
+Two gaps remain, both recorded as open issue **#51**
+([`open.md:999`](../../../../docs/dev/issues/open.md)):
+
+1. The set of letters a site may take is a hardcoded placeholder,
+   `['a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i']`, with a TODO to read
+   the real list from the current space group
+   ([`default.py:200`](../../../../src/easydiffraction/datablocks/structure/categories/atom_sites/default.py)).
+2. There is no decision on what happens when the user does not provide a
+   letter.
+
+The reference data needed to close both gaps is already bundled. The
+packaged `SPACE_GROUPS` table
+([`space_groups.py:98`](../../../../src/easydiffraction/crystallography/space_groups.py))
+is keyed by `(IT_number, IT_coordinate_system_code)` and, for each
+Wyckoff position, stores the **full orbit** of symmetry-equivalent
+coordinate templates plus `multiplicity` and `site_symmetry`. For
+example, Pm-3m (IT 221) letter `e` lists all six templates
+`(x,0,0), (-x,0,0), (0,x,0), (0,-x,0), (0,0,x), (0,0,-x)` with
+`multiplicity = 6` and `site_symmetry = '4m.m'`; letter `a` is the single
+`(0,0,0)` with `multiplicity = 1`.
+
+The crystallography submodule already parses these templates into
+rotation/translation pairs (`_parse_rotation_matrix()`,
+[`crystallography.py:350`](../../../../src/easydiffraction/crystallography/crystallography.py))
+and exposes `symmetry_operators()`. cryspy independently solves the same
+problem — it tests a coordinate against every Wyckoff orbit and, among
+the matches, picks the position with the **lowest multiplicity** (the
+most special site). That algorithm is the inspiration here, but the
+detection should live in EasyDiffraction so it does not depend on any
+single calculator backend.
+
+## Decision
+
+### 1. EasyDiffraction owns the Wyckoff position
+
+The library — not a calculator — is the single source of truth for an
+atom site's Wyckoff **letter**, **multiplicity**, and **site symmetry**.
+Calculators consume these model values and must not re-derive them.
+Deriving them model-side, from the un-normalized fractional coordinates,
+is also the _correct_ place: it avoids the `[0, 1)` normalization that
+forces the cryspy override to exist today.
+
+### 2. Detection lives in the crystallography submodule
+
+Add to
+[`crystallography.py`](../../../../src/easydiffraction/crystallography/crystallography.py):
+
+- `detect_wyckoff_position(name_hm, coord_code, fract_xyz, tol=...) -> WyckoffPosition | None`
+  — the orbit matcher. It resolves `(IT_number, coord_code)` (after the
+  key normalisation below); returns `None` only when that pair is
+  genuinely absent from `SPACE_GROUPS`, preserving today's "no letter,
+  skip constraints" behaviour. Otherwise it tests the coordinate for
+  membership in each Wyckoff orbit and returns the matched position.
+- `wyckoff_position_info(name_hm, coord_code, letter) -> WyckoffPosition | None`
+  — a plain table lookup that returns the same record for an
+  already-known letter (auto-detected or user-set), used to populate the
+  derived descriptors without re-running the matcher.
+
+Both return a small frozen
+`WyckoffPosition(letter, multiplicity, site_symmetry)` dataclass rather
+than bare tuples: the three values are always consumed together (to fill
+the letter, multiplicity, and site-symmetry descriptors), named fields
+read better at the call sites, and the record can later carry the
+equivalent-position orbit without a breaking positional change. This
+matches the project's frozen-dataclass metadata idiom (`TypeInfo`,
+`Compatibility`); the bare-tuple alternative is rejected as less
+readable and fragile to extension.
+
+**Orbit-membership test.** For a coordinate `p = (x, y, z)` and an orbit
+template parsed into rotation `R` and translation `b`, the point lies on
+that template when `R·v + b ≡ p (mod 1)` is solvable for some real `v`.
+The general position (templates with all of `x, y, z` free) always
+matches, so a space group present in the table always yields a letter.
+Among all matching positions the winner is chosen by **(multiplicity
+ascending, then residual ascending)**: the most special site first, and
+— in the rare case where two distinct positions of the _same_
+multiplicity both lie within `tol` — the one the coordinate is actually
+closest to. The matcher already computes that residual while testing
+membership, so the tie-break costs nothing extra. A genuine
+same-multiplicity tie within `tol` (which a small tolerance makes almost
+impossible, since distinct special positions are separated by fractions
+like 1/2) is reported with a `log.warning` naming both candidates.
+Refusing to guess (raising) was rejected because it would break the
+"always resolve a letter" guarantee for an essentially unreachable case,
+and an arbitrary table-order pick was rejected as less physical than
+nearest-position.
+
+**Numeric kernel.** Solve the modular linear system with NumPy
+least-squares and check the residual modulo 1 against `tol` (reduce
+`d = p − b` to its nearest unit cell, solve `R·v = d`, require the
+residual ≡ 0 mod 1 within `tol`). This is simple, fast, and naturally
+tolerance-based. cryspy's exact rational kernel
+(`Fraction.limit_denominator` + Gaussian elimination mod 1) is the
+fallback option if numeric edge cases appear — see _Alternatives_.
+
+**Key normalisation.** `SpaceGroup` represents a group with no
+coordinate-system code as the empty string `''` (its
+`_it_coordinate_system_code_allowed_values` returns `codes or ['']`),
+but the bundled table stores those groups under a `None` code — the
+triclinic groups are `(1, None)` (P1, Wyckoff `a`, multiplicity 1) and
+`(2, None)` (P-1), and there are no empty-string keys at all. Detection
+and allowed-letter discovery therefore normalise `''` to `None` before
+indexing `SPACE_GROUPS`, so P1 and P-1 resolve to their real Wyckoff
+positions instead of being mistaken for unsupported groups. A shared
+`_normalize_coord_code()` helper owns this mapping; the existing
+`_get_wyckoff_exprs()` and `_get_general_position_ops()` lookups
+([`crystallography.py`](../../../../src/easydiffraction/crystallography/crystallography.py))
+should adopt it too, since they currently miss the `None`-keyed groups.
+
+### 3. The letter is always set, and tracks the coordinates
+
+The `wyckoff_letter` descriptor holds a concrete value whenever the
+space group is supported — there is no persistent "auto vs explicit"
+mode and no marker bit. The one exception is a space group absent from
+`SPACE_GROUPS` (§8), which splits in two: auto-detection is a no-op
+there, so **without** an explicit letter the value stays empty, while an
+explicit Python/CIF letter is stored verbatim (but carries no
+multiplicity, site symmetry, or constraints — §6). §9 defines how each
+of those cases serialises. For a supported group the letter changes in
+three ways:
+
+- **Creation or load without a letter.** When `atom_sites.create()` is
+  called without `wyckoff_letter`, or a CIF row has no
+  `_atom_site.Wyckoff_symbol`, detection runs against the coordinates
+  and stores the result. The descriptor default is a transient
+  placeholder that detection replaces; it is never surfaced as a lasting
+  state.
+- **User edits the coordinates** (any public path — `atom.fract_x = …`
+  or the live-descriptor `atom.fract_x.value = …`). The letter is
+  re-detected from the new coordinates and stored again; if it differs
+  from the current one, a warning is logged (§5). This keeps the letter
+  honest as the structure is edited. The trigger is update-flow
+  change-tracking, not a single setter (§4), so every public coordinate
+  edit is covered.
+- **User edits the letter** (public letter setter). The chosen letter is
+  applied as-is and persists. Its site-symmetry constraints snap the
+  constrained axes onto the special position (§5); if the pre-set
+  coordinates lay beyond `tol` of that letter's orbit — they did not fit
+  — a warning is logged that the coordinates were adjusted, but the
+  change is still made. A user-set letter is not re-detected until the
+  user next edits the coordinates. (For a space group absent from the
+  table the letter is accepted unvalidated and carries no derived data
+  or constraints — §8.)
+
+Detection writes the resolved letter through a dedicated internal
+mutator, `_set_wyckoff_letter_detected()`, modelled on the existing
+non-validating writer `_set_value_from_minimizer`
+([`variable.py:171`](../../../../src/easydiffraction/core/variable.py))
+(there is no `set_value_directly` method). Assigning the empty value to
+the public setter is permitted and simply requests re-detection on the
+next update.
+
+### 4. Detection triggers
+
+Both triggers live in the atom-site update flow
+([`default.py:674`](../../../../src/easydiffraction/datablocks/structure/categories/atom_sites/default.py)),
+not on any individual setter. A single setter hook would be wrong: a
+coordinate is a live `Parameter`, so `atom.fract_x = 0.1` and
+`atom.fract_x.value = 0.1` are both public edits — and the latter is the
+common one — and neither may be missed. Both mark the owner dirty and
+run `_update()`, so the update flow is the single place that sees every
+edit.
+
+- **Fill-if-empty.** An empty letter on a site whose space group is
+  supported is detected and stored. Idempotent — a no-op once the letter
+  is non-empty — and it is what fills letters on `create()` and project
+  load.
+- **Re-detect on a coordinate change.** The flow records, per atom, the
+  coordinates a letter was last detected from. When the current
+  coordinates differ from that baseline it re-detects; if the letter
+  changes it stores the new one and warns (§5). The baseline is
+  refreshed to the current coordinates whenever the letter is set or
+  detected — on load, on a user letter-set, and after auto-detection
+  (including the constraint snap that follows in the same pass) — so
+  only a genuine _later_ coordinate change re-detects, and a freshly
+  loaded or user-set letter is not re-detected spuriously.
+
+Two write paths are deliberately excluded. The minimizer runs
+`_update()` with `called_by_minimizer=True`, which skips re-detection
+entirely, so a free Wyckoff parameter (such as `x` in `(x, 0, 0)`)
+varies throughout a fit while the letter stays fixed. The constraint
+pipeline's snap does not re-trigger detection because it writes within
+the same pass and its result becomes the new baseline. A user-set letter
+— even a deliberately less-special one — is therefore never silently
+overwritten by an internal recompute; only a real change in the stored
+coordinates re-detects.
+
+### 5. Lenient proximity matching, with transparent snapping
+
+The tolerance is a module-level constant in `crystallography.py`
+(`_WYCKOFF_DETECTION_TOL`, default `1e-3`), used as the default of the
+matcher's `tol` argument so tests can override it. `1e-3` (fractional)
+is lenient enough to recognise rounded inputs — a database CIF with
+`0.3333` for `1/3`, or `0.4999` for `1/2` — as the special position, yet
+tight enough not to mislabel a genuinely general site (distinct special
+positions are separated by fractions like 1/2). A user-facing or
+project-level tolerance setting is intentionally deferred (see Deferred
+Work) until users ask for it. Once a letter is assigned, the existing
+constraint step snaps the constrained axes onto their exact special
+values. Neither the letter nor the coordinates change silently in
+response to a user edit; two `log.warning` messages cover the cases (per
+the project's "safe defaults, clear errors" principle):
+
+- a user coordinate edit that changes the detected letter → _"coordinate
+  change moved the Wyckoff letter of <site> from X to Y"_;
+- a user letter change whose snap moves coordinates beyond `tol` →
+  _"coordinates of <site> did not fit letter L and were adjusted"_.
+
+Fill-if-empty detection on `create()` / load is the expected baseline
+and is not warned per atom.
+
+### 6. Multiplicity and site symmetry become read-only derived descriptors
+
+`AtomSite` gains read-only `multiplicity` and `site_symmetry`
+descriptors, populated from the `WyckoffPosition` record (via
+`wyckoff_position_info()`) for the resolved letter and re-derived
+alongside it. They are read-only (getter only, no setter) per the
+guarded-public-properties contract: the user influences them only
+through the coordinates and the (optional) explicit letter.
+
+When there is no `WyckoffPosition` record — an unsupported space group,
+or a transient empty letter before the first update — both descriptors
+take their empty form: `multiplicity` is `None` and `site_symmetry` is
+the empty string. They follow the letter's empty state in lockstep, both
+serialise to CIF `?` (§9), and the calculator skips a `None`
+multiplicity (§7).
+
+`site_symmetry` stores the International Tables site-symmetry symbol
+**verbatim** from the table, including its positional dots (for example
+`'4/mm.'`, `'.3m'`, `'..m'`). The dots are not noise: they encode which
+crystallographic directions the site's symmetry elements lie along, so
+stripping or "normalising" them would be lossy and is rejected. Verbatim
+is also the simplest form and the one crystallographers expect from
+International Tables.
+
+### 7. Calculators consume, never re-derive
+
+`_update_atom_multiplicity()` in the cryspy calculator is **replaced**:
+instead of looking multiplicity up from `SPACE_GROUPS`, it reads
+`atom_site.multiplicity.value`. This is behaviour-preserving — same
+table, same letter, same number — but removes the duplicated lookup and
+makes multiplicity uniform across backends. crysfml and pdffit2 do not
+compute multiplicity today (no other usages in `src/`), so nothing
+diverges. Removing the calculator's private derivation is an explicit,
+called-out replacement, not a silent change. When
+`atom_site.multiplicity.value` is `None` (no Wyckoff record — an
+unsupported group), the calculator leaves the backend's own inferred
+multiplicity in place rather than writing `None` into its array; this
+too is behaviour-preserving, since today's `_update_atom_multiplicity()`
+already returns early when the group is absent from `SPACE_GROUPS`.
+
+### 8. Allowed letters come from the current space group (closes #51)
+
+`_wyckoff_letter_allowed_values` stops returning the hardcoded list and
+instead returns the empty placeholder value plus the tabulated letters
+for the current space group,
+`list(SPACE_GROUPS[key]['Wyckoff_positions'])`, where `key` applies the
+§2 coordinate-code normalisation. When the space group is genuinely
+absent from the table its letters cannot be enumerated, so membership
+validation is not applied — the validator accepts whatever the user or a
+CIF supplies. Auto-detection is still a no-op there, but an explicit
+letter (a Python assignment or a CIF `Wyckoff_symbol`) is stored
+verbatim rather than rejected, because blocking a valid assignment or
+failing to load an otherwise-valid CIF is worse than keeping an
+unverifiable letter. Such a letter carries no `multiplicity` /
+`site_symmetry` (no record, §6) and drives no symmetry constraints, and
+a `log.warning` records that the group is untabulated so the letter
+could not be validated. Rejecting with a validation error was the
+considered alternative, declined as too brittle for boundary input that
+Python assignment and CIF loading routinely produce. The atom site
+reaches its space group through the parent chain
+`atom → atom_sites → structure → space_group`, the same access already
+used for ADP synchronisation
+([`default.py:252`](../../../../src/easydiffraction/datablocks/structure/categories/atom_sites/default.py)).
+This keeps Wyckoff letters a space-group-dependent, boundary-facing
+selector rather than a project-owned enum, consistent with
+[`value-selector-discovery.md`](../accepted/value-selector-discovery.md)
+and
+[`enum-backed-closed-values.md`](../accepted/enum-backed-closed-values.md).
+
+### 9. CIF behaviour
+
+Because the letter is concrete for every supported space group (§3), the
+project CIF treats it as an ordinary value — none of the earlier draft's
+column-omission or null-token juggling is needed. An unsupported group
+is the only special case, and it splits in two — a site with no
+explicit letter stays empty, while an explicit letter is written
+verbatim — both of which fall out naturally from the rules below.
+
+- **Write.** Emit `_atom_site.Wyckoff_symbol` for every atom, plus the
+  standard `_atom_site.site_symmetry_multiplicity` derived from the
+  model multiplicity (written as `?` when that multiplicity is `None`).
+  **Any** non-empty letter is written verbatim — whether detected for a
+  supported group or supplied explicitly for an unsupported one (§8);
+  only the latter carries a `None` multiplicity. A letter is empty, and
+  serialises as the CIF null `?`, only when it is neither detected nor
+  explicitly supplied — an unsupported group with no user letter, or a
+  transient not-yet-updated state. `?` is already the serializer's
+  output for an empty string
+  ([`serialize.py:62`](../../../../src/easydiffraction/io/cif/serialize.py))
+  and reads back as empty. The column is therefore always present and
+  well-defined for the columnar atom-site loops emitted through the
+  ADP-family path
+  ([`serialize.py:301`](../../../../src/easydiffraction/io/cif/serialize.py)),
+  whether or not every row has a resolved letter, and saving never fails
+  on an unsupported group.
+- **Read.** A present `_atom_site.Wyckoff_symbol` is loaded as the
+  letter; an absent column — or a CIF-null `?` / `.`, which loads as the
+  empty default
+  ([`serialize.py:1091`](../../../../src/easydiffraction/io/cif/serialize.py))
+  — leaves the letter empty, and fill-if-empty detection (§4) resolves
+  it from the coordinates. A round trip is therefore stable: a written
+  letter reloads verbatim, and an omitted one re-derives to the same
+  value (same coordinates + space group → same letter), or stays empty
+  when the space group is unsupported.
+- **IUCr report export.** The report writer
+  ([`iucr_writer.py:876`](../../../../src/easydiffraction/io/cif/iucr_writer.py))
+  already emits the resolved `Wyckoff_symbol` for every atom and now
+  also emits `_atom_site.site_symmetry_multiplicity`.
+- **Derived values on read.** Multiplicity and site symmetry are
+  recomputed from the letter, so any incoming
+  `_atom_site.site_symmetry_multiplicity` is ignored rather than trusted
+  — the library does not validate its own derived output at runtime.
+
+## Open Questions
+
+- The default tolerance value (`1e-3`) is a reasonable starting point
+  but may be tuned against real datasets during implementation and
+  testing.
+
+## Consequences
+
+### Positive
+
+- Users who omit the Wyckoff letter still get correct symmetry
+  constraints, multiplicities, and site symmetries.
+- Closes issue #51: the allowed-letter list becomes real and
+  space-group-aware.
+- Multiplicity becomes calculator-independent and is derived where the
+  coordinates are still un-normalized, which is the correct place.
+- No new dependency: detection reuses `SPACE_GROUPS`, NumPy, and the
+  existing rotation/translation parser.
+- CIF round-trips are stable: a written letter reloads verbatim, and an
+  omitted one is re-derived deterministically from the coordinates (§9).
+
+### Trade-offs
+
+- Lenient matching can move a coordinate by up to the tolerance. Such a
+  within-tolerance snap is not warned (§5 warns only when a snap exceeds
+  `tol`), so it is a behavioural change for atoms that previously had no
+  letter and were left untouched.
+- A user-set letter is **not** a permanent pin: editing the coordinates
+  re-detects the letter and may change it (with a warning). A user who
+  needs a letter held must avoid editing its coordinates, or re-set the
+  letter afterwards. This is the deliberate cost of keeping the letter
+  and coordinates consistent.
+- `AtomSite` gains two read-only derived descriptors (`multiplicity` and
+  `site_symmetry`).
+
+### Compatibility Outcomes
+
+- Projects that already specify every Wyckoff letter are unaffected:
+  explicit letters are respected and produce identical constraints.
+- A saved project reloads to the same letters: every letter is written
+  (whether the user supplied it or detection filled it), so all reload
+  verbatim — and an auto-filled one would re-derive to the same value
+  anyway.
+- cryspy fit results are unchanged: the multiplicity value is identical,
+  only its source moves from the calculator to the model.
+
+## Alternatives Considered
+
+- **cryspy exact rational kernel.** Use `Fraction.limit_denominator` and
+  Gaussian elimination mod 1 (cryspy's method). Exact and robust, but
+  heavier than needed when a tolerance is wanted anyway. Kept as the
+  fallback if the NumPy kernel shows numeric edge cases.
+- **Delegate detection to a calculator** (for example cryspy's
+  `calc_xyz_mult`). Rejected: it recouples a core model property to a
+  specific backend — the opposite of this ADR — and inherits cryspy's
+  `[0, 1)` normalization problem.
+- **Add spglib or gemmi for symmetry datasets.** Rejected: a new
+  dependency for data the bundled `SPACE_GROUPS` table already contains
+  as full orbits.
+- **Detect once, then freeze permanently.** Rejected: the letter would
+  go stale when the user edits coordinates. The adopted model instead
+  re-detects on a user coordinate edit (§4), so the letter follows the
+  structure.
+- **A persistent auto/provided marker** (an earlier draft of this ADR).
+  Rejected as unnecessary complexity: it required an empty-sentinel
+  state, a marker bit, and column-omission / null-token rules in the
+  project CIF. Always materialising the letter and re-detecting on a
+  user coordinate edit yields the same user-facing behaviour with no
+  marker and a plain, fully-populated CIF column.
+- **Keep the letter purely derived and never stored.** Rejected: the
+  calculator and the Python↔CIF correspondence read `.value`, and users
+  need to be able to override the letter; a never-stored value cannot be
+  overridden.
+
+## Testing
+
+Detection comes with a ready-made regression corpus: the ~20 tutorial
+scripts in `docs/docs/tutorials/*.py`. Most build structures with
+explicit Wyckoff letters and a few load structures from CIF, so in every
+case the declared letter is ground truth. Stripping a site's explicit
+letter and re-detecting from its coordinates and space group must
+reproduce that declared letter — a single assertion that yields broad,
+real-world coverage across many space groups, settings, and site types
+at almost no authoring cost, and guards against regressions whenever the
+tutorials change.
+
+Targeted tests in `tests/unit/easydiffraction/crystallography/`
+(mirroring the source per the
+[test-strategy ADR](../accepted/test-strategy.md)) cover what the corpus
+may miss:
+
+- general vs special positions, and the lowest-multiplicity / nearest
+  tie-break (§2);
+- lenient matching of rounded inputs (`0.3333 → 1/3`, `0.4999 → 1/2`) at
+  the `1e-3` tolerance (§5);
+- the `''`→`None` coordinate-code normalisation — P1/P-1 under their
+  `None` keys, and a genuinely-absent group resolving to the empty
+  letter (§2, §8);
+- the §3–§4 behaviours: fill-if-empty on `create()` / load; re-detect on
+  a user coordinate edit via _both_ `atom.fract_x = …` and
+  `atom.fract_x.value = …`, with the change warning; the user letter
+  override with the snap warning; and the minimizer leaving the letter
+  fixed;
+- the no-record contract (§6–§7, §9): empty `multiplicity` /
+  `site_symmetry`, `?` in CIF, and the calculator skip;
+- CIF round-trip stability — a written letter reloads verbatim, an
+  omitted one re-derives to the same value, and an unsupported-group row
+  stays empty.
+
+The edge-case tests are unit-level (no calculation engine, no network,
+no sleeping) per the test-strategy ADR; the tutorial-corpus checks fit
+at the functional / script level where the tutorial structures are
+already built.
+
+## Deferred Work
+
+- Exposing the full equivalent-position orbit for an atom (the
+  visualization path already derives general-position operators via
+  `symmetry_operators()`).
+- Suggesting or validating the space group from the complete set of atom
+  positions (the reverse problem).
+- A user-facing or project-level tolerance setting, if users ask to
+  control the `_WYCKOFF_DETECTION_TOL` module-constant default.
+- Using multiplicity in occupancy-normalization helpers.
+
+## Related ADRs
+
+- [`iucr-cif-tag-alignment.md`](../accepted/iucr-cif-tag-alignment.md) —
+  `_atom_site.Wyckoff_symbol` and
+  `_atom_site.site_symmetry_multiplicity` tags.
+- [`python-cif-category-correspondence.md`](../accepted/python-cif-category-correspondence.md)
+  — `wyckoff_letter` ↔ `_atom_site.Wyckoff_symbol`.
+- [`type-neutral-adp-parameters.md`](../accepted/type-neutral-adp-parameters.md)
+  — the ADP symmetry constraints that already consume site symmetry.
+- [`value-selector-discovery.md`](../accepted/value-selector-discovery.md)
+  and
+  [`enum-backed-closed-values.md`](../accepted/enum-backed-closed-values.md)
+  — why Wyckoff letters are a dynamic, space-group-dependent selector
+  rather than a project-owned enum.
+- [`guarded-public-properties.md`](../accepted/guarded-public-properties.md)
+  — read-only `multiplicity` and `site_symmetry` (getter only).
diff --git a/docs/dev/package-structure/full.md b/docs/dev/package-structure/full.md
index 1b3e42e91..202823ea6 100644
--- a/docs/dev/package-structure/full.md
+++ b/docs/dev/package-structure/full.md
@@ -263,7 +263,6 @@
 │   ├── 📄 __init__.py
 │   ├── 📄 crystallography.py
 │   └── 📄 space_groups.py
-│       └── 🏷️ class _RestrictedUnpickler
 ├── 📁 datablocks
 │   ├── 📁 experiment
 │   │   ├── 📁 categories
diff --git a/docs/dev/plans/background-auto-estimate.md b/docs/dev/plans/background-auto-estimate.md
new file mode 100644
index 000000000..f6a31703c
--- /dev/null
+++ b/docs/dev/plans/background-auto-estimate.md
@@ -0,0 +1,276 @@
+# Plan: Automatic Line-Segment Background Estimation
+
+This plan follows [`AGENTS.md`](../../../AGENTS.md) and implements the
+[`background-auto-estimate`](../adrs/suggestions/background-auto-estimate.md)
+ADR (drafted via `/draft-adr`, review cycle closed at the sentinel).
+
+**Dependency authorization (for `/draft-impl-1`):** this plan **names
+the new runtime dependency `pybaselines`** explicitly (P1.1,
+_Decisions_, _Concrete files_). Per [`AGENTS.md`](../../../AGENTS.md) →
+**Architecture**, that naming — combined with the user invoking
+`/draft-impl-1` / `/draft-impl-2` — is the pre-approval that lets those
+shortcuts edit `pyproject.toml`, `pixi.toml`, and `pixi.lock`
+autonomously. No other deliberate exception to `AGENTS.md` is taken.
+
+## ADR
+
+This plan owns the ADR
+[`docs/dev/adrs/suggestions/background-auto-estimate.md`](../adrs/suggestions/background-auto-estimate.md).
+The ADR stays a **suggestion** (Status: Proposed) for this PR; promotion
+to `accepted/` is intentionally **out of scope** here and can follow
+when the team formally accepts it. (`/review-plan` may request promotion
+as a P1 step; if so, it becomes a one-line docs step that `git mv`s the
+file, flips the Status line, and updates the index row.)
+`/draft-impl-1`'s Phase A commits the ADR from its current
+`suggestions/` location and removes the design-phase `_review-*` /
+`_reply-*` siblings.
+
+## Branch and PR
+
+- Branch: **`background-auto-estimate`** (flat slug off `develop`, no
+  `feature/` prefix). Do not push unless asked.
+- PR targets **`develop`**.
+
+## Decisions (settled in the ADR)
+
+- **Public API.** A user-invoked
+  `LineSegmentBackground.auto_estimate(*, method='auto', width=None, smoothness=None, n_points=None, use_model=True)`
+  — zero-arg must work, no `free` argument, no `**kwargs`. Returns
+  `None`, logs a one-line summary (method, width, point count).
+  **Never** runs inside `_update()` / at calculation time.
+- **Two-stage algorithm.** Stage 1 estimates a peak-insensitive
+  background curve `B(x)`; Stage 2 thins it to sparse `(x, intensity)`
+  anchors with Ramer–Douglas–Peucker simplification (endpoints always
+  kept, optional `n_points` cap). Anchor heights come from `B(x)`,
+  clipped to `0 ≤ intensity ≤ intensity_meas` (always the original
+  measured intensities). Dense overlap is handled by **abstention** (no
+  forced anchor).
+- **Auto-parameterization, per dataset.** Peak width `W` (points) is
+  measured from the data (`scipy.signal.find_peaks` → `peak_widths`,
+  robust **~75th percentile** upper estimate to clear CWL angular
+  broadening); noise σ via the MAD of the second difference. The
+  peak/resolution model is **not** used for width by default.
+  Deterministic; one `log.warning` on degenerate input.
+- **One method to start.** A single penalised-least-squares default,
+  **`arpls`**, for every experiment; all per-dataset adaptation via the
+  derived width/noise/tolerance. `method` is a per-call keyword argument
+  validated against a closed `BackgroundEstimatorMethodEnum` with
+  exactly `{auto, snip, arpls, fabc}`; `auto` resolves to `arpls`. The
+  `method` argument is **not** a persisted descriptor. A
+  `beam_mode`/`radiation_probe` policy is deferred to corpus
+  benchmarking.
+- **Backend.** `pybaselines` (approved; BSD-3, runtime deps NumPy+SciPy,
+  both already required) supplies Stage-1 `B(x)` (and the classification
+  mask). The in-house layer owns the parameterization, Stage-2 thinning,
+  clipping, model-guided re-run, and the point lifecycle.
+- **Model-guided re-run.** When a calculation has run, the helper input
+  is the **peak-subtracted measured intensities**
+  `y = intensity_meas − (intensity_calc − intensity_bkg)` (not the fit
+  residual), so `B(x)` is the **absolute** background — emitted points
+  are absolute heights, no add-back. Peak positions are detected from
+  the peak-only model array `intensity_calc − intensity_bkg`. Everything
+  comes from the backend-independent `data.*` arrays; **no
+  `experiment.refln`** dependency (identical for Cryspy and CrysFML).
+  Data-only path (no calculation yet, or `use_model=False`) passes
+  `y = intensity_meas`.
+- **Lifecycle.** Every call **overwrites and re-fixes**: clears the
+  collection and rebuilds it with **fixed** points
+  (`intensity.free = False`) regardless of prior free state; no append
+  mode. When the collection is non-empty it logs a one-line notice that
+  it is replacing the existing points (first call is silent). Sequential
+  string ids (`'1', '2', …`). Excluded regions are honoured
+  automatically (`data.x` / `data.intensity_meas` iterate active points
+  only).
+
+## Open questions
+
+- **Empirical calibration (to be resolved during Phase 2, not
+  blocking).** The Stage-2 tolerance multiplier (`c · σ`, proposed
+  `c ≈ 2`), the width percentile (proposed ~75th), and confirmation that
+  the single `arpls` default holds across the tutorial corpus (CWL/TOF,
+  neutron/X-ray). Record anything surprising in the ADR.
+- **ADR promotion** to `accepted/` is out of scope here (see _ADR_);
+  flagged for `/review-plan` to confirm or request.
+
+## Concrete files likely to change
+
+- `pyproject.toml` — add `'pybaselines>=1.1'` to `dependencies` (the
+  version that ships the classification `mask` + `min_length` and
+  `fabc`).
+- `pixi.lock` — regenerated via `pixi lock` after the `pyproject.toml`
+  edit. `pixi.toml` likely needs **no** edit (the package is installed
+  editable, so the new runtime dep flows from `pyproject.toml`); add a
+  pin there only if `pixi lock` cannot resolve it.
+- `src/easydiffraction/datablocks/experiment/categories/background/enums.py`
+  — add `BackgroundEstimatorMethodEnum` (`auto`, `snip`, `arpls`,
+  `fabc`) with `default()` / `description()`, matching
+  `BackgroundTypeEnum`.
+- `src/easydiffraction/datablocks/experiment/categories/background/estimate.py`
+  — **new** pure-function estimator module (parameterization + Stage-1
+  via `pybaselines` + Stage-2 thinning).
+- `src/easydiffraction/core/collection.py` — reusable `clear()` on
+  `CollectionBase` via `_adopt_items([])` (unlink children, empty
+  `_items`, rebuild `_index`). Used by the overwrite contract.
+- `src/easydiffraction/core/category.py` — `CategoryCollection.clear()`
+  override (calls `super().clear()` then `_mark_parent_dirty()`), since
+  `CategoryCollection` is defined here, not in `collection.py`.
+- `src/easydiffraction/datablocks/experiment/categories/background/line_segment.py`
+  — add `LineSegmentBackground.auto_estimate()` (the thin adapter).
+- `docs/dev/adrs/suggestions/background-auto-estimate.md` and
+  `docs/dev/adrs/index.md` — already written; committed by
+  `/draft-impl-1` Phase A (not edited again here).
+- Phase 2 (tests):
+  `tests/unit/easydiffraction/datablocks/experiment/categories/background/test_estimate.py`
+  (**new**), `…/test_line_segment.py` (update for `auto_estimate`), unit
+  coverage for `CollectionBase.clear()`, and a
+  `tests/functional/…/background/` tutorial-corpus comparison test (run
+  by `pixi run functional-tests`).
+
+## Implementation steps (Phase 1)
+
+Each `- [ ]` step is one atomic commit. Per `AGENTS.md` → §Commits,
+stage only the files the step names, with explicit paths, and commit
+locally with the step's `Commit:` message **before** moving to the next
+step or the Phase 1 review gate. Mark `[x]` in this file as part of the
+same commit. Phase 1 is **code + docs only — no tests** (those are
+Phase 2).
+
+- [ ] **P1.1 — Add `pybaselines` dependency.** Add `'pybaselines>=1.1'`
+      to the `dependencies` list in `pyproject.toml` (it is the new
+      runtime backend, §4 of the ADR). Run `pixi lock` to regenerate
+      `pixi.lock`. Stage `pyproject.toml` and `pixi.lock` (and
+      `pixi.toml` only if a direct pin was required). Commit:
+      `Add pybaselines dependency`
+
+- [ ] **P1.2 — Add `BackgroundEstimatorMethodEnum`.** In `enums.py`, add
+      a `StrEnum` with members `AUTO='auto'`, `SNIP='snip'`,
+      `ARPLS='arpls'`, `FABC='fabc'`, plus `default()` (returns `AUTO`)
+      and `description()`, following the existing `BackgroundTypeEnum`.
+      No `__init__.py` change (the enum is imported directly, like
+      `BackgroundTypeEnum`). Commit: `Add BackgroundEstimatorMethodEnum`
+
+- [ ] **P1.3 — Add the background curve estimator helper.** Create the
+      new module `estimate.py` with a pure
+      `estimate_background_curve(x, y, *, method='arpls', beam_mode, peaks=None, width=None, smoothness=None, n_points=None) -> (curve, anchors)`.
+      `method` is the **resolved** Stage-1 algorithm (`snip` / `arpls` /
+      `fabc` — never `auto`) and selects the `pybaselines` routine, so
+      **all backend dispatch lives in the helper**, not the adapter.
+      Derive `W` (find_peaks → peak_widths, ~75th percentile) and noise
+      σ (MAD of the second difference) when not supplied; compute the
+      Stage-1 `B(x)` via the selected `pybaselines` routine; thin `B(x)`
+      to anchors by RDP with tolerance `c · σ` (endpoints kept, optional
+      `n_points` cap). Array-in/array-out, no model state, no domain
+      imports. Extract helpers to stay under the lint complexity
+      thresholds. Commit: `Add background curve estimator helper`
+
+- [ ] **P1.4 — Add `CollectionBase.clear()`.** Add a bulk reset to
+      `CollectionBase` (`core/collection.py`). It must **not** be a bare
+      `self._items = []`: that would leave the name index `_index` stale
+      and the removed children with a stale `_parent`. Implement it by
+      delegating to the existing teardown primitive
+      `self._adopt_items([])`, which unlinks every child
+      (`_parent = None`), empties `_items`, and rebuilds `_index` — the
+      same invariants `__delitem__` already maintains. Because
+      `_adopt_items()` does not notify a dirty-tracking owner, override
+      `clear()` on `CategoryCollection` (in `core/category.py`) to call
+      `super().clear()` then `self._mark_parent_dirty()`, mirroring how
+      `CategoryCollection.add()` layers dirty-marking on the base
+      mutator. Stage **both** `src/easydiffraction/core/collection.py`
+      and `src/easydiffraction/core/category.py`. (Unit coverage for
+      these invariants is added in Phase 2.) Commit:
+      `Add clear method to CollectionBase`
+
+- [ ] **P1.5 — Add `LineSegmentBackground.auto_estimate()`.** In
+      `line_segment.py`, add the public method (signature in
+      _Decisions_). It: reads `self._parent.data`; chooses the helper
+      input `y` — data-only `intensity_meas`, or, when `use_model` and
+      `np.any(intensity_calc)`, the peak-subtracted
+      `intensity_meas − (intensity_calc − intensity_bkg)` and `peaks`
+      detected from the peak-only model array; resolves `method='auto'`
+      to `arpls` and passes the resolved method into the helper (which
+      owns Stage-1 dispatch); clips heights to `[0, intensity_meas]`;
+      `clear()`s the collection (logging the replace notice when it was
+      non-empty) and `create()`s fixed points with sequential ids; logs
+      the one-line summary. Validate `method` against
+      `BackgroundEstimatorMethodEnum` centrally. Numpy-style docstring;
+      no `**kwargs`. Commit:
+      `Add auto_estimate to LineSegmentBackground`
+
+- [ ] **P1.6 — Phase 1 review gate.** No code. Mark this `[x]`, commit
+      the checklist update alone, and hand off to `/review-impl-1`.
+      Commit: `Reach Phase 1 review gate`
+
+## Phase 2 — Verification
+
+Add/update tests, then run the checks below. **Stop after Phase 1 for
+review before starting Phase 2.**
+
+Tests to add/update (unit tests mirror the source tree per
+[`test-strategy.md`](../adrs/accepted/test-strategy.md)):
+
+- **`test_estimate.py` (new)** on the pure helper: synthetic patterns
+  with a known analytic background (flat, linear, smooth curve, TOF-like
+  decay) plus planted Gaussians including a deliberately overlapped
+  multiplet — assert the recovered points reproduce the true background
+  within tolerance, **no anchor lands on a planted peak**, and none
+  exceeds the local data; **CWL angular broadening** (FWHM grows with x)
+  keeps the background off the broad peaks; **model-guided re-run** with
+  a supplied peak-only model places better anchors **and** yields
+  **absolute** background heights (not residual corrections);
+  **determinism** (same input → same points); **graceful degradation**
+  (peakless input → single warning, not a crash).
+- **`test_line_segment.py` (update)** for `auto_estimate` lifecycle:
+  overwrite-and-re-fix (fixed points even when prior ones were freed),
+  the replace notice on a non-empty collection, sequential ids, and
+  data-only vs model-guided dispatch. Also assert each
+  `BackgroundEstimatorMethodEnum` value is accepted and reaches Stage-1
+  dispatch (`auto`→`arpls`, plus `snip` / `arpls` / `fabc`), and that an
+  invalid method is rejected.
+- **`CollectionBase.clear()` invariants (new unit coverage)**: after
+  `clear()` the collection is empty, name lookups fail (`_index`
+  cleared), every prior child has `_parent is None`, and a
+  `CategoryCollection` marks its parent dirty — tested directly, not
+  only via `auto_estimate()`.
+- **Functional tutorial-corpus comparison** in `tests/functional/`
+  (data-only, no engine; run by `pixi run functional-tests`): load
+  representative tutorial experiments — CWL
+  [`ed-2.py`](../../docs/tutorials/ed-2.py),
+  [`ed-17.py`](../../docs/tutorials/ed-17.py); TOF
+  [`ed-13.py`](../../docs/tutorials/ed-13.py),
+  [`ed-16.py`](../../docs/tutorials/ed-16.py) — strip their hand-placed
+  points, run `auto_estimate()`, and assert the recovered curve matches
+  the original within tolerance. Use this to calibrate `c` and the width
+  percentile and confirm the single `arpls` default.
+- Verify the test-structure mirror with `pixi run test-structure-check`.
+
+Verification commands (zsh-safe log capture where output is needed):
+
+```bash
+pixi run fix
+pixi run check > /tmp/easydiffraction-check.log 2>&1; check_exit_code=$?; tail -n 200 /tmp/easydiffraction-check.log; exit $check_exit_code
+pixi run test-structure-check > /tmp/easydiffraction-structure.log 2>&1; structure_exit_code=$?; tail -n 100 /tmp/easydiffraction-structure.log; exit $structure_exit_code
+pixi run unit-tests > /tmp/easydiffraction-unit.log 2>&1; unit_tests_exit_code=$?; tail -n 200 /tmp/easydiffraction-unit.log; exit $unit_tests_exit_code
+pixi run functional-tests > /tmp/easydiffraction-functional.log 2>&1; functional_tests_exit_code=$?; tail -n 200 /tmp/easydiffraction-functional.log; exit $functional_tests_exit_code
+pixi run integration-tests > /tmp/easydiffraction-integration.log 2>&1; integration_tests_exit_code=$?; tail -n 200 /tmp/easydiffraction-integration.log; exit $integration_tests_exit_code
+pixi run script-tests > /tmp/easydiffraction-script.log 2>&1; script_tests_exit_code=$?; tail -n 200 /tmp/easydiffraction-script.log; exit $script_tests_exit_code
+```
+
+If implementation uncovers a serious requirement, risk, design issue, or
+a scope change not covered by this plan — for example a public-API
+change beyond what the ADR approved, or a dependency the plan does not
+name — **stop and ask** before proceeding, per `AGENTS.md` → §Planning.
+
+## Suggested Pull Request
+
+**Title:** Add one-call automatic background estimation for powder
+patterns
+
+**Description:** Setting up a line-segment background used to mean
+placing every anchor point by hand — tedious, and easy to get wrong
+where peaks overlap and the pattern never returns to baseline. This
+change adds `experiment.background.auto_estimate()`: call it with no
+arguments and it detects a sensible set of background points directly
+from your measured pattern, placing them between peaks and reading their
+heights from a peak-insensitive background curve so they don't eat into
+peak intensities. The points are ordinary, editable control points —
+review them, keep them fixed, or free any of them for refinement. Run it
+again after an initial fit and it uses the fitted model to place even
+better points, especially across crowded regions. It works for both
+constant-wavelength and time-of-flight data, neutron and X-ray.
diff --git a/docs/dev/plans/space-group-database.md b/docs/dev/plans/space-group-database.md
new file mode 100644
index 000000000..9710b0561
--- /dev/null
+++ b/docs/dev/plans/space-group-database.md
@@ -0,0 +1,275 @@
+# Plan: Complete Space-Group Reference Database
+
+This plan follows [`AGENTS.md`](../../../AGENTS.md) and implements the
+[`space-group-database`](../adrs/suggestions/space-group-database.md)
+ADR.
+
+**Deliberate exception to note for `/draft-impl-1`:** Phase 1 contains a
+**maintainer-only curation gate** (P1.4). The disagreement report is
+generated by the agent, but selecting authoritative values is a human
+decision (the maintainer inspects sources + International Tables and
+fills the overrides file). `/draft-impl-1` must **stop at P1.4 and
+wait** for the maintainer; it resumes at P1.5 once the ADR companion
+overrides file is populated (or confirmed empty because all machine
+sources agreed).
+
+**Deliberate exception to the normal checked-in tooling pattern:** the
+space-group source bundle, extraction helpers, generator, and comparison
+tables live under ignored `tmp/space-groups/`. They are one-time
+curation artifacts, not branch deliverables. The branch commits the
+final generated database, the ADR companion overrides file, and ADR
+provenance; the local helper path and SHA-256 are recorded so a future
+careful rebuild remains possible from the preserved local workspace.
+
+## ADR
+
+This plan owns the ADR
+[`docs/dev/adrs/suggestions/space-group-database.md`](../adrs/suggestions/space-group-database.md)
+(drafted via `/draft-adr`, review cycle closed). It is a
+**prerequisite** for
+[`wyckoff-letter-detection`](../adrs/suggestions/wyckoff-letter-detection.md):
+this plan delivers the complete data; that feature delivers the
+`''`→`None` consumer handling so the triclinic groups use it.
+
+## Branch and PR
+
+- Branch: **`space-group-database`** (flat slug off `develop`, no
+  `feature/` prefix). Do not push unless asked.
+- PR targets **`develop`**.
+
+## Decisions (settled in the ADR)
+
+- **Format:** `space_groups.json.gz` (gzip-compressed JSON). Drop the
+  pickle and the `_RestrictedUnpickler`; the loader `json.load`s the
+  decompressed stream and rebuilds the in-memory dict.
+- **In-memory shape unchanged:** `SPACE_GROUPS` stays a dict keyed by
+  `(IT_number, IT_coordinate_system_code)`; on disk it is a list of
+  setting records carrying those two canonical fields. Existing
+  consumers (`crystallography.py`, `calculators/cryspy.py`) are
+  untouched.
+- **Source priority:** cryspy `wyckoff.dat` first for Wyckoff-facing
+  values (letters, multiplicities, site symmetries, representative
+  coordinate orbits); cctbx/sgtbx for setting-level metadata and
+  operation checks. cctbx is **generation-only**, installed into a
+  **throwaway environment** for the one-time build and never added to
+  the project's runtime dependencies (`cctbx` is named here for
+  `/draft-impl-1` pre-approval, but it is _not_ a pyproject runtime
+  dep).
+- **Scope:** all 230 groups × all standard settings and public
+  coordinate-code aliases × full Wyckoff orbits, plus the
+  **symmetry-core** metadata `hall_symbol`, general-position `symop`
+  list, `generators`, `point_group`, `laue_class`, `centring` (further
+  fields deferred per the ADR).
+- **Cross-check sources:** cryspy `data/cryspy/wyckoff.dat`, gemmi
+  (settings + ops + orbit-closure of a given representative), parsed
+  Avogadro/SgInfo setting data, and the full RASPA appendix CSV under
+  `data/raspa/`; **International Tables** is the maintainer's authority
+  for flagged cases (PDF — not machine-readable, so not automated).
+- **Curation:** disagreements (≥2 machine sources differ) → local
+  grouped Markdown/CSV exports under
+  `tmp/space-groups/extracted-comparison/`; maintainer selections are
+  the checked-in ADR companion record (list of records, each with
+  rationale).
+- **Build is one-time:** the exact software versions are recorded in the
+  ADR's _Build Provenance_ section; no recurring pipeline.
+
+## Open questions
+
+- None blocking. The exact cctbx field availability (e.g. whether every
+  symmetry-core field is exposed directly or must be derived) is
+  resolved empirically while writing the generator (P1.1); record
+  anything surprising in the ADR.
+
+## Concrete files likely to change
+
+- `tmp/space-groups/helper-tools/generate_space_groups.py` — local
+  ignored generator (cctbx extraction + multi-source cross-check +
+  disagreement report + overrides consumption). Do not keep this helper
+  in the branch after implementation.
+- `docs/dev/adrs/suggestions/space-group-database/space_groups_overrides.yaml`
+  — **new** curation overrides (maintainer-authored at P1.4). Keep the
+  selected values here, not inside this plan: the plan documents
+  workflow, while YAML is the structured generator input with a focused
+  review diff. If the ADR is accepted, move this companion file into the
+  accepted ADR companion folder with the ADR.
+- `tmp/space-groups/extracted-comparison/` — local grouped Markdown/CSV
+  exports, including one CSV per compared field.
+- `src/easydiffraction/crystallography/space_groups.json.gz` — **new**
+  generated database; **remove** `space_groups.pkl.gz`.
+- `src/easydiffraction/crystallography/space_groups.py` — rewrite loader
+  (read JSON, reconstruct dict, drop `_RestrictedUnpickler` + `pickle`).
+- `docs/dev/adrs/suggestions/space-group-database.md` — fill in _Build
+  Provenance_ with recorded versions.
+- `tools/check_packaged_db.py` — **new** helper that inspects a built
+  wheel (independent of the package's dependency tree): it reads
+  `space_groups.json.gz` straight from the wheel and asserts the data
+  ships, the obsolete `.pkl.gz` is gone, and all 230 groups plus the
+  cryspy coordinate-code alias surface are present (used by the Phase 2
+  packaging regression).
+- `pyproject.toml` — **only if** the Phase 2 packaging test shows the
+  `.json.gz` is not shipped (add a hatch `artifacts`/`force-include`
+  entry).
+- Phase 2:
+  `tests/unit/easydiffraction/crystallography/test_space_groups.py` and
+  `test_space_groups_coverage.py` (JSON loader, presence,
+  query-surface, and spot-check tests); a wheel import/load packaging
+  test.
+
+## Implementation steps (Phase 1)
+
+Each `- [ ]` step is one atomic commit. Per §Commits, stage only the
+files the step names, with explicit paths, and commit locally with the
+step's `Commit:` message **before** moving to the next step. Mark `[x]`
+in this file as part of the same commit.
+
+- [x] **P1.1 — cctbx extraction to a complete setting table.** Write the
+      first part of
+      `tmp/space-groups/helper-tools/generate_space_groups.py`: in a
+      throwaway env with `cctbx` installed, enumerate all 230 groups ×
+      standard settings via sgtbx, emit the available symmetry-core
+      metadata and cctbx Wyckoff/orbit candidates into the in-memory
+      record list keyed by `(IT_number, IT_coordinate_system_code)`.
+      Keep coordinates/operators as strings (JSON-native). Do not wire a
+      routine pixi task. Commit:
+      `Add cctbx-based space-group table extraction`
+
+- [x] **P1.2 — Multi-source cross-check + disagreement report.** Extend
+      the generator to merge cryspy `wyckoff.dat` Wyckoff-facing values
+      with cctbx setting metadata, then compare against gemmi
+      (`spacegroup_table()` settings/ops + orbit-closure), parsed
+      Avogadro/SgInfo data, and the RASPA CSV. Where ≥2 machine sources
+      disagree on a value, write a report record
+      `{case, per-source values, IT: <blank for maintainer>, Override: <blank for maintainer>}`
+      to the local comparison folder. Consume the ADR companion
+      overrides file if present. P1.3 command:
+
+  ```bash
+  pixi exec --spec cctbx --spec gemmi --spec sympy --spec pyyaml \
+    python tmp/space-groups/helper-tools/generate_space_groups.py \
+    --write-comparison-folder tmp/space-groups/extracted-comparison \
+    --print-summary
+  ```
+
+  Commit: `Add multi-source cross-check and disagreement report`
+
+- [x] **P1.3 — First generation run + commit the report.** Run the
+      generator (cctbx temp-installed) with no overrides to produce the
+      initial local disagreement report. Do not commit the local
+      comparison artifacts or a database file yet. Commit:
+      `Generate initial space-group disagreement report`
+
+- [x] **P1.3a — Localize one-time curation artifacts.** Move the
+      generator and comparison outputs fully into ignored
+      `tmp/space-groups/`; remove the previously tracked generator and
+      report artifacts from the branch. Update the ADR and plan to
+      record that the generator helper is local curation tooling and
+      that the final provenance records its SHA-256 instead of a commit
+      hash. Commit: `Localize space-group curation artifacts`
+
+- [x] **P1.4 — MAINTAINER CURATION GATE (manual).** `/draft-impl-1`
+      **stops here**. The maintainer inspects the report, consults
+      International Tables for flagged cases, and **always** produces a
+      checked-in
+      `docs/dev/adrs/suggestions/space-group-database/space_groups_overrides.yaml`:
+      a list of curated records (each with rationale) when there were
+      disagreements, or — if the report was empty because all machine
+      sources agreed — the same file containing only an explanatory
+      header comment and an empty list. Either way there is a concrete
+      file to stage, so the per-step commit rule holds. The agent
+      resumes at P1.5 only after the maintainer confirms. Commit
+      (maintainer, or agent on resume):
+      `Add curated space-group overrides`
+
+- [x] **P1.5 — Final generation + provenance.** Re-run the generator
+      consuming the overrides to emit
+      `src/easydiffraction/crystallography/space_groups.json.gz`. Fill
+      in the ADR's _Build Provenance_ section with the exact versions
+      (cctbx channel/version/build/install command, Python/platform,
+      gemmi/cryspy versions + `wyckoff.dat` SHA-256, gathered-input
+      origins+SHA-256, generator helper SHA-256 + command, output
+      SHA-256). Commit:
+      `Generate complete space_groups.json.gz with recorded provenance`
+
+- [x] **P1.6 — Rewrite loader, drop pickle.** Rewrite
+      `src/easydiffraction/crystallography/space_groups.py` to read
+      `space_groups.json.gz` and rebuild the
+      `(IT_number, IT_coordinate_system_code)`-keyed `SPACE_GROUPS`
+      dict; remove `_RestrictedUnpickler` and the `pickle` import.
+      `git rm` the old `space_groups.pkl.gz`. Commit:
+      `Load space groups from JSON and drop restricted unpickler`
+
+- [x] **P1.7 — Phase 1 review gate.** No code. Mark this `[x]`, commit
+      the checklist update alone, and hand off to `/review-impl-1`.
+      Commit: `Reach Phase 1 review gate`
+
+## Phase 2 — Verification
+
+Add/update tests, then run the checks below. Stop after Phase 1 for
+review before starting Phase 2.
+
+Tests to add/update (in `tests/unit/easydiffraction/crystallography/`,
+mirroring source):
+
+- update `test_space_groups.py` / `test_space_groups_coverage.py` for
+  the JSON loader (no pickle);
+- **presence**: all 230 groups + standard settings load (regression vs
+  the current 42-group / 18-setting gap);
+- **query surface (parity with today, no new index)**: every
+  standard-setting `(IT_number, IT_coordinate_system_code)` entry loads
+  from the DB, every coordinate-system code currently exposed by
+  cryspy's `get_it_coordinate_system_codes_by_it_number` resolves in
+  `SPACE_GROUPS`, and for each group the _existing_ cryspy-backed
+  `get_it_number_by_name_hm_short` resolution still returns an IT number
+  that is present in the DB. This verifies "at least as queryable as
+  today" against the loaded dict and the unchanged H-M path; a
+  database-derived H-M index is **not** added here (it stays Deferred
+  Work in the ADR);
+- **spot-checks vs International Tables** for P4, P3, P6, Pm-3, a
+  monoclinic with cell choices, and an origin-choice group;
+- **packaging**: `tools/check_packaged_db.py` opens the built **wheel**
+  and reads `space_groups.json.gz` directly from it (no install, so the
+  check is independent of the package's dependency tree), asserting the
+  data ships, the obsolete `.pkl.gz` is absent, and all 230 groups plus
+  the cryspy coordinate-code alias surface are present. This catches
+  package-data omission for the renamed `.json.gz` regardless of
+  unrelated runtime-import issues.
+
+Verification commands (zsh-safe log capture where output is needed):
+
+```bash
+pixi run fix
+pixi run check > /tmp/easydiffraction-check.log 2>&1; check_exit_code=$?; tail -n 200 /tmp/easydiffraction-check.log; exit $check_exit_code
+pixi run unit-tests > /tmp/easydiffraction-unit.log 2>&1; unit_tests_exit_code=$?; tail -n 200 /tmp/easydiffraction-unit.log; exit $unit_tests_exit_code
+pixi run integration-tests > /tmp/easydiffraction-integration.log 2>&1; integration_tests_exit_code=$?; tail -n 200 /tmp/easydiffraction-integration.log; exit $integration_tests_exit_code
+pixi run script-tests > /tmp/easydiffraction-script.log 2>&1; script_tests_exit_code=$?; tail -n 200 /tmp/easydiffraction-script.log; exit $script_tests_exit_code
+```
+
+Packaging regression — build the wheel and inspect it directly (no
+install, so the check does not depend on the package's full runtime
+dependency tree):
+
+```bash
+rm -rf dist
+pixi run dist-build > /tmp/easydiffraction-build.log 2>&1; build_exit_code=$?; tail -n 8 /tmp/easydiffraction-build.log; [ "$build_exit_code" -eq 0 ] || exit "$build_exit_code"
+python tools/check_packaged_db.py dist/*.whl; pkg_check_exit_code=$?; [ "$pkg_check_exit_code" -eq 0 ] || exit "$pkg_check_exit_code"
+```
+
+If this shows `.json.gz` is not shipped, add a hatch
+`artifacts`/`force-include` entry in `pyproject.toml` and re-run.
+
+## Suggested Pull Request
+
+**Title:** Complete the bundled space-group database (all 230 groups)
+
+**Description:** EasyDiffraction's bundled space-group table was missing
+42 common space groups entirely — including P4, P3, P6, and Pm-3 — plus
+many alternative monoclinic settings, so symmetry constraints and
+Wyckoff information silently did nothing for structures in those groups.
+This change rebuilds the database from curated cryspy and cctbx/sgtbx
+source data, covering all 230 groups, their standard settings, and every
+public coordinate-code alias with full symmetry information. The seed
+data is cross-checked against several independent references and keeps
+flagged rows visible for later International Tables verification. The
+data now ships as transparent, inspectable JSON instead of an opaque
+binary pickle. Existing projects load unchanged; structures in the
+previously-missing groups now get correct symmetry handling.
diff --git a/docs/docs/tutorials/ed-13.ipynb b/docs/docs/tutorials/ed-13.ipynb
index db36a147e..ad016e87f 100644
--- a/docs/docs/tutorials/ed-13.ipynb
+++ b/docs/docs/tutorials/ed-13.ipynb
@@ -2671,7 +2671,7 @@
     "\n",
     "If you'd like to keep exploring, the EasyDiffraction library offers\n",
     "many additional tutorials and examples on the official documentation\n",
-    "site: 👉 https://docs.easydiffraction.org/lib/tutorials/\n",
+    "site: 👉 https://docs.easydiffraction.org/lib/latest/tutorials\n",
     "\n",
     "Besides the Python package, EasyDiffraction also comes with a\n",
     "graphical user interface (GUI) that lets you perform similar analyses\n",
diff --git a/docs/docs/tutorials/ed-13.py b/docs/docs/tutorials/ed-13.py
index 655e270b3..a72473422 100644
--- a/docs/docs/tutorials/ed-13.py
+++ b/docs/docs/tutorials/ed-13.py
@@ -1508,7 +1508,7 @@
 #
 # If you'd like to keep exploring, the EasyDiffraction library offers
 # many additional tutorials and examples on the official documentation
-# site: 👉 https://docs.easydiffraction.org/lib/tutorials/
+# site: 👉 https://docs.easydiffraction.org/lib/latest/tutorials
 #
 # Besides the Python package, EasyDiffraction also comes with a
 # graphical user interface (GUI) that lets you perform similar analyses
diff --git a/src/easydiffraction/crystallography/space_groups.json.gz b/src/easydiffraction/crystallography/space_groups.json.gz
new file mode 100644
index 000000000..75d4f80ce
Binary files /dev/null and b/src/easydiffraction/crystallography/space_groups.json.gz differ
diff --git a/src/easydiffraction/crystallography/space_groups.pkl.gz b/src/easydiffraction/crystallography/space_groups.pkl.gz
deleted file mode 100644
index a9682a022..000000000
Binary files a/src/easydiffraction/crystallography/space_groups.pkl.gz and /dev/null differ
diff --git a/src/easydiffraction/crystallography/space_groups.py b/src/easydiffraction/crystallography/space_groups.py
index e370d116b..d3ceee287 100644
--- a/src/easydiffraction/crystallography/space_groups.py
+++ b/src/easydiffraction/crystallography/space_groups.py
@@ -3,96 +3,34 @@
 """
 Space group reference data.
 
-Loads a gzipped, packaged pickle with crystallographic space-group
+Loads gzipped, packaged JSON with crystallographic space-group
 information. The file is part of the distribution; user input is not
 involved.
 """
 
-import builtins
+from __future__ import annotations
+
 import gzip
-import io
-import pickle  # noqa: S403
+import json
 from pathlib import Path
-from typing import override
-
-_SAFE_BUILTINS = frozenset({
-    'dict',
-    'frozenset',
-    'list',
-    'set',
-    'tuple',
-})
-
-
-class _RestrictedUnpickler(pickle.Unpickler):  # noqa: S301
-    """
-    Unpickler that only allows safe built-in types.
-
-    Rejects any ``GLOBAL`` opcode that references modules or classes
-    outside of ``builtins``, limiting deserialisation to plain Python
-    data structures (dicts, lists, tuples, sets, frozensets) plus
-    primitive scalars (str, int, float, bool, None) which the pickle
-    protocol handles without ``GLOBAL``.
-    """
-
-    @override
-    def find_class(
-        self,
-        module: str,
-        name: str,
-    ) -> type:
-        """
-        Allow only safe built-in types.
-
-        Parameters
-        ----------
-        module : str
-            The module name from the pickle stream.
-        name : str
-            The class/function name from the pickle stream.
-
-        Returns
-        -------
-        type
-            The resolved built-in type.
+from typing import Any
 
-        Raises
-        ------
-        pickle.UnpicklingError
-            If the requested type is not in the safe set.
-        """
-        if module == 'builtins' and name in _SAFE_BUILTINS:
-            return getattr(builtins, name)
-        msg = f'Restricted unpickler refused {module}.{name}'
-        raise pickle.UnpicklingError(msg)
+_SpaceGroupKey = tuple[int, str | None]
+_SpaceGroupRecord = dict[str, Any]
 
 
-def _restricted_pickle_load(file_obj: io.BufferedIOBase) -> object:
-    """
-    Load pickle data using a restricted unpickler.
-
-    Only safe built-in types (dict, list, tuple, set, frozenset, and
-    primitive scalars) are permitted. The archive lives in the package;
-    no user-controlled input enters this function.
-
-    Parameters
-    ----------
-    file_obj : io.BufferedIOBase
-        Binary file object to read pickle data from.
-
-    Returns
-    -------
-    object
-        The deserialised Python data structure.
-    """
-    return _RestrictedUnpickler(file_obj).load()
-
-
-def _load() -> object:
+def _load() -> dict[_SpaceGroupKey, _SpaceGroupRecord]:
     """Load space-group data from the packaged archive."""
-    path = Path(__file__).with_name('space_groups.pkl.gz')
-    with gzip.open(path, 'rb') as f:
-        return _restricted_pickle_load(f)
-
-
-SPACE_GROUPS = _load()
+    path = Path(__file__).with_name('space_groups.json.gz')
+    with gzip.open(path, 'rt', encoding='utf-8') as file_handle:
+        records = json.load(file_handle)
+    return {
+        (
+            record['IT_number'],
+            record['IT_coordinate_system_code'],
+        ): record
+        for record in records
+    }
+
+
+SPACE_GROUPS: dict[_SpaceGroupKey, _SpaceGroupRecord] = _load()
diff --git a/src/easydiffraction/display/plotters/plotly.py b/src/easydiffraction/display/plotters/plotly.py
index 875b6ae55..b6b478e35 100644
--- a/src/easydiffraction/display/plotters/plotly.py
+++ b/src/easydiffraction/display/plotters/plotly.py
@@ -100,6 +100,14 @@
 AXIS_TITLE_FONT_SIZE = 12
 X_AXIS_TICK_LABEL_STANDOFF = 5
 Y_AXIS_TICK_LABEL_STANDOFF = 6
+HOVER_LABEL_FONT_SIZE = 12
+# Plotly has no hover-label padding option, so a non-breaking space is
+# added to both ends of each template line to hold the text off the
+# left and right frame. Vertical spacing is left to Plotly's own ~3px
+# line box: a blank spacer line would reserve a full content-line
+# height, inflating the bottom margin with no way to tune it, so one
+# space per side keeps all four margins small and even.
+HOVER_HORIZONTAL_PAD = '\u00a0'
 PREDICTIVE_BAND_COLOR = 'rgba(214, 39, 40, 0.14)'
 PREDICTIVE_BAND_EDGE_COLOR = 'rgba(214, 39, 40, 0.45)'
 PREDICTIVE_DRAW_COLOR = 'rgba(140, 140, 140, 0.18)'
@@ -322,6 +330,50 @@ def _legend_background_color(cls) -> str:
         """Return a half-transparent legend background color."""
         return cls._theme_colors().legend_background
 
+    @classmethod
+    def _hover_label_style(
+        cls,
+        theme_colors: DisplayThemeColors | None = None,
+    ) -> dict:
+        """
+        Return the shared hover-label style for every Plotly figure.
+
+        This is the single source of truth for tooltip framing. The
+        border matches the Axes-rectangle (axis-frame) color and the
+        background follows the active theme. Per-line text colors live
+        in each trace's hover template, not here.
+
+        Parameters
+        ----------
+        theme_colors : DisplayThemeColors | None, default=None
+            Explicit theme colors; the active theme is used when
+            omitted.
+
+        Returns
+        -------
+        dict
+            A Plotly ``hoverlabel`` style dictionary.
+        """
+        colors = theme_colors if theme_colors is not None else cls._theme_colors()
+        return {
+            'bgcolor': colors.hover_background,
+            'bordercolor': colors.axis_frame,
+            'font': {'color': colors.foreground, 'size': HOVER_LABEL_FONT_SIZE},
+            'align': 'left',
+        }
+
+    @classmethod
+    def _apply_hover_label_style(
+        cls,
+        fig: object,
+        *,
+        theme_colors: DisplayThemeColors | None = None,
+    ) -> None:
+        """Apply the shared hover-label style to a Plotly figure."""
+        update_layout = getattr(fig, 'update_layout', None)
+        if callable(update_layout):
+            update_layout(hoverlabel=cls._hover_label_style(theme_colors))
+
     @staticmethod
     def _background_color_for_template(template: str) -> str | None:
         theme_colors = display_theme_colors_for_template(template)
@@ -554,8 +606,9 @@ def _get_correlation_label_trace(
             showlegend=False,
         )
 
-    @staticmethod
+    @classmethod
     def _get_powder_trace(
+        cls,
         x: object,
         y: object,
         label: str,
@@ -623,10 +676,50 @@ def _get_powder_trace(
             hovertemplate=(
                 hovertemplate
                 if hovertemplate is not None
-                else f'{name}<br>x: %{{x}}<br>y: %{{y}}<extra></extra>'
+                else cls._format_hover_lines([
+                    cls._hover_color_span(name, color),
+                    cls._hover_color_span('x: %{x}', color),
+                    cls._hover_color_span('y: %{y}', color),
+                ])
             ),
         )
 
+    @staticmethod
+    def _hover_text_color(color: str) -> str:
+        """Return a span-safe CSS color (no internal whitespace)."""
+        return color.replace(' ', '')
+
+    @classmethod
+    def _hover_color_span(cls, text: str, color: str) -> str:
+        """Wrap hover text in a span colored to match a trace."""
+        return f'<span style="color:{cls._hover_text_color(color)}">{text}</span>'
+
+    @classmethod
+    def _format_hover_lines(
+        cls,
+        lines: list[str],
+        *,
+        extra: str = '<extra></extra>',
+    ) -> str:
+        """
+        Join hover lines with the padding shared by every tooltip.
+
+        Parameters
+        ----------
+        lines : list[str]
+            Per-line hover content, already colored where needed.
+        extra : str, default='<extra></extra>'
+            Trailing Plotly hover directive (the secondary box).
+
+        Returns
+        -------
+        str
+            A hover-template body padded left and right; top and bottom
+            spacing is supplied by Plotly's own line box.
+        """
+        padded = [f'{HOVER_HORIZONTAL_PAD}{line}{HOVER_HORIZONTAL_PAD}' for line in lines]
+        return '<br>'.join(padded) + extra
+
     @staticmethod
     def _powder_meas_vs_calc_hover_data(plot_spec: PowderMeasVsCalcSpec) -> np.ndarray:
         """Return shared hover values for composite powder traces."""
@@ -649,29 +742,54 @@ def _powder_meas_vs_calc_hover_data(plot_spec: PowderMeasVsCalcSpec) -> np.ndarr
             residual_values,
         ))
 
-    @staticmethod
-    def _powder_meas_vs_calc_hover_template(plot_spec: PowderMeasVsCalcSpec) -> str:
+    @classmethod
+    def _powder_meas_vs_calc_hover_template(
+        cls,
+        plot_spec: PowderMeasVsCalcSpec,
+    ) -> str:
         """
         Return a shared hover template for composite powder traces.
+
+        Each line is colored to match its curve and padded away from the
+        tooltip frame through the shared hover formatter.
         """
         calc_label = plot_spec.y_calc_name or 'Icalc'
         if plot_spec.y_bkg is None:
-            return (
-                'x: %{x:,.2f}<br>'
-                'Imeas: %{customdata[0]:,.2f}<br>'
-                f'{calc_label}: %{{customdata[1]:,.2f}}<br>'
-                f'Imeas - {calc_label}: %{{customdata[2]:,.2f}}'
-                '<extra></extra>'
-            )
+            return cls._format_hover_lines([
+                'x: %{x:,.2f}',
+                cls._hover_color_span(
+                    'Imeas: %{customdata[0]:,.2f}',
+                    DEFAULT_COLORS['meas'],
+                ),
+                cls._hover_color_span(
+                    f'{calc_label}: %{{customdata[1]:,.2f}}',
+                    DEFAULT_COLORS['calc'],
+                ),
+                cls._hover_color_span(
+                    f'Imeas - {calc_label}: %{{customdata[2]:,.2f}}',
+                    DEFAULT_COLORS['resid'],
+                ),
+            ])
 
-        return (
-            'x: %{x:,.2f}<br>'
-            'Imeas: %{customdata[0]:,.2f}<br>'
-            'Ibkg: %{customdata[1]:,.2f}<br>'
-            f'{calc_label}: %{{customdata[2]:,.2f}}<br>'
-            f'Imeas - {calc_label}: %{{customdata[3]:,.2f}}'
-            '<extra></extra>'
-        )
+        return cls._format_hover_lines([
+            'x: %{x:,.2f}',
+            cls._hover_color_span(
+                'Imeas: %{customdata[0]:,.2f}',
+                DEFAULT_COLORS['meas'],
+            ),
+            cls._hover_color_span(
+                'Ibkg: %{customdata[1]:,.2f}',
+                DEFAULT_COLORS['bkg'],
+            ),
+            cls._hover_color_span(
+                f'{calc_label}: %{{customdata[2]:,.2f}}',
+                DEFAULT_COLORS['calc'],
+            ),
+            cls._hover_color_span(
+                f'Imeas - {calc_label}: %{{customdata[3]:,.2f}}',
+                DEFAULT_COLORS['resid'],
+            ),
+        ])
 
     @staticmethod
     def _get_single_crystal_trace(
@@ -1196,6 +1314,7 @@ def _theme_sync_post_script() -> str:
         'legend.bgcolor': colors.legend,
         'legend.font.color': colors.foreground,
         'hoverlabel.bgcolor': colors.hoverBackground,
+        'hoverlabel.bordercolor': colors.axisFrame,
         'hoverlabel.font.color': colors.foreground,
     };
 
@@ -1547,6 +1666,7 @@ def _show_figure(
         """
         config = self._get_config()
         self._apply_background_color(fig)
+        self._apply_hover_label_style(fig)
 
         if in_pycharm() or display is None or HTML is None:
             fig.show(config=config)
@@ -1616,6 +1736,12 @@ def serialize_html(
             if legend_bgcolor is not None:
                 fig.update_layout(legend={'bgcolor': legend_bgcolor})
         cls._apply_background_color(fig, background_color=background_color)
+        hover_theme_colors = (
+            display_theme_colors_for_template(force_template)
+            if force_template is not None
+            else None
+        )
+        cls._apply_hover_label_style(fig, theme_colors=hover_theme_colors)
         html_fig = pio.to_html(
             fig,
             include_plotlyjs=include_plotlyjs,
@@ -1810,14 +1936,20 @@ def _add_excluded_region_vrects(
                 add_kwargs['col'] = col
             fig.add_vrect(**add_kwargs)
 
-    @staticmethod
+    @classmethod
     def _get_bragg_tick_trace(
+        cls,
         tick_set: BraggTickSet,
         row_y: float,
         color: str,
     ) -> object:
         """
         Create a hover-capable Bragg tick trace for one linked phase.
+
+        Only the Miller-index line is colored to match the phase tick
+        marker; the phase name and x line use the default tooltip text
+        color, and all lines share the padding and themed frame used by
+        every other tooltip.
         """
         y = np.full(tick_set.x.shape, row_y, dtype=float)
         hover_text = []
@@ -1825,14 +1957,17 @@ def _get_bragg_tick_trace(
             index_h = int(tick_set.h[idx])
             index_k = int(tick_set.k[idx])
             index_l = int(tick_set.ell[idx])
-            hover_text.append(
-                f'{tick_set.phase_id}<br>'
-                f'x: {float(x_value):,.2f}<br>'
-                f'Miller indices: ({index_h} {index_k} {index_l})<br>'
-                # f'F²cal:{float(tick_set.f_squared_calc[idx]):.6g}<br>'
-                # f'Fcalc:{float(tick_set.f_calc[idx]):.6g}'
-                '<extra></extra>'
-            )
+            lines = [
+                tick_set.phase_id,
+                f'x: {float(x_value):,.2f}',
+                cls._hover_color_span(
+                    f'Miller indices: ({index_h} {index_k} {index_l})',
+                    color,
+                ),
+                # f'F²cal: {float(tick_set.f_squared_calc[idx]):.6g}',
+                # f'Fcalc: {float(tick_set.f_calc[idx]):.6g}',
+            ]
+            hover_text.append(cls._format_hover_lines(lines))
 
         return go.Scatter(
             x=tick_set.x,
@@ -1846,10 +1981,6 @@ def _get_bragg_tick_trace(
             },
             name=f'Bragg peaks: {tick_set.phase_id}',
             text=hover_text,
-            hoverlabel={
-                'font': {'color': 'white'},
-                'bordercolor': 'white',
-            },
             hovertemplate='%{text}',
         )
 
diff --git a/src/easydiffraction/display/tablers/base.py b/src/easydiffraction/display/tablers/base.py
index decb2282f..36b642b09 100644
--- a/src/easydiffraction/display/tablers/base.py
+++ b/src/easydiffraction/display/tablers/base.py
@@ -12,7 +12,10 @@
 from abc import ABC
 from abc import abstractmethod
 
-from IPython import get_ipython
+try:
+    from IPython import get_ipython
+except ImportError:  # IPython is an optional display dependency
+    get_ipython = None
 from rich.color import Color
 
 from easydiffraction.display.theme import DARK_AXIS_FRAME_COLOR
@@ -63,7 +66,9 @@ def _is_dark_theme() -> bool:
         default = True
 
         in_jupyter = (
-            get_ipython() is not None and get_ipython().__class__.__name__ == 'ZMQInteractiveShell'
+            get_ipython is not None
+            and get_ipython() is not None
+            and get_ipython().__class__.__name__ == 'ZMQInteractiveShell'
         )
 
         if not in_jupyter:
diff --git a/tests/unit/easydiffraction/crystallography/test_space_groups.py b/tests/unit/easydiffraction/crystallography/test_space_groups.py
index dd1482cd0..37eab7235 100644
--- a/tests/unit/easydiffraction/crystallography/test_space_groups.py
+++ b/tests/unit/easydiffraction/crystallography/test_space_groups.py
@@ -1,10 +1,74 @@
 # SPDX-FileCopyrightText: 2025 EasyScience contributors <https://github.com/easyscience>
 # SPDX-License-Identifier: BSD-3-Clause
+"""Unit tests for the space-group reference-data loader."""
+
+from easydiffraction.crystallography.space_groups import SPACE_GROUPS
+
+_EXPECTED_RECORD_KEYS = {
+    'IT_number',
+    'IT_coordinate_system_code',
+    'setting',
+    'name_H-M_alt',
+    'crystal_system',
+    'Wyckoff_positions',
+    'hall_symbol',
+    'symop',
+    'generators',
+    'point_group',
+    'laue_class',
+    'centring',
+}
+_EXPECTED_WYCKOFF_KEYS = {'multiplicity', 'site_symmetry', 'coords_xyz'}
+
+# Accepted seed: 530 cctbx settings + 226 reference-settings aliases + 60
+# runtime coordinate-code aliases. A deliberate regeneration updates this.
+_EXPECTED_RECORD_COUNT = 816
 
 
 def test_module_import():
+    """The module imports under its fully qualified dotted name."""
     import easydiffraction.crystallography.space_groups as MUT
-
-    expected_module_name = 'easydiffraction.crystallography.space_groups'
-    actual_module_name = MUT.__name__
-    assert expected_module_name == actual_module_name
+    assert MUT.__name__ == 'easydiffraction.crystallography.space_groups'
+
+
+def test_space_groups_is_dict_keyed_by_it_and_code():
+    """Keys of the non-empty SPACE_GROUPS dict are ``(int, str or None)`` pairs."""
+    assert isinstance(SPACE_GROUPS, dict)
+    assert SPACE_GROUPS
+    for number, code in SPACE_GROUPS:
+        assert isinstance(number, int)
+        assert isinstance(code, str) or code is None
+
+
+def test_all_230_groups_present():
+    """The IT numbers used as keys are exactly 1 through 230, with no gaps."""
+    present = {it_number for it_number, _ in SPACE_GROUPS}
+    assert present == set(range(1, 231))
+
+
+def test_record_count_matches_accepted_seed():
+    """The number of loaded records equals the accepted seed count.
+
+    SPACE_GROUPS is a dict, so its length is also the number of unique keys.
+    """
+    record_count = len(SPACE_GROUPS)
+    assert record_count == _EXPECTED_RECORD_COUNT
+
+
+def test_triclinic_groups_keep_none_coordinate_code():
+    """IT groups 1 and 2 (triclinic P1 and P-1) are keyed with code ``None``."""
+    for it_number in (1, 2):
+        assert (it_number, None) in SPACE_GROUPS
+
+
+def test_every_record_has_the_expected_schema():
+    """Each record has the required keys and agrees with its own dict key."""
+    for key, record in SPACE_GROUPS.items():
+        assert set(record) >= _EXPECTED_RECORD_KEYS, key
+        assert record['IT_number'] == key[0], key
+        assert record['IT_coordinate_system_code'] == key[1], key
+        for letter, position in record['Wyckoff_positions'].items():
+            assert set(position) >= _EXPECTED_WYCKOFF_KEYS, (key, letter)
+            assert isinstance(position['multiplicity'], int), (key, letter)
+            assert isinstance(position['coords_xyz'], list), (key, letter)
+            assert position['coords_xyz'], (key, letter)
diff --git a/tests/unit/easydiffraction/crystallography/test_space_groups_coverage.py b/tests/unit/easydiffraction/crystallography/test_space_groups_coverage.py
index 1792e017b..638a85cd4 100644
--- a/tests/unit/easydiffraction/crystallography/test_space_groups_coverage.py
+++ b/tests/unit/easydiffraction/crystallography/test_space_groups_coverage.py
@@ -1,71 +1,85 @@
-# SPDX-FileCopyrightText: 2026 EasyScience contributors <https://github.com/easyscience>
+# SPDX-FileCopyrightText: 2025 EasyScience contributors <https://github.com/easyscience>
 # SPDX-License-Identifier: BSD-3-Clause
-"""Additional unit tests for space_groups.py to cover RestrictedUnpickler."""
-
-import io
-import pickle  # noqa: S403
-
-import pytest
-
-
-class TestRestrictedUnpickler:
-    def test_loads_plain_dict(self):
-        """Safe built-in types should be allowed."""
-        from easydiffraction.crystallography.space_groups import _restricted_pickle_load
-
-        data = {'key': [1, 2, 3], 'nested': {'a': (True, None)}}
-        buf = io.BytesIO()
-        pickle.dump(data, buf)
-        buf.seek(0)
-        result = _restricted_pickle_load(buf)
-        assert result == data
-
-    def test_loads_set_and_frozenset(self):
-        from easydiffraction.crystallography.space_groups import _restricted_pickle_load
-
-        data = {'s': {1, 2}, 'fs': frozenset({3, 4})}
-        buf = io.BytesIO()
-        pickle.dump(data, buf)
-        buf.seek(0)
-        result = _restricted_pickle_load(buf)
-        assert result == data
-
-    def test_loads_tuple_and_list(self):
-        from easydiffraction.crystallography.space_groups import _restricted_pickle_load
-
-        data = ([1, 2], (3, 4))
-        buf = io.BytesIO()
-        pickle.dump(data, buf)
-        buf.seek(0)
-        result = _restricted_pickle_load(buf)
-        assert result == data
-
-    def test_rejects_unsafe_class(self):
-        """Non-builtin types should be rejected."""
-        from easydiffraction.crystallography.space_groups import _RestrictedUnpickler
-
-        # Create a pickle stream that tries to instantiate os.system
-        buf = io.BytesIO()
-        # Use protocol 2 to get GLOBAL opcode
-        pickle.dump(object(), buf, protocol=2)
-        buf.seek(0)
-
-        # Directly test find_class rejection
-        unpickler = _RestrictedUnpickler(buf)
-        with pytest.raises(pickle.UnpicklingError, match='Restricted unpickler refused'):
-            unpickler.find_class('os', 'system')
-
-    def test_rejects_builtins_not_in_safe_set(self):
-        from easydiffraction.crystallography.space_groups import _RestrictedUnpickler
-
-        buf = io.BytesIO(b'')
-        unpickler = _RestrictedUnpickler(buf)
-        with pytest.raises(pickle.UnpicklingError, match='Restricted unpickler refused'):
-            unpickler.find_class('builtins', 'eval')
-
-    def test_space_groups_loaded_successfully(self):
-        """The SPACE_GROUPS constant should be a non-empty dict."""
-        from easydiffraction.crystallography.space_groups import SPACE_GROUPS
-
-        assert isinstance(SPACE_GROUPS, dict)
-        assert len(SPACE_GROUPS) > 0
+"""Coverage tests for space_groups.py: query-surface parity and IT spot-checks."""
+
+from cryspy.A_functions_base.function_2_space_group import ACCESIBLE_NAME_HM_SHORT
+from cryspy.A_functions_base.function_2_space_group import (
+    get_it_coordinate_system_codes_by_it_number,
+)
+from cryspy.A_functions_base.function_2_space_group import get_it_number_by_name_hm_short
+
+from easydiffraction.crystallography.space_groups import SPACE_GROUPS
+
+
+def _multiplicities(it_number: int, coord_code):
+    """Map each Wyckoff letter of one setting to its multiplicity."""
+    positions = SPACE_GROUPS[it_number, coord_code]['Wyckoff_positions']
+    return {
+        letter: entry['multiplicity'] for letter, entry in positions.items()
+    }
+
+
+def test_every_cryspy_coordinate_code_resolves():
+    """Every (IT number, coordinate code) reachable via cryspy is a database key.
+
+    Iterates ``ACCESIBLE_NAME_HM_SHORT``; names without an IT number are skipped.
+    """
+    absent = set()
+    for name_hm in ACCESIBLE_NAME_HM_SHORT:
+        it_number = get_it_number_by_name_hm_short(name_hm)
+        if it_number is None:
+            continue
+        # Mirrors SpaceGroup's ``codes or ['']``; '' is looked up under the None key.
+        codes = get_it_coordinate_system_codes_by_it_number(it_number)
+        for code in codes or ['']:
+            key = (it_number, None if code == '' else code)
+            if key not in SPACE_GROUPS:
+                absent.add(key)
+    assert not absent, f'coordinate codes absent from SPACE_GROUPS: {sorted(absent)}'
+
+
+def test_hm_short_symbol_resolves_to_present_it_number():
+    """Each short H-M symbol that cryspy resolves yields an IT number in the DB."""
+    known_it_numbers = {it_number for it_number, _ in SPACE_GROUPS}
+    for symbol in ACCESIBLE_NAME_HM_SHORT:
+        resolved = get_it_number_by_name_hm_short(symbol)
+        # Symbols that resolve to ``None`` are skipped rather than failed.
+        if resolved is not None:
+            assert resolved in known_it_numbers, symbol
+
+
+def test_spot_check_multiplicities_against_international_tables():
+    """Representative settings carry the Wyckoff multiplicities listed in IT."""
+    reference = {
+        (14, 'b1'): {'a': 2, 'b': 2, 'c': 2, 'd': 2, 'e': 4},  # P2_1/c
+        (75, '1'): {'a': 1, 'b': 1, 'c': 2, 'd': 4},  # P4
+        (143, 'h'): {'a': 1, 'b': 1, 'c': 1, 'd': 3},  # P3
+        (168, 'h'): {'a': 1, 'b': 2, 'c': 3, 'd': 6},  # P6
+        (200, '1'): {  # Pm-3
+            'a': 1,
+            'b': 1,
+            'c': 3,
+            'd': 3,
+            'e': 6,
+            'f': 6,
+            'g': 6,
+            'h': 6,
+            'i': 8,
+            'j': 12,
+            'k': 12,
+            'l': 24,
+        },
+    }
+    for setting, multiplicities in reference.items():
+        assert _multiplicities(*setting) == multiplicities, setting
+
+
+def test_origin_choice_settings_share_multiplicities_but_differ_in_coordinates():
+    """Fd-3m (227) origin choices share multiplicities; the origin shift moves site 'c'."""
+    choice_1, choice_2 = (227, '1'), (227, '2')
+    assert choice_1 in SPACE_GROUPS
+    assert choice_2 in SPACE_GROUPS
+    assert _multiplicities(*choice_1) == _multiplicities(*choice_2)
+    site_c_1 = SPACE_GROUPS[choice_1]['Wyckoff_positions']['c']['coords_xyz'][0]
+    site_c_2 = SPACE_GROUPS[choice_2]['Wyckoff_positions']['c']['coords_xyz'][0]
+    assert site_c_1 != site_c_2
diff --git a/tests/unit/easydiffraction/display/plotters/test_plotly.py b/tests/unit/easydiffraction/display/plotters/test_plotly.py
index 812ec9157..17faf6381 100644
--- a/tests/unit/easydiffraction/display/plotters/test_plotly.py
+++ b/tests/unit/easydiffraction/display/plotters/test_plotly.py
@@ -611,11 +611,17 @@ def fake_show_figure(self, fig):
         2 * pp.PlotlyPlotter._bragg_tick_symbol_height_pixels()
     )
 
+    # Each line is wrapped in a colored span and padded left/right with the
+    # shared non-breaking space (see PlotlyPlotter._format_hover_lines).
+    pad = pp.HOVER_HORIZONTAL_PAD
+    meas_span = '<span style="color:rgb(31,119,180)">Imeas: %{customdata[0]:,.2f}</span>'
+    calc_span = '<span style="color:rgb(214,39,40)">Icalc: %{customdata[1]:,.2f}</span>'
+    resid_span = '<span style="color:rgb(44,160,44)">Imeas - Icalc: %{customdata[2]:,.2f}</span>'
     expected_hovertemplate = (
-        'x: %{x:,.2f}<br>'
-        'Imeas: %{customdata[0]:,.2f}<br>'
-        'Icalc: %{customdata[1]:,.2f}<br>'
-        'Imeas - Icalc: %{customdata[2]:,.2f}'
+        f'{pad}x: %{{x:,.2f}}{pad}<br>'
+        f'{pad}{meas_span}{pad}<br>'
+        f'{pad}{calc_span}{pad}<br>'
+        f'{pad}{resid_span}{pad}'
         '<extra></extra>'
     )
     meas_trace = next(trace for trace in fig.data if trace.name == 'Measured (Imeas)')
diff --git a/tests/unit/easydiffraction/display/tablers/test_base.py b/tests/unit/easydiffraction/display/tablers/test_base.py
index 2402a6bb9..d5ddcf68b 100644
--- a/tests/unit/easydiffraction/display/tablers/test_base.py
+++ b/tests/unit/easydiffraction/display/tablers/test_base.py
@@ -40,6 +40,17 @@ def test_is_dark_theme_outside_jupyter(self):
         # Outside Jupyter, default is True
         assert backend._is_dark_theme() is True
 
+    def test_is_dark_theme_without_ipython_installed(self, monkeypatch):
+        """Regression: the dark-theme check tolerates IPython being absent.
+
+        Simulates the failed optional import by rebinding ``get_ipython`` to None.
+        """
+        import easydiffraction.display.tablers.base as base_module
+        from easydiffraction.display.tablers.rich import RichTableBackend
+
+        monkeypatch.setattr(base_module, 'get_ipython', None)
+        assert RichTableBackend()._is_dark_theme() is True
+
     def test_rich_border_color_property(self):
         from easydiffraction.display.tablers.rich import RichTableBackend
 
diff --git a/tools/check_packaged_db.py b/tools/check_packaged_db.py
new file mode 100644
index 000000000..d0bac73bd
--- /dev/null
+++ b/tools/check_packaged_db.py
@@ -0,0 +1,69 @@
+# SPDX-FileCopyrightText: 2025 EasyScience contributors <https://github.com/easyscience>
+# SPDX-License-Identifier: BSD-3-Clause
+"""Packaging regression for the bundled space-group database.
+
+Inspects a built wheel (not an installed package) so the check is independent
+of the project's full dependency tree: it opens the wheel, reads
+``space_groups.json.gz`` straight from it, and asserts the data is shipped as
+package data, that the obsolete ``space_groups.pkl.gz`` is gone, and that the
+archive covers all 230 IT groups plus the cryspy coordinate-code alias surface.
+Exits non-zero on any problem so a packaging regression fails the caller.
+
+Usage: ``python tools/check_packaged_db.py [path/to/wheel]`` (defaults to the
+newest wheel in ``dist/``).
+"""
+
+from __future__ import annotations
+
+import gzip
+import json
+import sys
+import zipfile
+from pathlib import Path
+
+_DATA_MEMBER = 'easydiffraction/crystallography/space_groups.json.gz'
+_OBSOLETE_MEMBER = 'easydiffraction/crystallography/space_groups.pkl.gz'
+_REQUIRED_KEYS = [(14, '-b1'), (3, '-a1'), (1, None)]
+# Accepted seed record count (see the space-group-database ADR provenance).
+_EXPECTED_RECORD_COUNT = 816
+
+
+def _wheel_path(argv: list[str]) -> Path:
+    """Return ``argv[1]``, else the last-modified wheel in ``dist/`` (exit if none)."""
+    if len(argv) > 1:
+        return Path(argv[1])
+    if wheels := list(Path('dist').glob('*.whl')):  # mtime, not name: '0.10.0' < '0.9.0'
+        return max(wheels, key=lambda wheel: (wheel.stat().st_mtime, wheel.name))
+    sys.exit('no wheel found in dist/; build one with `pixi run dist-build`')
+
+
+def main(argv: list[str]) -> None:
+    """Check the space-group database shipped in a wheel; exit with an error on failure."""
+    wheel = _wheel_path(argv)
+    with zipfile.ZipFile(wheel) as archive:
+        shipped = set(archive.namelist())
+        if _DATA_MEMBER not in shipped:
+            sys.exit(f'{wheel.name} does not ship {_DATA_MEMBER}')
+        if _OBSOLETE_MEMBER in shipped:
+            sys.exit(f'{wheel.name} still ships obsolete {_OBSOLETE_MEMBER}')
+        records = json.loads(gzip.decompress(archive.read(_DATA_MEMBER)).decode('utf-8'))
+
+    keys = {(entry['IT_number'], entry['IT_coordinate_system_code']) for entry in records}
+    it_numbers = {it_number for it_number, _ in keys}
+    absent_groups = sorted(set(range(1, 231)) - it_numbers)
+    if absent_groups:
+        sys.exit(f'packaged database missing IT numbers: {absent_groups}')
+    absent_keys = [key for key in _REQUIRED_KEYS if key not in keys]
+    if absent_keys:
+        sys.exit(f'packaged database missing expected keys: {absent_keys}')
+    # The set of keys collapses duplicates, so both counts are compared.
+    if len(records) != _EXPECTED_RECORD_COUNT:
+        sys.exit(f'packaged database has {len(records)} records, expected {_EXPECTED_RECORD_COUNT}')
+    if len(keys) != _EXPECTED_RECORD_COUNT:
+        sys.exit(f'packaged database has {len(keys)} unique keys, expected {_EXPECTED_RECORD_COUNT}')
+
+    print(f'packaged DB OK in {wheel.name}: {len(it_numbers)} IT groups, {len(records)} settings')
+
+
+if __name__ == '__main__':
+    main(sys.argv)