diff --git a/.env.example b/.env.example
index 7d49f5b9..38ef75b4 100644
--- a/.env.example
+++ b/.env.example
@@ -126,5 +126,15 @@ BATCH_GLOBAL_MAX_PARALLEL=4
 # mid-call, so a long fit can stall the drain.
 BATCH_CANCEL_DRAIN_TIMEOUT_SECONDS=30
 
+# Model selection (champion selector) async runner (Slice B)
+# Hard upper bound on concurrent candidate backtests across all active selection
+# runs on this host. Effective parallelism per run is min(this, candidates).
+# Set to 1 for sequential execution. Requires uvicorn restart to apply.
+MODEL_SELECTION_GLOBAL_MAX_PARALLEL=4
+# Max seconds DELETE /model-selection/{id} waits for in-flight candidates to
+# drain before returning RFC 7807 504. sklearn / LightGBM fits are uncancellable
+# mid-call, so a long fit can stall the drain.
+MODEL_SELECTION_CANCEL_DRAIN_TIMEOUT_SECONDS=30
+
 # Frontend (Vite)
 VITE_API_BASE_URL=http://localhost:8123
diff --git a/PRPs/ai_docs/forecast-champion-selector-backend-research.md b/PRPs/ai_docs/forecast-champion-selector-backend-research.md
new file mode 100644
index 00000000..2d37603b
--- /dev/null
+++ b/PRPs/ai_docs/forecast-champion-selector-backend-research.md
@@ -0,0 +1,222 @@
+# Forecast Champion Selector Backend Research
+
+Date: 2026-06-01
+
+This note captures external-library and runtime facts used by
+`PRPs/forecast-champion-selector-backend.md`. It is intentionally narrow:
+only claims that affect backend implementation are recorded here.
+
+## Official Documentation References
+
+- FastAPI APIRouter / multi-file apps:
+  https://fastapi.tiangolo.com/tutorial/bigger-applications/
+  - Reason: the new `app/features/model_selection/routes.py` must follow the
+    existing `APIRouter(prefix=..., tags=...)` slice pattern and be wired in
+    `app/main.py`.
+
+- Pydantic v2 strict mode and field-level overrides:
+  https://pydantic.dev/docs/validation/latest/concepts/strict_mode/
+  - Reason: ForecastLabAI request schemas use `ConfigDict(strict=True)`, but
+    JSON request bodies still need date/datetime/UUID/Decimal fields to accept
+    JSON-native strings via `Field(strict=False, ...)`.
+
+- SQLAlchemy 2.0 PostgreSQL JSONB:
+  https://docs.sqlalchemy.org/en/20/dialects/postgresql.html#json-types
+  - Reason: `model_selection_run` should store immutable request/response
+    snapshots (`candidate_models`, `ranking_result`, `winner_metrics`,
+    `forecast_result`, `business_summary`) as PostgreSQL JSONB.
+
+- Alembic `Operations.create_index`:
+  https://alembic.sqlalchemy.org/en/latest/ops.html#alembic.operations.Operations.create_index
+  - Reason: the migration should use explicit named indexes; any partial or
+    JSONB index must use Alembic operations rather than raw SQL.
+
+- scikit-learn `TimeSeriesSplit`:
+  https://scikit-learn.org/stable/modules/generated/sklearn.model_selection.TimeSeriesSplit.html
+  - Reason: the selector's recommended split defaults mirror the project's
+    own `SplitConfig` semantics and should not assume unsupported parameters.
+
+## Runtime Verification Commands
+
+Run from repository root on 2026-06-01.
+
+```bash
+uv run python -c "import inspect; from sqlalchemy import select, table, column; import sqlalchemy; stmt=select(column('id')).select_from(table('t')).with_for_update(skip_locked=True); print('sqlalchemy', sqlalchemy.__version__); print('with_for_update_has_skip_locked', 'skip_locked' in str(inspect.signature(select(column('id')).with_for_update))); print(stmt)"
+```
+
+Observed:
+
+```text
+sqlalchemy 2.0.46
+with_for_update_has_skip_locked True
+SELECT id
+FROM t FOR UPDATE
+```
+
+Note: generic SQL compilation does not render PostgreSQL-specific
+`SKIP LOCKED`; use PostgreSQL dialect compilation in tests when asserting
+that string.
+
+```bash
+uv run python -c "from datetime import date; import pydantic; from pydantic import BaseModel, ConfigDict, Field; M=type('M',(BaseModel,),{'__annotations__':{'d':date},'model_config':ConfigDict(strict=True),'d':Field(strict=False)}); print('pydantic', pydantic.__version__); print(M.model_validate({'d':'2026-06-01'}).d.isoformat())"
+```
+
+Observed:
+
+```text
+pydantic 2.12.5
+2026-06-01
+```
+
+```bash
+uv run python -c "import inspect, sklearn; from sklearn.model_selection import TimeSeriesSplit; print('sklearn', sklearn.__version__); print(inspect.signature(TimeSeriesSplit)); t=TimeSeriesSplit(n_splits=3, test_size=2, gap=1); print(t)"
+```
+
+Observed:
+
+```text
+sklearn 1.8.0
+(n_splits=5, *, max_train_size=None, test_size=None, gap=0)
+TimeSeriesSplit(gap=1, max_train_size=None, n_splits=3, test_size=2)
+```
+
+```bash
+uv run python -c "import inspect, fastapi; from fastapi import APIRouter, BackgroundTasks; print('fastapi', fastapi.__version__); print('APIRouter_prefix_param', 'prefix' in inspect.signature(APIRouter).parameters); print('BackgroundTasks_add_task', inspect.signature(BackgroundTasks.add_task))"
+```
+
+Observed:
+
+```text
+fastapi 0.128.0
+APIRouter_prefix_param True
+BackgroundTasks_add_task (self, func: ..., *args: P.args, **kwargs: P.kwargs) -> None
+```
+
+```bash
+uv run python -c "import inspect, alembic; from alembic.operations import Operations; print('alembic', alembic.__version__); print(inspect.signature(Operations.create_index))"
+```
+
+Observed:
+
+```text
+alembic 1.18.4
+(self, index_name, table_name, columns, *, schema=None, unique=False, if_not_exists=None, **kw) -> None
+```
+
+## Implementation Consequences
+
+- Use `Literal[...]` request fields for JSON string enums under
+  `ConfigDict(strict=True)`; convert to ORM enums at service boundaries.
+- Use `Field(strict=False, ...)` on every request-body date/datetime/UUID/
+  Decimal field, or `app/core/tests/test_strict_mode_policy.py` can fail.
+- Persist selector decisions in JSONB snapshots because registry metrics are
+  free-form JSONB and metric key names differ across layers.
+- Do not assume a batch backtest item contains fold-level chart data. Batch
+  metrics are intentionally pinned to `{wape, smape, mae, bias, sample_size}`.
+- If an implementation compiles SQL for PostgreSQL-specific clauses, compile
+  with the PostgreSQL dialect rather than relying on generic SQL strings.
+
+## Verified Internal Service Contracts (read from source 2026-06-01)
+
+These are the in-repo signatures the selector orchestrates. They were the prior
+draft's #1 residual risk; recorded here so they survive and can be re-verified on
+refactor. Re-verify with `grep -n "async def run_backtest\|async def train_model\|async def predict" app/features/backtesting/service.py app/features/forecasting/service.py`.
+
+### BacktestingService — `app/features/backtesting/service.py:213`
+
+```python
+# __init__(self) -> None  — takes NO db; instantiate as BacktestingService()
+async def run_backtest(
+    self, db: AsyncSession, store_id: int, product_id: int,
+    start_date: date, end_date: date, config: BacktestConfig,
+) -> BacktestResponse
+```
+
+`BacktestConfig` (`backtesting/schemas.py:81`, `frozen=True, extra="forbid"`):
+`split_config: SplitConfig`, `model_config_main: Annotated[ModelConfig, Field(discriminator="model_type")]`,
+`include_baselines: bool = True`, `store_fold_details: bool = True`.
+
+`SplitConfig` (`:24`): `strategy: Literal["expanding","sliding"]="expanding"`,
+`n_splits: int=5 (ge=2,le=20)`, `min_train_size: int=30 (ge=7)`, `gap: int=0 (ge=0,le=30)`,
+`horizon: int=14 (ge=1,le=90)`; validator `horizon > gap`.
+
+### BacktestResponse — `backtesting/schemas.py:257`
+
+`main_model_results: ModelBacktestResult`, `baseline_results: list[ModelBacktestResult] | None`,
+plus `backtest_id, store_id, product_id, config_hash, split_config, comparison_summary,
+duration_ms, leakage_check_passed`.
+
+`ModelBacktestResult` (`:180`): `model_type, config_hash, fold_results: list[FoldResult],
+aggregated_metrics: dict[str,float], metric_std: dict[str,float],
+bucketed_aggregated_metrics: dict|None, feature_aware: bool, exogenous_policy`.
+
+`FoldResult` (`:147`): `fold_index, split, dates: list[date], actuals: list[float],
+predictions: list[float], metrics: dict[str,float], horizon_bucket_metrics`.
+
+**Metric keys (CORRECTION to the prior draft):** `aggregated_metrics` has **five** keys —
+`{"mae", "rmse", "smape", "wape", "bias"}` (`backtesting/metrics.py:347`; PRP-36 added `rmse`).
+`metric_std` keys are suffixed `"{name}_stability"` (a coefficient of variation, not a raw std).
+`sample_size` is NOT in `aggregated_metrics` — derive from fold actuals length or n_folds.
+Fold chart data path: `main_model_results.fold_results[i].{dates,actuals,predictions}` — populated
+only when `config.store_fold_details=True`.
+
+### ForecastingService — `app/features/forecasting/service.py`
+
+```python
+# __init__(self) -> None
+async def train_model(                                            # :247
+    self, db: AsyncSession, store_id: int, product_id: int,
+    train_start_date: date, train_end_date: date, config: ModelConfig,
+    *, feature_frame_version: int = 1, feature_groups: list[str] | None = None,
+) -> TrainResponse                                                # TrainResponse.model_path is the artifact path
+
+async def predict(                                                # :402  — NO db arg
+    self, store_id: int, product_id: int, horizon: int, model_path: str,
+) -> PredictResponse                                              # PredictResponse.forecasts: list[ForecastPoint]
+```
+
+`predict()` rejects feature-aware models (`service.py:491`) — feature-aware winners must route
+through `/scenarios/simulate`; catch and warn rather than 500.
+
+### ModelConfig union — `forecasting/schemas.py:417`
+
+Plain PEP 604 union (`NaiveModelConfig | SeasonalNaiveModelConfig | … | ProphetLikeModelConfig`),
+discriminated by each member's `model_type` Literal. Members are **flat** (`SeasonalNaiveModelConfig`
+has `model_type` + `season_length`, NOT a nested `params`). No module-level `TypeAdapter`/helper.
+Build from `{"model_type": ..., "params": {...}}` by FLATTENING:
+
+```python
+from pydantic import TypeAdapter
+from app.features.forecasting.schemas import ModelConfig
+TypeAdapter(ModelConfig).validate_python({"model_type": c.model_type, **c.params})
+```
+
+Members are `frozen=True, extra="forbid"` → bad params raise `ValidationError` (treat as a failed
+candidate). `model_type` values: `naive, seasonal_naive, moving_average, weighted_moving_average,
+seasonal_average, trend_regression_baseline, random_forest, lightgbm, xgboost, regression,
+prophet_like` (`lightgbm`/`xgboost` are opt-in extras → may `ImportError`).
+
+### Data-platform ORM column names — `data_platform/models.py`
+
+`Store` (`:40`): `id` (int PK), `code` (business key — NOT `store_code`). `Product` (`:68`): `id`,
+`sku`, `launch_date: date|None`. `SalesDaily` (`:172`): `date` (FK calendar.date), `store_id`,
+`product_id`, `quantity` (Integer, CHECK ≥0), `unit_price`, `total_amount`; grain unique
+`(date, store_id, product_id)`. `Promotion` (`:274`): `product_id` NOT NULL, `store_id` NULLABLE
+(NULL = chain-wide, applies to all stores), date RANGE `[start_date, end_date]`,
+`kind ∈ {pct_off,bogo,bundle,markdown}`.
+
+### Cross-cutting patterns
+
+- Exceptions (`app/core/exceptions.py`): `BadRequestError`(400), `NotFoundError`(404),
+  `DatabaseError`(500), `ConflictError`(409), `UnprocessableEntityError`(422); each
+  `(message=..., details=None)`. Routes map `ValueError→BadRequestError`,
+  `SQLAlchemyError→DatabaseError` (mirror `backtesting/routes.py:60`).
+- `validate_date_range` is slice-local in `analytics/routes.py:36` (raises `BadRequestError`,
+  inverted-range + 730-day-max) — NOT importable cross-slice; reimplement locally.
+- `TimestampMixin` (`app/shared/models.py`): `created_at`/`updated_at`, `server_default func.now()`,
+  `updated_at onupdate func.now()`. Mix in first: `class X(TimestampMixin, Base)`.
+- JSONB import differs: migration `from sqlalchemy.dialects import postgresql` →
+  `postgresql.JSONB(astext_type=sa.Text())`; ORM `from sqlalchemy.dialects.postgresql import JSONB`.
+- `app/main.py` wires routers as `from app.features.<slice>.routes import router as <slice>_router`
+  + `app.include_router(<slice>_router)` (NO prefix at include; the router carries it).
+- Current alembic head observed: `c1d2e3f40512` (`create_batch_tables`).
diff --git a/PRPs/forecast-champion-selector-backend.md b/PRPs/forecast-champion-selector-backend.md
new file mode 100644
index 00000000..651fc009
--- /dev/null
+++ b/PRPs/forecast-champion-selector-backend.md
@@ -0,0 +1,970 @@
+name: "Forecast Champion Selector Backend"
+description: |
+  Backend foundation for an interactive Forecast Champion Selector. Adds a
+  first-class `model_selection` vertical slice that validates a store/product
+  pair, recommends/selects backtest settings, runs candidate model comparison,
+  ranks results by WAPE/sMAPE/bias/MAE, persists an auditable selection record,
+  and optionally trains/predicts with the winning model. This PRP deliberately
+  scopes UI work out; it creates the stable backend contract the UI can consume.
+
+**Created:** 2026-06-01 · **Refined:** 2026-06-01 (signatures verified against live code)
+**Current repo base observed:** `dev` at `1b4c3f3` (`Merge pull request #352 ...fix/agents-finalizer-fallback`)
+**Current alembic head observed:** `c1d2e3f40512` (`create_batch_tables`) — verify with `uv run alembic heads` at implementation time and chain to whatever head exists THEN.
+**Working-tree caveat observed:** `docker-compose.lan.yml` is an untracked local dogfood override; do not commit it.
+**Tracking issue:** create before implementation, suggested title `feat(api): add forecast champion selector backend`.
+**Suggested branch:** `feat/forecast-champion-selector-backend` (off `dev`, per `.claude/rules/branch-naming.md`).
+**Commit scope:** `api` (cross-feature backend wiring + new slice + `app/main.py`) and `db` (migration). Every commit references the tracking issue.
+
+---
+
+## VALIDATE — Missing Backend Surface Check
+
+The lower-level primitives exist; the business workflow does not.
+
+### Reusable backend primitives already present (verified)
+
+- `POST /backtesting/run` → single store/product/model backtest with fold metrics,
+  aggregated metrics, optional baselines, bucketed horizon metrics, leakage status.
+  `app/features/backtesting/routes.py:24` (router), `:60` (handler).
+  **Service entry point is `BacktestingService().run_backtest(db, store_id, product_id, start_date, end_date, config)`** — see verified signature below.
+- `POST /forecasting/train` → trains one model; supports `feature_frame_version` (1|2) and
+  `feature_groups`. `app/features/forecasting/routes.py:25`. Service:
+  `ForecastingService().train_model(db, store_id, product_id, train_start_date, train_end_date, config, *, feature_frame_version=1, feature_groups=None) -> TrainResponse`.
+- `POST /forecasting/predict` → predicts from a saved bundle. Service:
+  `ForecastingService().predict(store_id, product_id, horizon, model_path) -> PredictResponse`
+  (**no db arg** — loads bundle from disk; rejects feature-aware models, `service.py:491`).
+- `POST /batch/forecasting` fan-out exists but pins metrics to five keys and does **not**
+  expose fold-level chart data — NOT suitable for this slice's chart payload.
+- `GET /dimensions/stores`, `GET /dimensions/products` provide dimension metadata.
+- `app/features/ops/service.py` is the canonical read-only cross-slice ORM aggregation precedent.
+
+### Backend pieces missing for the full feature
+
+- No `app/features/model_selection/` slice; no `POST /model-selection/run`; no persisted
+  `model_selection_run` table; no orchestration of pair-validation → candidate backtests →
+  ranking → optional final train → optional predict; no pair-availability endpoint; no
+  backend ranking/confidence policy; no deterministic business explanation layer; no
+  chart-ready comparison payload.
+- Batch/Job model allow-lists are narrower than forecasting's full `ModelConfig` union, and
+  job/batch training does not pass `feature_frame_version`/`feature_groups`. **Therefore this
+  slice calls the direct backtesting/forecasting services**, not batch/jobs.
+
+---
+
+## BRAINSTORM / RERANK — Chosen Scope
+
+Chosen: **Option A — Backend foundation only** (new `model_selection` slice: pair
+availability, candidate comparison, ranking/confidence, persisted audit, optional
+train/predict, chart-ready payload). It covers every backend gap the eventual UI needs,
+reuses mature primitives, creates a stable testable contract, and avoids frontend coupling.
+
+Non-goals (out of scope for this PRP):
+
+- No React page / shadcn UI / frontend routing.
+- No agent tool, no `agent_require_approval` entry, no agent mutation surface.
+- No alias auto-promotion (the selector may *recommend* a winner; alias mutation is a future
+  approval-gated PRP).
+- No batch model-zoo retrofit. Use direct services for the single selected pair.
+
+---
+
+## Goal
+
+**Feature Goal:** A backend-only Forecast Champion Selector vertical slice that, given one
+store/product pair + window + horizon + candidate models, validates data availability, runs
+comparable backtests for every candidate, deterministically ranks completed candidates,
+computes a recommendation confidence with reasons, persists an auditable selection run, and
+returns chart-ready comparison data plus optional final-model training and forecast output.
+
+**Deliverable:** `app/features/model_selection/` slice (`models.py`, `schemas.py`,
+`ranking.py`, `explanations.py`, `service.py`, `routes.py`, `tests/`) + one Alembic migration
+creating `model_selection_run`, wired in `app/main.py`.
+
+**Success Definition:** `POST /model-selection/run` with the default five candidates against
+a seeded pair returns HTTP 200 with a persisted `selection_id`, a non-empty deterministic
+`ranking`, a `winner`, a `recommendation_confidence`, and a `chart_data` payload; the row is
+retrievable by `GET /model-selection/{selection_id}`; all validation gates pass.
+
+## Why
+
+- Business users want to ask "which model should I use for this store/product?" without
+  manually coordinating `/backtesting/run`, `/forecasting/train`, `/forecasting/predict`.
+- The UI needs **one stable backend contract** rather than re-implementing ranking in TypeScript.
+- A persisted selection run makes the model choice auditable: which models competed, which
+  window, which policy, and why the winner won.
+- Keeps the single-host architecture intact — no queue, no cloud SDK, no new service.
+
+## What
+
+### New endpoints (all under `APIRouter(prefix="/model-selection", tags=["model-selection"])`)
+
+```http
+GET  /model-selection/availability?store_id=...&product_id=...&forecast_horizon=14
+POST /model-selection/run
+GET  /model-selection/{selection_id}
+GET  /model-selection/{selection_id}/ranking
+POST /model-selection/{selection_id}/train-winner
+POST /model-selection/{selection_id}/predict
+```
+
+### Core request shape (`POST /model-selection/run`)
+
+```json
+{
+  "store_id": 1,
+  "product_id": 1,
+  "selection_window": { "start_date": "2026-01-01", "end_date": "2026-05-31" },
+  "forecast_horizon": 14,
+  "ranking_metric": "wape",
+  "split_config": { "strategy": "expanding", "n_splits": 5, "min_train_size": 30, "gap": 0, "horizon": 14 },
+  "candidate_models": [
+    {"model_type": "naive", "params": {}},
+    {"model_type": "seasonal_naive", "params": {"season_length": 7}},
+    {"model_type": "moving_average", "params": {"window_size": 7}},
+    {"model_type": "regression", "params": {}},
+    {"model_type": "prophet_like", "params": {}}
+  ],
+  "feature_frame_version": 1,
+  "feature_groups": null,
+  "auto_train_winner": false,
+  "auto_predict": false
+}
+```
+
+### LOCKED decisions (these remove every "choose one and test" ambiguity in the prior draft)
+
+1. **HTTP status codes:** `POST /model-selection/run` → **200** (synchronous, returns the
+   full result, mirrors `/backtesting/run` which is `status.HTTP_200_OK`). All GETs → 200.
+   `train-winner` / `predict` → 200. (201 is *not* used; the row is an audit side-effect, the
+   response is the computed result. Tests lock 200.)
+2. **Availability gate:** if `availability.status == "unusable"`, **fail fast** — persist the
+   row as `status="failed"` with `error_message`, then raise `BadRequestError` (RFC 7807 **400**).
+   Nothing is ranked.
+3. **All-candidates-fail (availability OK but every backtest errored):** **do NOT raise.**
+   Persist `status="failed"`, `ranking_result` with the failed entries, `winner=null`, and
+   return **200** with the failed-status response. Rationale: the run was validly attempted and
+   is an auditable outcome, not a client error. (Distinguish from #2: #2 is "we never started".)
+4. **Per-candidate backtest config:** `BacktestConfig(split_config=req.split_config,
+   model_config_main=<ModelConfig>, include_baselines=False, store_fold_details=True)`.
+   `include_baselines=False` because each candidate is itself a `model_config_main` run — we do
+   not want N redundant baseline runs. `store_fold_details=True` so fold chart data is populated.
+5. **`split_config.horizon` MUST equal `forecast_horizon`** (model-validator on the request).
+   The window dates from `selection_window` become `run_backtest`'s `start_date`/`end_date`.
+6. **Ranking determinism:** primary = `ranking_metric` (default `"wape"`), then the fixed
+   tie-break chain `wape → smape → abs(bias) → mae → model_type`. With the default, the sort key
+   is exactly `(wape, smape, abs(bias), mae, model_type)` (success-criteria order). A non-default
+   `ranking_metric` puts that metric first, remaining chain follows excluding the duplicate.
+7. **`auto_predict=True` requires `auto_train_winner=True`** (request model-validator) — predict
+   needs a freshly trained `final_model.model_path` from this run.
+
+### Success Criteria
+
+- [ ] `app/features/model_selection/` slice exists and is wired in `app/main.py`.
+- [ ] `POST /model-selection/run` with the default five candidates returns a persisted
+      `status="completed"` (or `"partial"`) selection with `winner`, `ranking`, confidence, and `chart_data`.
+- [ ] `GET /model-selection/availability` returns: `first_sales_date`, `last_sales_date`,
+      `observed_days`, `expected_calendar_days`, `coverage_ratio`, `missing_days`,
+      `zero_sale_days`, `promotion_days` (or `null` + warning), `average_daily_demand`,
+      `status` ∈ `{ready, limited, unusable}`, and `recommended_split_config`.
+- [ ] Ranking is deterministic per LOCKED decision #6.
+- [ ] Partial success supported (LOCKED #3): failed candidates appear in `ranking` with error
+      detail and are excluded from winner selection; a valid candidate still wins.
+- [ ] `auto_train_winner=True` stores `final_model.model_path` via the **direct**
+      `ForecastingService.train_model`, preserving `feature_frame_version` + `feature_groups`.
+- [ ] `auto_predict=True` (with train) returns forecast points + total/average demand summary.
+- [ ] New migration creates `model_selection_run` with JSONB snapshots and named indexes;
+      `downgrade` drops indexes then table cleanly.
+- [ ] `app/core/tests/test_strict_mode_policy.py` stays green for all new strict request schemas.
+- [ ] No agent tools / `agent_require_approval` entries; no frontend files; no cloud SDK.
+
+## All Needed Context
+
+### Documentation & References
+
+```yaml
+# PRP conventions
+- file: PRPs/templates/prp_base.md
+  why: Base template (Goal/Context/Blueprint/Validation). NOTE — the user referenced a
+       "PRPs/prp-readme.md.md"; it does NOT exist (`find PRPs -iname '*readme*'` empty on 2026-06-01).
+- file: PRPs/PRP-33-batch-runner-mvp.md
+  why: Strongest backend vertical-slice precedent — migration assertions, strict-mode gotchas,
+       route/test detail. Mirror its structure.
+- file: PRPs/PRP-28-forecast-explainability-driver-attribution.md
+  why: Read/composition-slice precedent consuming existing contracts; deterministic explanation layer.
+- docfile: PRPs/ai_docs/forecast-champion-selector-backend-research.md
+  why: External-lib + runtime verification (FastAPI APIRouter, Pydantic strict, JSONB, Alembic
+       create_index, sklearn TimeSeriesSplit). Versions: pydantic 2.12.5, sqlalchemy 2.0.46,
+       sklearn 1.8.0, fastapi 0.128.0, alembic 1.18.4.
+
+# Verified service contracts to reuse (DO NOT re-derive — exact signatures below in Gotchas)
+- file: app/features/backtesting/service.py
+  why: BacktestingService().run_backtest(db, store_id, product_id, start_date, end_date, config). :213
+- file: app/features/backtesting/schemas.py
+  why: SplitConfig :24, BacktestConfig :81, BacktestResponse :257, ModelBacktestResult :180,
+       FoldResult :147. aggregated_metrics keys = {mae,rmse,smape,wape,bias}.
+- file: app/features/backtesting/routes.py
+  why: EXACT route error-mapping pattern to mirror (try/except ValueError->BadRequestError,
+       SQLAlchemyError->DatabaseError; service instantiated as BacktestingService()). :60-140
+- file: app/features/forecasting/service.py
+  why: ForecastingService().train_model :247 (db first; feature_frame_version/feature_groups
+       keyword-only after *), predict :402 (NO db). Lazy cross-slice import precedent :55-61, :967.
+- file: app/features/forecasting/schemas.py
+  why: ModelConfig union :417-429 (flat members, model_type discriminator, NO module-level helper);
+       TrainResponse.model_path :540; PredictResponse.forecasts :605; ForecastPoint :574.
+- file: app/features/data_platform/models.py
+  why: Store :40 (business key `code`, not store_code), Product :68 (`sku`, `launch_date`),
+       SalesDaily :172 (date/store_id/product_id/quantity/unit_price/total_amount), Promotion :274.
+- file: app/features/ops/service.py
+  why: Read-only cross-slice ORM aggregation precedent — module-scope ORM-model imports, stateless
+       service, db: AsyncSession per method, func.min/max/count/sum + group_by style. :225, :456.
+- file: app/features/analytics/routes.py
+  why: validate_date_range :36 (raises BadRequestError, inverted-range + 730-day-max). CANNOT be
+       cross-slice imported — reimplement the two checks locally raising BadRequestError.
+- file: app/core/exceptions.py
+  why: BadRequestError(400) :152, NotFoundError(404) :64, DatabaseError(500) :108,
+       ConflictError(409) :130, UnprocessableEntityError(422) :174. Each: (message=..., details=None).
+- file: app/core/problem_details.py
+  why: RFC 7807 envelope; never raise bare HTTPException with raw strings.
+- file: app/core/config.py
+  why: get_settings() cached singleton :225; Settings(BaseSettings) :62; add a plain typed attr
+       with literal default; env var = UPPER_SNAKE of the field name.
+- file: app/core/database.py
+  why: Base (ORM declarative base) + get_db dependency used by routes/tests.
+- file: app/shared/models.py
+  why: TimestampMixin (created_at/updated_at, server_default func.now(), updated_at onupdate). Mix in first.
+- file: app/main.py
+  why: Router wiring — `from app.features.<slice>.routes import router as <slice>_router` (:18-26),
+       `app.include_router(<slice>_router)` with NO prefix at include (:137-155), inside create_app().
+- file: app/core/tests/test_strict_mode_policy.py
+  why: AST policy — scans app/features/*/schemas.py; any ConfigDict(strict=True) model field typed
+       date/datetime/time/UUID/Decimal (anywhere in the annotation) MUST carry Field(strict=False, ...).
+
+# Migration / test patterns
+- file: alembic/versions/c1d2e3f40512_create_batch_tables.py
+  why: JSONB via `from sqlalchemy.dialects import postgresql` -> postgresql.JSONB(astext_type=sa.Text());
+       named CheckConstraint; op.create_index (op.f for single-col, explicit name for composite);
+       sa.DateTime(timezone=True) server_default sa.text("now()"); downgrade drops indexes THEN table.
+- file: app/features/batch/models.py
+  why: ORM JSONB via `from sqlalchemy.dialects.postgresql import JSONB` (bare); Mapped[]+mapped_column;
+       status as String + default=Enum.PENDING.value + CheckConstraint in __table_args__; TimestampMixin.
+- file: app/features/batch/schemas.py
+  why: Strict request pattern — ConfigDict(strict=True), Literal[...] for JSON enums, Field(strict=False)
+       on date fields (:132-133), @model_validator cross-field checks.
+- file: app/features/explainability/tests/test_routes.py
+  why: ASGITransport + AsyncClient + app.dependency_overrides[get_db]; RFC 7807 4-key body assert; async tests.
+- file: app/features/explainability/tests/conftest.py
+  why: Integration fixture — real engine from get_settings().database_url, prefix-scoped teardown in finally.
+
+# External official docs (verified in research doc)
+- url: https://fastapi.tiangolo.com/tutorial/bigger-applications/
+  why: APIRouter prefix/tags multi-file pattern.
+- url: https://pydantic.dev/docs/validation/latest/concepts/strict_mode/
+  why: strict mode + field-level Field(strict=False) override (runtime-verified, pydantic 2.12.5).
+- url: https://docs.sqlalchemy.org/en/20/dialects/postgresql.html#json-types
+  why: JSONB column type for audit snapshots.
+- url: https://alembic.sqlalchemy.org/en/latest/ops.html#alembic.operations.Operations.create_index
+  why: create_index signature (alembic 1.18.4: index_name, table_name, columns, *, unique, **kw).
+- url: https://scikit-learn.org/stable/modules/generated/sklearn.model_selection.TimeSeriesSplit.html
+  why: split semantics (sklearn 1.8.0 signature: n_splits, *, max_train_size, test_size, gap).
+```
+
+### Current Codebase Tree (relevant slices)
+
+```bash
+app/features/
+├── analytics/       # KPI/drilldown/timeseries; validate_date_range lives in routes.py (slice-local)
+├── backtesting/     # single-pair single-model backtesting; fold/chart data via store_fold_details
+├── batch/           # batch fan-out; pinned 5-key metrics; NO fold chart data
+├── data_platform/   # shared ORM: Store, Product, SalesDaily, Promotion, InventorySnapshotDaily, ...
+├── dimensions/      # store/product discovery
+├── forecasting/     # direct train/predict; full ModelConfig union
+├── jobs/            # train/predict/backtest job orchestration
+├── ops/             # read-only cross-slice ORM aggregation precedent (OpsService)
+└── registry/        # model runs, aliases, compare, artifact verify
+alembic/versions/    # current head: c1d2e3f40512 (create_batch_tables)
+```
+
+### Desired Codebase Tree
+
+```bash
+app/features/model_selection/
+├── __init__.py
+├── models.py            # ModelSelectionRun ORM + ModelSelectionStatus enum
+├── schemas.py           # strict request models + response models
+├── ranking.py           # PURE: normalize metrics, filter, rank, confidence
+├── explanations.py      # PURE: deterministic business summary + confidence_reasons
+├── service.py           # ModelSelectionService: availability + orchestration (lazy cross-slice imports)
+├── routes.py            # APIRouter(prefix="/model-selection")
+└── tests/
+    ├── __init__.py
+    ├── conftest.py
+    ├── test_models.py
+    ├── test_schemas.py
+    ├── test_ranking.py
+    ├── test_explanations.py
+    ├── test_service.py
+    ├── test_routes.py
+    └── test_routes_integration.py
+alembic/versions/<rev>_create_model_selection_run.py
+```
+
+### Known Gotchas & VERIFIED Library/Internal Contracts
+
+```python
+# ── VERIFIED INTERNAL SIGNATURES (exact, read 2026-06-01) ─────────────────────
+# BacktestingService.__init__(self) -> None      # takes NO db; instantiate as BacktestingService()
+# await BacktestingService().run_backtest(
+#     db, store_id, product_id, start_date, end_date, config: BacktestConfig
+# ) -> BacktestResponse                            # service.py:213 ; db is FIRST arg
+#
+# ForecastingService.__init__(self) -> None
+# await ForecastingService().train_model(
+#     db, store_id, product_id, train_start_date, train_end_date, config: ModelConfig,
+#     *, feature_frame_version: int = 1, feature_groups: list[str] | None = None
+# ) -> TrainResponse                               # service.py:247 ; .model_path is the artifact path
+# await ForecastingService().predict(
+#     store_id, product_id, horizon, model_path     # NO db arg — loads bundle from disk
+# ) -> PredictResponse                              # service.py:402 ; .forecasts: list[ForecastPoint]
+#                                                   #   ForecastPoint: {date, forecast, lower_bound?, upper_bound?}
+#   GOTCHA: predict() REJECTS feature-aware models (service.py:491). For a feature-aware winner,
+#   auto_predict may raise; catch and surface a warning rather than failing the whole run.
+
+# ── METRIC KEYS — CORRECTED (draft was incomplete) ────────────────────────────
+# BacktestResponse.main_model_results.aggregated_metrics has FIVE keys:
+#   {"mae", "rmse", "smape", "wape", "bias"}        # metrics.py:347 — draft MISSED "rmse"
+# metric_std keys are SUFFIXED "{name}_stability" (a coefficient of variation, NOT raw std).
+# sample_size is NOT in aggregated_metrics — derive it from fold actuals length
+#   (sum of len(fold.actuals) across fold_results) or n_folds; normalize in ranking.py.
+# Fold chart data path: BacktestResponse.main_model_results.fold_results[i].{dates, actuals, predictions}
+#   populated ONLY when config.store_fold_details=True (LOCKED #4 sets it True).
+# bucketed_aggregated_metrics lives on each ModelBacktestResult (optional, may be None).
+
+# ── ModelConfig CONSTRUCTION — members are FLAT, no nested "params" ────────────
+# The request uses {"model_type": "seasonal_naive", "params": {"season_length": 7}} but the
+# ModelConfig members are FLAT (SeasonalNaiveModelConfig has model_type + season_length at top
+# level). There is NO module-level TypeAdapter/helper. Build at the service boundary by FLATTENING:
+#   from pydantic import TypeAdapter
+#   from app.features.forecasting.schemas import ModelConfig
+#   _MODEL_CONFIG_ADAPTER = TypeAdapter(ModelConfig)
+#   cfg = _MODEL_CONFIG_ADAPTER.validate_python({"model_type": c.model_type, **c.params})
+# Members are frozen + extra="forbid", so unknown params raise a ValidationError (good — surfaces
+# bad candidate params as a failed candidate with a reason). Do this import LAZILY in-method.
+# Valid model_type values (full union, forecasting/schemas.py:417): naive, seasonal_naive,
+#   moving_average, weighted_moving_average, seasonal_average, trend_regression_baseline,
+#   random_forest, lightgbm, xgboost, regression, prophet_like.
+#   (lightgbm/xgboost are opt-in extras — may ImportError at runtime; treat as a failed candidate.)
+
+# ── CROSS-SLICE IMPORT RULE ───────────────────────────────────────────────────
+# Vertical-slice rule: app/features/X must not import app/features/Y at MODULE scope when it
+# would close an alembic cold-boot cycle. model_selection is a NEW leaf (nothing imports it), but
+# to match the BatchService/forecasting precedent and stay safe, import the SERVICE CLASSES
+# (BacktestingService, ForecastingService) and the ModelConfig TypeAdapter LAZILY inside the
+# methods that use them. Read ORM models (Store/Product/SalesDaily/Promotion) at module scope —
+# that mirrors OpsService and is the sanctioned read-only ORM surface.
+
+# ── validate_date_range IS NOT IMPORTABLE ─────────────────────────────────────
+# It lives in app/features/analytics/routes.py (slice-local). Reimplement the two checks locally
+# (inverted range; max-span) raising app.core.exceptions.BadRequestError, OR rely on schema
+# validators. Do NOT import across the slice boundary.
+# NOTE: analytics' max-span is settings.analytics_max_date_range_days (configurable, ~730), not a
+#   hardcoded constant — pick your own local bound (or reuse the setting) when reimplementing.
+
+# ── STRICT-MODE POLICY (app/core/tests/test_strict_mode_policy.py) ────────────
+# Every request model with model_config = ConfigDict(strict=True) MUST add Field(strict=False, ...)
+# to EVERY field typed date|datetime|time|UUID|Decimal (incl. inside Optional/Annotated/list/dict).
+# Use Literal[...] for JSON enum strings (NOT a str-Enum — strict won't coerce). The AST walker does
+# NOT follow inheritance, so set ConfigDict(strict=True) on each concrete request model directly.
+
+# ── ORM / MIGRATION QUIRKS ────────────────────────────────────────────────────
+# JSONB import DIFFERS by layer:
+#   migration: from sqlalchemy.dialects import postgresql  ->  postgresql.JSONB(astext_type=sa.Text())
+#   ORM:       from sqlalchemy.dialects.postgresql import JSONB  ->  mapped_column(JSONB)
+# Status enum enforced via CheckConstraint("status IN (...)", name="ck_...") in BOTH migration and
+#   ORM __table_args__; ORM column is String(N) with default=ModelSelectionStatus.PENDING.value.
+# created_at/updated_at come from TimestampMixin (app/shared/models.py) — declare class as
+#   `class ModelSelectionRun(TimestampMixin, Base)` (mixin FIRST). Declare completed_at explicitly.
+# Migration down_revision: chain to the CURRENT head at implementation time (observed c1d2e3f40512);
+#   run `uv run alembic heads` to confirm — do NOT hardcode this PRP's observed value blindly.
+
+# ── DATA-PLATFORM COLUMN NAMES (availability aggregation) ─────────────────────
+# Store.id (int PK), Store.code (business key). Product.id, Product.sku, Product.launch_date (date|None).
+# SalesDaily: .date (Date FK calendar.date), .store_id, .product_id, .quantity (Integer, CHECK >=0),
+#   .unit_price (Numeric), .total_amount (Numeric). Grain unique (date, store_id, product_id).
+#   => For ONE pair: count(distinct date) == count(*); zero_sale_days = count where quantity == 0.
+# Promotion: per-product (product_id NOT NULL), store_id NULLABLE (NULL = CHAIN-WIDE, applies to all
+#   stores), date RANGE [start_date, end_date], kind in {pct_off,bogo,bundle,markdown}. To count
+#   promotion_days for (store, product) within the window, JOIN promotion to the pair's sales dates
+#   ON sd.date BETWEEN p.start_date AND p.end_date AND p.product_id=? AND (p.store_id=? OR p.store_id IS NULL),
+#   then COUNT(DISTINCT sd.date). If this proves complex/edge-casey, return promotion_days=None with a
+#   warning string (acceptable per Success Criteria) — do NOT sum (end-start) per row (double-counts overlaps).
+
+# ── RUNTIME-VERIFIED LIBRARY FACTS (research doc) ─────────────────────────────
+# Pydantic 2.12.5 accepts Field(strict=False) date string under a strict model. sklearn 1.8.0
+# TimeSeriesSplit(n_splits, *, max_train_size, test_size, gap). FastAPI 0.128.0 APIRouter(prefix=...).
+# Alembic 1.18.4 Operations.create_index(index_name, table_name, columns, *, unique, **kw).
+```
+
+## Implementation Blueprint
+
+### Data Models and Schemas
+
+`app/features/model_selection/models.py`:
+
+```python
+from datetime import date, datetime
+from enum import Enum
+from typing import Any
+
+from sqlalchemy import CheckConstraint, Date, DateTime, Index, Integer, String
+from sqlalchemy.dialects.postgresql import JSONB
+from sqlalchemy.orm import Mapped, mapped_column
+
+from app.core.database import Base
+from app.shared.models import TimestampMixin
+
+
+class ModelSelectionStatus(str, Enum):
+    PENDING = "pending"
+    RUNNING = "running"
+    COMPLETED = "completed"
+    PARTIAL = "partial"
+    FAILED = "failed"
+
+
+class ModelSelectionRun(TimestampMixin, Base):   # TimestampMixin FIRST → created_at/updated_at
+    __tablename__ = "model_selection_run"
+
+    id: Mapped[int] = mapped_column(Integer, primary_key=True)
+    selection_id: Mapped[str] = mapped_column(String(32), unique=True, index=True)
+    store_id: Mapped[int] = mapped_column(Integer, index=True)
+    product_id: Mapped[int] = mapped_column(Integer, index=True)
+    start_date: Mapped[date] = mapped_column(Date)
+    end_date: Mapped[date] = mapped_column(Date)
+    forecast_horizon: Mapped[int] = mapped_column(Integer)
+    ranking_metric: Mapped[str] = mapped_column(String(20))
+    status: Mapped[str] = mapped_column(String(20), default=ModelSelectionStatus.PENDING.value, index=True)
+    candidate_models: Mapped[list[dict[str, Any]]] = mapped_column(JSONB)
+    policy_snapshot: Mapped[dict[str, Any]] = mapped_column(JSONB)
+    availability_snapshot: Mapped[dict[str, Any] | None] = mapped_column(JSONB, nullable=True)
+    ranking_result: Mapped[dict[str, Any] | None] = mapped_column(JSONB, nullable=True)
+    winner_model_type: Mapped[str | None] = mapped_column(String(40), nullable=True)
+    winner_metrics: Mapped[dict[str, Any] | None] = mapped_column(JSONB, nullable=True)
+    final_model_path: Mapped[str | None] = mapped_column(String(512), nullable=True)
+    forecast_result: Mapped[dict[str, Any] | None] = mapped_column(JSONB, nullable=True)
+    business_summary: Mapped[dict[str, Any] | None] = mapped_column(JSONB, nullable=True)
+    error_message: Mapped[str | None] = mapped_column(String(2000), nullable=True)
+    completed_at: Mapped[datetime | None] = mapped_column(DateTime(timezone=True), nullable=True)
+
+    __table_args__ = (
+        CheckConstraint(
+            "status IN ('pending','running','completed','partial','failed')",
+            name="ck_model_selection_run_valid_status",
+        ),
+        Index("ix_model_selection_run_store_product_created", "store_id", "product_id", "created_at"),
+        Index("ix_model_selection_run_status_created", "status", "created_at"),
+    )
+```
+
+`app/features/model_selection/schemas.py` — strict request models + response models:
+
+- `SelectionWindow(start_date, end_date)` — `ConfigDict(strict=True)`, both dates `Field(strict=False, ...)`.
+- `CandidateModelConfig(model_type: Literal[<11 model_types>], params: dict[str, Any] = {})`.
+- `RankingPolicy(minimum_sample_size: int = 0, high_confidence_rel_improvement: float = 0.10,
+   max_acceptable_abs_bias: float = ...)` — defaults; snapshotted into `policy_snapshot`.
+- `ModelSelectionRunRequest` — `ConfigDict(strict=True)`; fields: `store_id`, `product_id`,
+  `selection_window`, `forecast_horizon` (int, ge=1, le=90), `ranking_metric: Literal["wape","smape","mae","bias"]="wape"`,
+  `split_config: SplitConfig` (reuse backtesting's? — see NOTE), `candidate_models: list` (min_length=1, max_length=10),
+  `feature_frame_version: int = 1` (ge=1, le=2), `feature_groups: list[str] | None = None`,
+  `ranking_policy: RankingPolicy = Field(default_factory=RankingPolicy)`,
+  `auto_train_winner: bool = False`, `auto_predict: bool = False`.
+  - `@model_validator(mode="after")`: `split_config.horizon == forecast_horizon` (LOCKED #5);
+    `auto_predict implies auto_train_winner` (LOCKED #7).
+  - NOTE on `split_config`: `backtesting.schemas.SplitConfig` is `frozen=True, extra="forbid"`
+    (NOT strict). Either (a) reuse it directly (import lazily is unnecessary for a schema type —
+    it's safe at module scope since backtesting.schemas has no cycle back to model_selection), or
+    (b) define a local `SplitSettings` mirror. **Prefer reusing `SplitConfig`** to avoid drift; it
+    already validates n_splits/min_train_size/gap/horizon. Since it is not strict-mode, its `date`-free
+    fields don't trip the strict-mode linter.
+**Response + intermediate models (plain `BaseModel` — outputs don't need `strict=True`). These
+fields ARE the stable contract the UI consumes; specify them exactly, do not improvise.**
+
+```python
+# ── intermediate (service-internal, also embedded in JSONB) ───────────────────
+class CandidateResult(BaseModel):            # what shape_candidate()/shape_failed_candidate() return
+    model_type: str
+    params: dict[str, Any]                   # ORIGINAL candidate params — REQUIRED so the winner can be rebuilt (pseudocode L667)
+    failed: bool
+    error: str | None = None                 # reason when failed=True
+    aggregated_metrics: dict[str, float] | None = None   # raw 5-key dict from backtest (mae,rmse,smape,wape,bias) or None
+    sample_size: int = 0                      # RULE: sum(len(fold.actuals)) across main_model_results.fold_results
+    config_hash: str | None = None
+    folds: list[FoldChart] = []              # per-fold chart points (empty when failed)
+
+class FoldChart(BaseModel):
+    fold_index: int
+    dates: list[date]
+    actuals: list[float]
+    predictions: list[float]
+
+class ModelRankEntry(BaseModel):             # one row in the ranking table (valid OR excluded)
+    rank: int | None                          # 1-based; None when excluded/failed
+    model_type: str
+    params: dict[str, Any]                    # carried through (see CandidateResult.params)
+    included: bool                            # False = failed or filtered out
+    exclusion_reason: str | None = None
+    metrics: dict[str, float] | None = None   # normalized {wape,smape,mae,rmse,bias,sample_size}
+
+class RankingResult(BaseModel):              # Pydantic (model_dump'd into ranking_result JSONB, L663)
+    winner: ModelRankEntry | None
+    entries: list[ModelRankEntry]             # ALL candidates, ranked-then-failed, never hidden
+    confidence: Literal["high", "medium", "low"]
+    reasons: list[str]
+
+class WinnerSummary(BaseModel):
+    model_type: str
+    params: dict[str, Any]
+    metrics: dict[str, float]                 # normalized winner metrics
+    rank: int                                 # always 1
+
+class ChartData(BaseModel):                  # chart-ready comparison payload (Success Criteria deliverable)
+    wape_by_model: dict[str, float]           # {model_type: wape}  → WAPE bar chart
+    bias_by_model: dict[str, float]           # {model_type: bias}  → bias chart
+    fold_stability: dict[str, list[float]]    # {model_type: per-fold wape}  → stability lines
+    winner_actual_vs_predicted: list[FoldChart]   # the WINNER's folds only → actual-vs-predicted overlay
+
+class PairAvailabilityResponse(BaseModel):
+    store_id: int
+    product_id: int
+    first_sales_date: date | None
+    last_sales_date: date | None
+    observed_days: int
+    expected_calendar_days: int
+    coverage_ratio: float
+    missing_days: int
+    zero_sale_days: int
+    promotion_days: int | None                # None + a warning when not safely derivable
+    average_daily_demand: float               # CAST float(...) — func.avg over Integer quantity returns Decimal
+    status: Literal["ready", "limited", "unusable"]
+    recommended_split_config: SplitConfig     # reuse backtesting.schemas.SplitConfig
+    warnings: list[str] = []
+
+class ForecastSummary(BaseModel):
+    points: list[dict[str, Any]]              # ForecastPoint.model_dump(mode="json") list
+    total_demand: float
+    average_demand: float
+    horizon: int
+
+class ModelSelectionRunResponse(BaseModel):  # THE /run + /{id} contract
+    selection_id: str
+    store_id: int
+    product_id: int
+    status: Literal["pending", "running", "completed", "partial", "failed"]
+    selection_window: SelectionWindow
+    forecast_horizon: int
+    ranking_metric: str
+    availability: PairAvailabilityResponse | None
+    ranking: list[ModelRankEntry]             # == RankingResult.entries
+    winner: WinnerSummary | None
+    recommendation_confidence: Literal["high", "medium", "low"] | None   # CANONICAL KEY (maps from RankingResult.confidence)
+    confidence_reasons: list[str]             # == RankingResult.reasons
+    chart_data: ChartData | None
+    final_model: dict[str, Any] | None        # {"model_path": ...} when auto_train_winner
+    forecast: ForecastSummary | None          # when auto_predict
+    business_summary: dict[str, Any] | None
+    error_message: str | None
+    created_at: datetime
+    completed_at: datetime | None
+
+class TrainWinnerResponse(BaseModel):
+    selection_id: str
+    model_type: str
+    model_path: str
+
+class PredictWinnerResponse(BaseModel):
+    selection_id: str
+    forecast: ForecastSummary
+```
+
+> **NAMING (resolves the only internal-consistency nit):** the response key is
+> **`recommendation_confidence`** (Success Criteria + manual probe + Goal all use it).
+> `RankingResult.confidence` is the service-internal field; `_response()` maps
+> `RankingResult.confidence → ModelSelectionRunResponse.recommendation_confidence` and
+> `RankingResult.reasons → confidence_reasons`. Tests assert the response key
+> `recommendation_confidence`.
+
+> **`self._response(row, ranking)` helper:** pure mapping `ModelSelectionRun` ORM row +
+> `RankingResult` → `ModelSelectionRunResponse` (rehydrate `availability_snapshot`/`ranking_result`/
+> `business_summary`/`forecast_result` JSONB back into the response models; build `chart_data` from
+> the per-candidate `CandidateResult.folds` + normalized metrics; map the confidence keys per above).
+
+### Implementation Tasks (dependency-ordered)
+
+```yaml
+Task 1 — Migration + ORM:
+  RUN: uv run alembic heads   # confirm current head (observed c1d2e3f40512)
+  CREATE alembic/versions/<rev>_create_model_selection_run.py:
+    - down_revision = "<current head>"
+    - MIRROR alembic/versions/c1d2e3f40512_create_batch_tables.py exactly:
+      - from sqlalchemy.dialects import postgresql  ->  postgresql.JSONB(astext_type=sa.Text())
+      - sa.DateTime(timezone=True), server_default=sa.text("now()") for created_at/updated_at
+      - CheckConstraint name="ck_model_selection_run_valid_status"
+      - op.create_index(op.f("ix_model_selection_run_selection_id"), ..., unique=True)
+      - op.create_index("ix_model_selection_run_store_product_created", ..., ["store_id","product_id","created_at"])
+      - op.create_index("ix_model_selection_run_status_created", ..., ["status","created_at"])
+      - downgrade(): drop indexes (reverse order) THEN op.drop_table("model_selection_run")
+  CREATE app/features/model_selection/models.py:   # as blueprint above; mirror batch/models.py
+
+Task 2 — Schemas:
+  CREATE app/features/model_selection/schemas.py:
+    - all REQUEST models ConfigDict(strict=True); date fields Field(strict=False, ...)
+    - Literal[...] for model_type + ranking_metric (NOT str-Enum)
+    - candidate_models min_length=1 max_length=10 (or settings.model_selection_max_candidates)
+    - @model_validator: horizon match (LOCKED #5) + auto_predict implies auto_train_winner (LOCKED #7)
+    - reuse backtesting.schemas.SplitConfig (module-scope import OK; no cycle)
+
+Task 3 — Ranking pure logic:
+  CREATE app/features/model_selection/ranking.py:
+    - NormalizedMetrics dataclass {wape, smape, mae, rmse, bias, sample_size}
+    - normalize_metrics(aggregated_metrics, sample_size) -> NormalizedMetrics | None
+        (None when the primary metric is missing OR NaN — use math.isnan guard; np.nan can appear,
+         metrics.py:381; keys are mae/rmse/smape/wape/bias)
+    - input: list[CandidateResult] (Task-2 schema). Each entry CARRIES model_type + params through to
+      ModelRankEntry/WinnerSummary so the winner can be rebuilt (pseudocode L667 reads winner.params).
+    - filter: not failed AND numeric primary metric AND sample_size >= policy.minimum_sample_size
+    - rank key (default ranking_metric="wape"): (wape, smape, abs(bias), mae, model_type)  [LOCKED #6]
+    - confidence (PIN the rel-improvement formula — denominator is the SECOND-place value):
+        rel_improvement = (second.wape - winner.wape) / second.wape   # guard second.wape == 0 → treat as 0.0
+        HIGH  : >=2 valid AND rel_improvement >= policy.high_confidence_rel_improvement (default 0.10)
+                AND abs(winner.bias) <= policy.max_acceptable_abs_bias AND winner.sample_size sufficient
+        MEDIUM: a valid winner exists but HIGH not met (narrow lead OR mild warnings) and >=2 valid
+        LOW   : exactly one valid candidate, OR availability "limited", OR abs(bias) over threshold,
+                OR rel_improvement < some near-tie epsilon (document the epsilon as a module constant)
+    - emit human-readable reasons[] strings explaining the chosen level (consumed as confidence_reasons)
+    - return RankingResult(winner, entries[ALL ranked-then-failed, never hidden], confidence, reasons)
+
+Task 4 — Business explanation pure logic:
+  CREATE app/features/model_selection/explanations.py:
+    - explain_winner(ranking, availability) -> business_summary dict + confidence_reasons + warnings
+    - translate WAPE/sMAPE/MAE/bias into short deterministic English; NO LLM, NO external call
+
+Task 5 — Pair availability:
+  CREATE ModelSelectionService.get_availability(db, store_id, product_id, forecast_horizon, split_config?) -> PairAvailabilityResponse:
+    - verify Store and Product exist (NotFoundError if absent) via data_platform ORM (module-scope import OK)
+    - aggregate SalesDaily for the pair (SQLAlchemy 2.0 async, mirror OpsService style):
+        select(func.min(SalesDaily.date), func.max(SalesDaily.date),
+               func.count(func.distinct(SalesDaily.date)), func.sum(SalesDaily.quantity),
+               func.avg(SalesDaily.quantity),
+               func.count().filter(SalesDaily.quantity == 0))   # FILTER aggregate; valid async idiom
+        .where(SalesDaily.store_id == store_id, SalesDaily.product_id == product_id)
+      # CAST: func.avg over Integer quantity returns Decimal; wrap average_daily_demand in float(...).
+      # func.count().filter(...) is a Postgres FILTER aggregate (not shown in OpsService, but supported);
+      #   alternatively a second scalar count with .where(quantity == 0). One round-trip is fine.
+    - expected_calendar_days = (max_date - min_date).days + 1
+    - coverage_ratio = observed_days / expected_calendar_days   (guard div-by-zero / no rows)
+    - missing_days = expected_calendar_days - observed_days
+    - promotion_days: JOIN promotion ON date BETWEEN start/end AND product_id match AND
+        (store_id == X OR store_id IS NULL); COUNT(DISTINCT date). On any doubt → None + warning.
+    - status (LOCKED thresholds):
+        ready    if observed_days >= min_train_size + horizon*n_splits AND coverage_ratio >= 0.8
+        limited  if observed_days >= min_train_size + horizon
+        unusable otherwise
+    - recommended_split_config: expanding, n_splits=min(5, feasible), min_train_size=30 (or adjusted),
+        gap=0, horizon=forecast_horizon
+    - NO rows for the pair -> status="unusable" with zeros/None and a warning
+
+Task 6 — Orchestration:
+  CREATE ModelSelectionService.run_selection(db, request) -> ModelSelectionRunResponse:
+    - persist ModelSelectionRun(selection_id=uuid4().hex, status="running", snapshots); flush
+    - availability = get_availability(...); persist snapshot
+    - if availability.status == "unusable": status="failed", error_message, flush, raise BadRequestError  [LOCKED #2]
+    - for each candidate (LAZY import services + ModelConfig adapter):
+        try: cfg = flatten+validate ModelConfig; bt = await BacktestingService().run_backtest(
+                 db, store_id, product_id, window.start, window.end,
+                 BacktestConfig(split_config=req.split_config, model_config_main=cfg,
+                                include_baselines=False, store_fold_details=True))
+             collect aggregated_metrics, sample_size, fold dates/actuals/predictions for chart
+        except Exception as exc: append failed entry with reason=str(exc)   [never hide — Anti-Patterns]
+    - ranking = rank_candidates(results, req.ranking_policy, req.ranking_metric)
+    - if ranking.winner is None: status="failed", persist ranking_result, flush, RETURN 200 response  [LOCKED #3]
+    - if req.auto_train_winner:
+        train = await ForecastingService().train_model(db, store_id, product_id, window.start, window.end,
+                    winner_cfg, feature_frame_version=req.feature_frame_version, feature_groups=req.feature_groups)
+        row.final_model_path = train.model_path
+    - if req.auto_predict:   # requires auto_train_winner (validated)
+        try: pred = await ForecastingService().predict(store_id, product_id, req.forecast_horizon, row.final_model_path)
+             row.forecast_result = pred.model_dump(mode="json")
+        except <feature-aware reject>: warning, leave forecast_result None
+    - business_summary = explain_winner(ranking, availability)
+    - status = "partial" if any candidate failed else "completed"; completed_at = datetime.now(UTC)
+    - persist all JSONB via model_dump(mode="json"); flush + refresh; return response_from_row(row)
+  ADD methods: get_selection(db, selection_id)->row|NotFoundError ; get_ranking ; train_winner ; predict_winner
+
+Task 7 — Routes:
+  CREATE app/features/model_selection/routes.py:
+    - router = APIRouter(prefix="/model-selection", tags=["model-selection"])
+    - GET /availability ; POST /run (200) ; GET /{selection_id} ; GET /{selection_id}/ranking ;
+      POST /{selection_id}/train-winner ; POST /{selection_id}/predict
+    - MIRROR backtesting/routes.py error mapping EXACTLY:
+        service instantiated locally; try/except ValueError->BadRequestError(str(e)),
+        SQLAlchemyError->DatabaseError("...", details={"error": str(e)}); NotFoundError from service bubbles.
+    - structured logger.info events (see Integration Points)
+  MODIFY app/main.py:
+    - `from app.features.model_selection.routes import router as model_selection_router`  (alpha order with siblings)
+    - `app.include_router(model_selection_router)`  inside create_app(), near backtesting/forecasting (NO prefix arg)
+
+Task 8 — Tests (see Validation Loop for required names):
+  CREATE app/features/model_selection/tests/{conftest,test_models,test_schemas,test_ranking,
+    test_explanations,test_service,test_routes,test_routes_integration}.py
+    - unit route tests: ASGITransport + app.dependency_overrides[get_db]=AsyncMock; 4-key RFC7807 assert
+    - service tests: mock BacktestingService/ForecastingService (patch the lazy import targets) for
+      happy/partial/all-fail/auto-train/auto-predict paths
+    - integration tests (@pytest.mark.integration): real engine, prefix-scoped teardown in finally
+```
+
+### Pseudocode (CRITICAL details only)
+
+```python
+# ranking.py — deterministic, pure
+def rank_candidates(results, policy, ranking_metric="wape"):
+    valid, failed = [], []
+    for r in results:
+        m = normalize_metrics(r.aggregated_metrics, r.sample_size)  # keys: mae,rmse,smape,wape,bias
+        if m is None or m.sample_size < policy.minimum_sample_size:
+            failed.append(r.as_failed("missing/NaN primary metric or sample_size below minimum"))
+            continue
+        valid.append((r, m))
+    if not valid:
+        return RankingResult(winner=None, entries=failed, confidence="low", reasons=["no valid candidate"])
+    primary = lambda m: getattr(m, ranking_metric) if ranking_metric != "bias" else abs(m.bias)
+    ordered = sorted(valid, key=lambda p: (primary(p[1]), p[1].smape, abs(p[1].bias), p[1].mae, p[0].model_type))
+    winner = ordered[0]
+    return build_ranking_result(ordered, failed, policy)   # computes confidence vs 2nd place
+```
+
+```python
+# service.py — orchestration (exact verified service calls)
+async def run_selection(self, db, req):
+    from pydantic import TypeAdapter                                  # lazy
+    from app.features.backtesting.schemas import BacktestConfig       # lazy
+    from app.features.backtesting.service import BacktestingService   # lazy
+    from app.features.forecasting.schemas import ModelConfig          # lazy
+    from app.features.forecasting.service import ForecastingService   # lazy
+    adapter = TypeAdapter(ModelConfig)
+
+    row = ModelSelectionRun(selection_id=uuid.uuid4().hex, status="running",
+                            store_id=req.store_id, product_id=req.product_id,
+                            start_date=req.selection_window.start_date, end_date=req.selection_window.end_date,
+                            forecast_horizon=req.forecast_horizon, ranking_metric=req.ranking_metric,
+                            candidate_models=[c.model_dump() for c in req.candidate_models],
+                            policy_snapshot=req.ranking_policy.model_dump(mode="json"))
+    db.add(row); await db.flush()
+
+    availability = await self.get_availability(db, req.store_id, req.product_id, req.forecast_horizon, req.split_config)
+    row.availability_snapshot = availability.model_dump(mode="json")
+    if availability.status == "unusable":
+        row.status = "failed"; row.error_message = "Insufficient data for model selection"
+        await db.flush(); raise BadRequestError(message=row.error_message)   # LOCKED #2
+
+    results = []
+    for c in req.candidate_models:
+        try:
+            cfg = adapter.validate_python({"model_type": c.model_type, **c.params})   # FLATTEN
+            bt = await BacktestingService().run_backtest(
+                db, req.store_id, req.product_id,
+                req.selection_window.start_date, req.selection_window.end_date,
+                BacktestConfig(split_config=req.split_config, model_config_main=cfg,
+                               include_baselines=False, store_fold_details=True))   # LOCKED #4
+            results.append(shape_candidate(c, bt))
+        except Exception as exc:
+            results.append(shape_failed_candidate(c, exc))
+
+    ranking = rank_candidates(results, req.ranking_policy, req.ranking_metric)
+    row.ranking_result = ranking.model_dump(mode="json")
+    if ranking.winner is None:
+        row.status = "failed"; await db.flush(); return self._response(row, ranking)   # LOCKED #3 (HTTP 200)
+
+    winner_cfg = adapter.validate_python({"model_type": ranking.winner.model_type, **ranking.winner.params})
+    if req.auto_train_winner:
+        train = await ForecastingService().train_model(
+            db, req.store_id, req.product_id, req.selection_window.start_date, req.selection_window.end_date,
+            winner_cfg, feature_frame_version=req.feature_frame_version, feature_groups=req.feature_groups)
+        row.final_model_path = train.model_path
+    if req.auto_predict and row.final_model_path:
+        try:
+            pred = await ForecastingService().predict(req.store_id, req.product_id, req.forecast_horizon, row.final_model_path)
+            row.forecast_result = pred.model_dump(mode="json")
+        except Exception as exc:   # e.g. feature-aware reject (forecasting service.py:491)
+            row.forecast_result = None  # surface a warning in business_summary
+
+    row.winner_model_type = ranking.winner.model_type
+    row.winner_metrics = ranking.winner.metrics
+    row.business_summary = explain_winner(ranking, availability)
+    row.status = "partial" if any(r.failed for r in results) else "completed"
+    row.completed_at = datetime.now(UTC)
+    await db.flush(); await db.refresh(row)
+    return self._response(row, ranking)
+```
+
+### Integration Points
+
+```yaml
+DATABASE:
+  - migration: add `model_selection_run` (JSONB snapshots: candidate_models, policy_snapshot,
+    availability_snapshot, ranking_result, winner_metrics, forecast_result, business_summary)
+  - indexes: ix_model_selection_run_selection_id (unique), ix_model_selection_run_store_product_created,
+    ix_model_selection_run_status_created
+ROUTES:
+  - app/main.py: import + app.include_router(model_selection_router)  (router carries its own prefix)
+CONFIG (optional — only if used; then ADD to .env.example with UPPER_SNAKE + a comment, and a test):
+  - model_selection_max_candidates: int = 10
+  - model_selection_min_coverage_ratio: float = 0.8
+  - model_selection_default_min_train_size: int = 30
+OBSERVABILITY (structlog events, mirror ops/backtesting naming):
+  - model_selection.run_received / .availability_checked / .candidate_completed /
+    .candidate_failed / .run_completed / .run_failed
+```
+
+## Validation Loop
+
+### Level 1 — Focused syntax & policy
+
+```bash
+uv run ruff check app/features/model_selection app/main.py alembic/versions
+uv run ruff format --check app/features/model_selection app/main.py alembic/versions
+uv run mypy app/features/model_selection app/main.py
+uv run pyright app/features/model_selection app/main.py
+uv run pytest app/core/tests/test_strict_mode_policy.py -v
+```
+
+### Level 2 — Focused unit tests
+
+```bash
+uv run pytest app/features/model_selection/tests -v -m "not integration"
+```
+
+Required test names:
+
+- `test_schema_accepts_iso_dates_under_strict_model` (JSON path: `Model.model_validate({"start_date":"2026-01-01",...})`)
+- `test_schema_rejects_auto_predict_without_train_winner`
+- `test_schema_rejects_horizon_mismatch_between_split_and_forecast`
+- `test_rank_candidates_wape_smape_abs_bias_mae_tie_break`
+- `test_rank_candidates_excludes_missing_or_nan_metrics`
+- `test_rank_candidates_normalizes_five_metric_keys_including_rmse`
+- `test_confidence_high_when_winner_beats_second_by_10_percent`
+- `test_availability_ready_limited_unusable_thresholds`
+- `test_build_model_config_flattens_params` (e.g. seasonal_naive + {"season_length":7})
+- `test_run_selection_partial_success_chooses_valid_winner`
+- `test_run_selection_all_candidates_fail_returns_failed_status_not_500` (LOCKED #3)
+- `test_run_selection_unusable_availability_raises_bad_request` (LOCKED #2)
+- `test_run_selection_auto_train_passes_feature_frame_version_and_groups`
+- `test_routes_return_problem_json_on_bad_request` (4-key RFC 7807 body)
+- `test_response_uses_recommendation_confidence_key` (NOT `confidence`; maps from `RankingResult.confidence`)
+- `test_winner_entry_carries_params_for_rebuild` (`ModelRankEntry.params` / `WinnerSummary.params` preserved)
+- `test_chart_data_has_wape_bias_fold_stability_and_winner_actual_vs_predicted`
+
+### Level 3 — Migration & integration
+
+```bash
+docker compose up -d
+uv run alembic upgrade head
+uv run pytest app/features/model_selection/tests -v -m integration
+uv run alembic downgrade -1 && uv run alembic upgrade head   # downgrade/upgrade round-trips cleanly
+```
+
+Integration expectations:
+
+- `model_selection_run` exists with the three named indexes.
+- `POST /model-selection/run` persists a row; `GET /model-selection/{selection_id}` returns the same id.
+- Availability detects an inserted pair with enough history (`ready`) and a too-short pair (`limited`/`unusable`).
+- Partial failure persists the failed candidate reason and still ranks a valid winner.
+
+### Level 4 — Full backend gates (must be green before PR)
+
+```bash
+uv run ruff check . && uv run ruff format --check .
+uv run mypy app/ && uv run pyright app/
+uv run pytest -v -m "not integration"
+uv run pytest -v -m integration
+```
+
+> Known-local-noise: mypy/pyright report pre-existing `lightgbm`/`xgboost` optional-dep import
+> errors in `forecasting/`+`registry/` (untouched here; CI installs the extras). Do not "fix" them.
+
+### Manual API probe (seeded DB; discover real store/product ids + date window first — IDs are
+not guaranteed 1-based, see memory `seeder-does-not-reset-id-sequences`)
+
+```bash
+uv run uvicorn app.main:app --port 8123 &
+curl -s "http://localhost:8123/model-selection/availability?store_id=5&product_id=8&forecast_horizon=14" | python3 -m json.tool
+curl -s -X POST http://localhost:8123/model-selection/run -H "Content-Type: application/json" -d '{
+  "store_id": 5, "product_id": 8,
+  "selection_window": {"start_date": "2026-01-01", "end_date": "2026-05-31"},
+  "forecast_horizon": 14,
+  "split_config": {"strategy":"expanding","n_splits":5,"min_train_size":30,"gap":0,"horizon":14},
+  "candidate_models": [
+    {"model_type":"naive","params":{}},
+    {"model_type":"seasonal_naive","params":{"season_length":7}},
+    {"model_type":"moving_average","params":{"window_size":7}},
+    {"model_type":"regression","params":{}},
+    {"model_type":"prophet_like","params":{}}
+  ],
+  "auto_train_winner": false, "auto_predict": false
+}' | python3 -m json.tool
+```
+
+Expected: HTTP 200; response carries `selection_id`, non-empty `ranking`, `winner.model_type`,
+`recommendation_confidence`, `chart_data`.
+
+## Final Validation Checklist
+
+- [ ] New slice follows `app/features/<slice>/{models,schemas,service,routes,tests}.py`.
+- [ ] Router wired in `app/main.py` (import alias + `include_router`, no prefix at include).
+- [ ] Migration `down_revision` chains to the live head; downgrade drops indexes then table.
+- [ ] Request schemas use `ConfigDict(strict=True)` + `Field(strict=False)` for every date field; strict-mode test green.
+- [ ] All 4xx responses use project exceptions (`BadRequestError`/`NotFoundError`/`DatabaseError`) → RFC 7807.
+- [ ] Ranking + explanation logic is pure and unit-tested; normalizer handles all five metric keys incl. `rmse`.
+- [ ] Availability covered for ready/limited/unusable + no-rows.
+- [ ] `auto_train_winner` uses direct `ForecastingService.train_model` (db first, feature args keyword-only).
+- [ ] `auto_predict` handles feature-aware-reject gracefully (warning, not 500).
+- [ ] LOCKED decisions #1–#7 are implemented and tested.
+- [ ] No frontend files, no agent mutation surface, no managed-cloud SDK.
+- [ ] All four Level-4 gates pass; `gh issue view <N>` confirms the referenced issue is open.
+
+## Anti-Patterns to Avoid
+
+- Don't implement the React UI; don't rank models in TypeScript — backend owns ranking/confidence.
+- Don't use batch item metrics for fold-level chart data (batch has none) — use direct `BacktestingService` with `store_fold_details=True`.
+- Don't import sibling feature *services* at module scope — lazy in-method (matches forecasting/BatchService precedent). ORM *models* at module scope is fine (OpsService precedent).
+- Don't import `validate_date_range` from analytics — reimplement locally.
+- Don't pass the candidate `params` as a nested dict to `ModelConfig` — FLATTEN (`{"model_type":..., **params}`).
+- Don't assume four metric keys — there are five (`rmse` included); normalize, never index a raw shape blindly.
+- Don't sum `(end_date - start_date)` for promotion days (double-counts overlaps; ignores chain-wide `store_id IS NULL`).
+- Don't mutate aliases automatically; don't add an agent tool.
+- Don't hide failed candidates — include them with `reason`.
+- Don't use an LLM for explanations — deterministic text only.
+- Don't raise on all-candidates-fail (LOCKED #3 → persist failed + return 200); DO raise on unusable availability (LOCKED #2 → 400).
+- Don't build SQL with string concatenation; don't weaken strict-mode or leakage tests.
+
+## Confidence Score
+
+**9.5/10** for one-pass backend implementation success. The prior draft self-rated 8/10 with
+"service signatures must be rechecked at implementation time" as the top risk — that risk is now
+**retired**: every `run_backtest` / `train_model` / `predict` signature, the corrected five-key
+metric shape, the `ModelConfig` flattening, the strict-mode rule, the migration/JSONB/exception
+patterns, and seven previously-ambiguous decisions are verified and locked here. An independent
+quality-gate pass confirmed every cited signature/line-number/field-name against live source
+("tried to break the cited signatures and could not") and its findings — the full response/
+intermediate contract (`CandidateResult`, `ModelRankEntry`, `RankingResult`, `WinnerSummary`,
+`ChartData`, `ModelSelectionRunResponse`, …), the `recommendation_confidence` naming, the
+`winner.params` carry-through, the `_response` mapping, and the rel-improvement denominator — are
+now specified inline.
+
+Residual risks:
+
+- Per-candidate backtest runtime: five models × a multi-fold backtest is synchronous in-process.
+  On a slow host the `/run` request can be slow (acceptable for a single pair; mirrors
+  `/backtesting/run`). If it becomes a problem, a future PRP can move it behind the jobs slice.
+- `promotion_days` derivation has real edge cases (chain-wide promos, overlapping ranges); the
+  PRP explicitly permits `null + warning` as a correct fallback.
+- `lightgbm`/`xgboost` candidates can `ImportError` when extras are absent — they degrade to a
+  failed candidate with a reason (verified path), not a 500.
diff --git a/PRPs/forecast-champion-selector-slice-a-selection-capability.md b/PRPs/forecast-champion-selector-slice-a-selection-capability.md
new file mode 100644
index 00000000..f43c0371
--- /dev/null
+++ b/PRPs/forecast-champion-selector-slice-a-selection-capability.md
@@ -0,0 +1,716 @@
+name: "Forecast Champion Selector — Slice A: Selection & Capability Foundation"
+description: |
+  First usable frontend/backend surface for the Forecast Champion Selector. Adds
+  one backend-owned model-capability catalog endpoint to the existing
+  `model_selection` slice, then builds the React selection shell — searchable
+  store/product selectors, pair validation, live data-availability assessment,
+  a simple/advanced backtest-settings form, and a candidate-model picker — under
+  a new `/visualize/champion` page. Slice A deliberately STOPS before running the
+  comparison: it does NOT call `POST /model-selection/run`, render ranking/chart
+  results, train, predict, or promote. Those are Slice B (async run + results)
+  and Slice C (train/predict/business summary/override/promotion).
+
+**Created:** 2026-06-01 · **Slice:** A of 3 (A → B → C)
+**Current repo base observed:** `dev` @ `6c3f8d4` (Merge PR #354 — model_selection backend merged)
+**Backend foundation (source of truth):** `PRPs/forecast-champion-selector-backend.md` (issue #353, MERGED) +
+the live slice `app/features/model_selection/` (schemas/service/routes/ranking/explanations verified 2026-06-01).
+**Working-tree caveat:** `docker-compose.lan.yml` is an untracked local dogfood override; do NOT commit it.
+**Tracking issue:** create before implementation, suggested title `feat(api,ui): forecast champion selector slice A — selection & capability`.
+**Suggested branch:** `feat/champion-selector-slice-a` (off `dev`, per `.claude/rules/branch-naming.md`).
+**Commit scope:** `api` (new catalog endpoint + slice schemas/service/routes) and `ui` (frontend page/components/hooks/types).
+No migration in Slice A — no schema change. Every commit references the tracking issue.
+
+---
+
+## Goal
+
+**Feature Goal:** Ship the first interactive Forecast Champion Selector surface — a `/visualize/champion`
+React page that lets a user choose a **Store → Product → Time Period → Forecast Horizon → Model Types →
+Backtest Settings**, see whether the chosen pair has enough history to model (live availability assessment),
+and pick candidate models from a **backend-owned** capability catalog — backed by exactly one new backend
+endpoint (`GET /model-selection/models`). The page is genuinely usable for *configuration + availability
+triage* even though the comparison **run** itself lands in Slice B.
+
+**Deliverable:**
+- **Backend:** `GET /model-selection/models` → `ModelCatalogResponse` (capability catalog), implemented via a new
+  pure module `app/features/model_selection/capabilities.py`, response schemas added to the slice's
+  `schemas.py`, a thin `ModelSelectionService.get_model_catalog()` delegate, and the route wired in the slice's
+  existing `routes.py`. No migration, no new mutation surface, no agent tool.
+- **Frontend:** a lazy-loaded `pages/visualize/champion.tsx` page (route `ROUTES.VISUALIZE.CHAMPION`,
+  nav entry under **Visualize**), a `components/champion-selector/` component family (searchable store/product
+  selects, availability panel, backtest-settings form, candidate-model picker), a `hooks/use-model-selection.ts`
+  query-hook module (catalog + availability reads), and a `types/api.ts` "Model Selection" section that declares
+  the FULL workflow contract (so Slices B/C inherit, not redefine, the types).
+
+**Success Definition:**
+1. `GET /model-selection/models` returns HTTP 200 with a non-empty `models` array — each entry carrying
+   `model_type`, `label`, `family ∈ {baseline,tree,additive}`, `feature_aware`, `requires_extra`,
+   `default_params`, `supports_auto_predict`, `description` — plus a `default_candidate_model_types` list.
+2. The `/visualize/champion` page renders: a searchable store select, a searchable product select (each with a
+   secondary line — store `code · name`, product `sku · category`), a date-range picker, a horizon input, a
+   candidate-model picker fed by `GET /model-selection/models`, and a simple/advanced backtest-settings form.
+3. Selecting a valid `(store, product, horizon)` triggers `GET /model-selection/availability` and renders a
+   `ready | limited | unusable` status block with coverage/observed-days/zero-sale/promotion/avg-demand and the
+   recommended split config; an unusable/empty pair shows a clear not-enough-data state.
+4. The "Run comparison" primary CTA is present but **disabled** with explanatory copy (Slice B turns it on).
+5. All Slice A validation gates pass (backend Level-1..4 + frontend `tsc`/`lint`/`test`).
+
+## Why
+
+- Business users want to ask "which model should I use for this store/product?" through a UI, not curl. Slice A
+  gives them the **configuration + triage** half of that workflow immediately, and a stable shell Slice B/C bolt
+  onto with minimal churn.
+- The capability catalog must be **backend-owned** (coordination contract): the model union, families, opt-in
+  extras, and feature-aware flags live in Python (`app/features/forecasting/`), and shipping them over an API
+  prevents the TypeScript `MODEL_FAMILY_MAP`/`MODEL_TYPE_LABELS` from drifting out of sync as new models land.
+- Declaring the full TS contract now (consumed read-only in A) means Slices B and C add behavior, not type
+  definitions — cleaner slice boundaries, fewer merge conflicts.
+- Preserves the single-host architecture: one new read-only GET, no queue, no new dependency, no cloud SDK.
+
+## What
+
+### New backend endpoint (added to the existing slice router `APIRouter(prefix="/model-selection")`)
+
+```http
+GET /model-selection/models
+```
+
+Response `ModelCatalogResponse`:
+
+```json
+{
+  "models": [
+    {
+      "model_type": "naive",
+      "label": "Naive",
+      "family": "baseline",
+      "feature_aware": false,
+      "requires_extra": false,
+      "default_params": {},
+      "supports_auto_predict": true,
+      "description": "Repeats the last observed value."
+    },
+    {
+      "model_type": "seasonal_naive",
+      "label": "Seasonal Naive",
+      "family": "baseline",
+      "feature_aware": false,
+      "requires_extra": false,
+      "default_params": { "season_length": 7 },
+      "supports_auto_predict": true,
+      "description": "Repeats the value from one season ago."
+    }
+    // ... one entry per forecasting ModelConfig member (11 total)
+  ],
+  "default_candidate_model_types": ["naive", "seasonal_naive", "moving_average", "regression", "prophet_like"]
+}
+```
+
+### LOCKED Slice-A decisions (remove every "choose-one" ambiguity)
+
+1. **Exactly one new backend endpoint:** `GET /model-selection/models`. It is **declared in `routes.py`
+   BEFORE the `GET /{selection_id}` route** (literal path must precede the path-param route, mirroring the
+   existing `/availability` route at `routes.py:41` which sits before `/{selection_id}` at `:94`). Status 200.
+   No request body, no query params.
+2. **Catalog is backend-owned and derived, not hand-duplicated.** `family` comes from the forecasting
+   authority `app.features.forecasting.feature_metadata.model_family_for(model_type)` (imported LAZILY inside
+   the builder, per the slice's cross-slice discipline) mapped to the lowercase literal
+   (`ModelFamily.BASELINE → "baseline"`, etc.). `model_type` iteration order + `default_params` + `label` +
+   `description` come from a slice-local ordered map in `capabilities.py` whose keys are asserted (in a test) to
+   exactly equal the `ModelType` Literal in `app/features/model_selection/schemas.py`.
+3. **`requires_extra`** = `model_type in {"lightgbm", "xgboost"}` (opt-in extras that may `ImportError`).
+   **`feature_aware`** = `model_type in {"regression", "prophet_like", "lightgbm", "xgboost", "random_forest"}`
+   (the set the forecasting `predict()` rejects — see Known Gotchas to verify against `forecasting/service.py`).
+   **`supports_auto_predict`** = `not feature_aware` (feature-aware winners cannot auto-predict — backend
+   `predict()` rejects them; this flag lets Slice C grey-out the auto-predict toggle).
+4. **`default_candidate_model_types`** = `["naive", "seasonal_naive", "moving_average", "regression", "prophet_like"]`
+   — the exact default five from the backend PRP's `POST /run` example, so the UI pre-selects the same set the
+   contract documents.
+5. **No `model_selection_run` write in Slice A.** The page consumes `GET /models` and `GET /availability` only.
+   It assembles a typed `ModelSelectionRunRequest` in component state and exposes it through a **disabled**
+   "Run comparison" CTA; Slice B wires the `POST /run` mutation + results. Slice A MUST NOT call `POST /run`,
+   `/{id}`, `/{id}/ranking`, `/{id}/train-winner`, or `/{id}/predict`.
+6. **Searchable selects use existing primitives only** (no new npm dependency). Stores/products are fetched at
+   `pageSize: 100` (the dimensions cap) and filtered **client-side** inside a `Popover` + text `Input` +
+   scrollable button list. (If the catalog ever exceeds 100, swap to the server-side `search` param the
+   `useStores`/`useProducts` hooks already support — out of scope here.)
+7. **Bias-explanation copy (locked, reused by B/C):** wherever bias is explained in help text/tooltips, use
+   exactly — *"Positive bias means the model under-forecasts (risk of stockouts); negative bias means it
+   over-forecasts (risk of overstock)."* Export it as a shared constant so B/C reuse the same wording.
+8. **WAPE is the default ranking metric**; the advanced form's ranking-metric select offers `wape` (default),
+   `smape`, `mae`, `bias`, with help text stating the tie-break chain *WAPE → sMAPE → |bias| → MAE* and the
+   bias copy from #7.
+
+### Success Criteria
+
+- [ ] `GET /model-selection/models` returns 200 with `models` (11 entries) + `default_candidate_model_types`.
+- [ ] `capabilities.build_model_catalog()` is pure (no DB/IO) and its `model_type` set equals the slice
+      `ModelType` Literal (asserted by a test).
+- [ ] `/model-selection/models` is matched correctly (NOT captured by `/{selection_id}`) — route-order test green.
+- [ ] `/visualize/champion` route + Visualize nav entry render the page; lazy-loaded like its siblings.
+- [ ] Searchable store + product selects filter client-side and show the secondary descriptor line.
+- [ ] Pair validation: the form's primary CTA stays disabled until a store, product, valid date window, and
+      horizon are all chosen; the date window + horizon respect backend bounds.
+- [ ] Availability auto-fetches for a valid pair and renders `ready/limited/unusable` + metrics + recommended
+      split config; an empty/unusable pair renders a not-enough-data `EmptyState`.
+- [ ] The candidate-model picker is fed by `GET /model-selection/models`; opt-in-extra models are visibly
+      flagged; the default five are pre-selected.
+- [ ] The simple/advanced settings form mirrors `SplitConfig` bounds and keeps `split_config.horizon ===
+      forecast_horizon` (matching the backend request validator).
+- [ ] The "Run comparison" CTA is present but disabled with copy indicating it arrives next.
+- [ ] No `POST /model-selection/run` (or any mutation) is called; no chart/ranking results UI; no train/predict/
+      promotion UI; no agent tool; no migration; no new npm dependency.
+- [ ] `app/core/tests/test_strict_mode_policy.py` stays green (no new strict request model with date fields).
+- [ ] All backend Level-1..4 gates + frontend `pnpm tsc --noEmit && pnpm lint && pnpm test --run` pass.
+
+## All Needed Context
+
+### Documentation & References
+
+```yaml
+# Slice / contract source of truth
+- file: PRPs/forecast-champion-selector-backend.md
+  why: The merged backend foundation. LOCKED decisions #1-#7, the full /run + /{id} contract, the
+       availability semantics (ready/limited/unusable thresholds), and the default-five candidate list.
+       Slice A consumes this contract read-only; do not re-derive ranking/confidence in TS.
+- file: PRPs/ai_docs/forecast-champion-selector-backend-research.md
+  why: External-lib + runtime facts (FastAPI APIRouter, Pydantic strict mode, sklearn TimeSeriesSplit).
+- file: PRPs/templates/prp_base.md
+  why: Base PRP template structure. NOTE — the referenced "PRPs/prp-readme.md.md" does NOT exist
+       (`find PRPs -iname '*readme*'` empty on 2026-06-01); the backend PRP records the same finding.
+
+# Live backend slice to read (the contract the UI consumes)
+- file: app/features/model_selection/schemas.py
+  why: ModelType Literal (:34, the 11 model_types), RankingMetric (:48), AvailabilityStatus (:51),
+       ConfidenceLevel (:50), PairAvailabilityResponse (:239), ModelSelectionRunRequest (:118),
+       ModelSelectionRunResponse (:267), ModelRankEntry (:195), WinnerSummary (:216), ChartData (:225).
+       ADD the new ModelCatalogResponse + CandidateModelInfo here (plain BaseModel — outputs need no strict).
+- file: app/features/model_selection/routes.py
+  why: APIRouter(prefix="/model-selection") (:38); the literal `/availability` (:41) precedes `/{selection_id}`
+       (:94) — MIRROR that ordering for the new `/models` route. Error mapping: ValueError→BadRequestError,
+       SQLAlchemyError→DatabaseError.
+- file: app/features/model_selection/service.py
+  why: Stateless service pattern; lazy cross-slice imports inside methods (:215-219). ADD
+       get_model_catalog() delegating to capabilities.build_model_catalog() (no DB needed; keep signature
+       db-free or accept db and ignore — prefer db-free since the catalog is static).
+- file: app/features/model_selection/ranking.py
+  why: PURE-module precedent (no DB/IO, unit-tested directly). MIRROR this style for capabilities.py.
+- file: app/features/model_selection/explanations.py
+  why: Second pure-module precedent (deterministic text). Same import/style conventions.
+- file: app/features/model_selection/tests/test_routes.py
+  why: Route-test pattern (ASGITransport + AsyncClient + dependency_overrides[get_db]); ADD a /models 200
+       test + a route-ordering test (GET /model-selection/models is NOT treated as selection_id="models").
+- file: app/features/model_selection/tests/test_ranking.py
+  why: Pure-unit test pattern to MIRROR for tests/test_capabilities.py.
+
+# Backend authority for model family / union (catalog source)
+- file: app/features/forecasting/feature_metadata.py
+  why: model_family_for(model_type) -> ModelFamily (:57) and _MODEL_FAMILY_MAP (:42). The catalog `family`
+       field derives from here. ModelFamily enum is BASELINE/TREE/ADDITIVE (lowercase .value).
+- file: app/features/forecasting/schemas.py
+  why: ModelConfig union (the 11 flat members + their default params). Use to VERIFY default_params per model
+       (see Known Gotchas verification one-liner). ModelFamily enum lives here too (imported by feature_metadata).
+- file: app/features/backtesting/schemas.py
+  why: SplitConfig (:24) — strategy Literal["expanding","sliding"] (def "expanding"), n_splits 2-20 (def 5),
+       min_train_size >=7 (def 30), gap 0-30 (def 0), horizon 1-90 (def 14), field_validator horizon>gap (:65).
+       The TS SplitConfig type + advanced form bounds mirror this exactly.
+
+# Frontend examples to MIRROR (verified 2026-06-01)
+- file: frontend/src/pages/visualize/backtest.tsx
+  why: Canonical analytical page: Card sections, store/product Select fed by useStores/useProducts
+       ({page:1,pageSize:100}), DateRangePicker, numeric Inputs, a `formReady` gate, EmptyState/LoadingState,
+       getErrorMessage. Slice A's champion page mirrors this density (minus the results/charts).
+- file: frontend/src/components/forecast-intelligence/model-type-select.tsx
+  why: shadcn Select-based model picker convention + data-testid pattern. The Slice-A candidate picker mirrors
+       the labelling style but sources options from GET /model-selection/models (NOT the hardcoded util).
+- file: frontend/src/components/forecast-intelligence/model-type-utils.ts
+  why: The EXISTING hardcoded MODEL_FAMILY_MAP / MODEL_TYPE_LABELS used by OTHER pages. DO NOT refactor or
+       delete it in Slice A — other pages depend on it; the champion page just doesn't use it.
+- file: frontend/src/components/forecast-intelligence/batch-matrix-picker.tsx
+  why: Multi-select-of-models pattern (checkbox list, max-rows cap, data-testid scheme, Badge for state).
+       The candidate-model picker mirrors this (checkbox per model, opt-in-extra Badge), but rows = model_types
+       from the catalog, no feature-frame matrix (that's B/C).
+- file: frontend/src/components/forecast-intelligence/batch-matrix-picker.test.tsx
+  why: Component test convention — render + fireEvent + expect(onChange).toHaveBeenCalledWith; afterEach(cleanup).
+- file: frontend/src/hooks/use-stores.ts
+  why: useStores({page,pageSize,...,search,enabled}) query-hook shape + keyed query + keepPreviousData.
+- file: frontend/src/hooks/use-products.ts
+  why: useProducts(...) — identical shape; the searchable selects fetch at pageSize:100.
+- file: frontend/src/hooks/use-batches.test.ts
+  why: Hook test convention — vi.fn() fetch mock via vi.stubGlobal('fetch',...), QueryClient wrapper,
+       renderHook + waitFor, afterEach(vi.unstubAllGlobals()). MIRROR for use-model-selection.test.ts.
+- file: frontend/src/hooks/index.ts
+  why: Star-export barrel; ADD `export * from './use-model-selection'`.
+- file: frontend/src/lib/api.ts
+  why: `api<T>(endpoint,{params})` typed fetch helper; getErrorMessage(); ApiError. All hooks call `api`.
+- file: frontend/src/lib/constants.ts
+  why: ROUTES (VISUALIZE.* block) + NAV_ITEMS (Visualize group). ADD ROUTES.VISUALIZE.CHAMPION +
+       a { label:'Champion Selector', href: ROUTES.VISUALIZE.CHAMPION } nav entry under Visualize.
+- file: frontend/src/App.tsx
+  why: Lazy-page + <Route path={ROUTES.VISUALIZE.X} element={<Suspense><Page/></Suspense>}> pattern. ADD the
+       champion route mirroring the BATCH/PLANNER entries.
+- file: frontend/src/types/api.ts
+  why: Section-commented type file. ModelFamily (:177 = 'baseline'|'tree'|'additive'), ProblemDetail (:652),
+       Store/StoreListResponse (:10/:21), Product/ProductListResponse (:25/:37). ADD a new
+       "// === Model Selection (Champion Selector) ===" section near the Registry block.
+- file: frontend/src/components/common/error-display.tsx
+  why: EmptyState({title,description,action?,icon?}) — used for the not-enough-data state.
+- file: frontend/src/components/common/loading-state.tsx
+  why: LoadingState({message}) — used while availability/catalog load.
+- file: frontend/src/components/common/date-range-picker.tsx
+  why: DateRangePicker({value:DateRange|undefined,onChange}) — the time-period selector.
+- file: frontend/src/components/ui/{select,popover,input,card,button,badge,checkbox,table}.tsx
+  why: Available shadcn primitives. NOTE: there is NO command/combobox/cmdk primitive — build the searchable
+       select from Popover + Input + a filtered button list (LOCKED #6).
+- file: frontend/src/components/layout/top-nav.tsx
+  why: Renders NAV_ITEMS (grouped via NavigationMenu). No edit needed beyond the constants.ts NAV_ITEMS entry.
+- file: frontend/vitest.config.ts
+  why: jsdom env; include 'src/**/*.test.{ts,tsx}'; `@`→./src alias. No setup file. `pnpm test --run` runs once.
+
+# External official docs (with reasoning)
+- url: https://fastapi.tiangolo.com/tutorial/bigger-applications/#include-an-apirouter-with-a-custom-prefix-tags-responses-and-dependencies
+  why: APIRouter route-registration + the literal-before-path-param ordering rule that LOCKED #1 depends on.
+- url: https://www.ibm.com/design/language/  # (progressive disclosure principle)
+  why: Simple/advanced settings split — show the recommended split config by default, reveal n_splits/min_train/
+       gap/strategy under an "Advanced" toggle so novice users aren't overwhelmed. NOTE: the originally-cited
+       IBM technical-content URL 404s; use the IBM Design language site / Nielsen Norman
+       (https://www.nngroup.com/articles/progressive-disclosure/) as the canonical reference instead.
+- url: https://help.tableau.com/current/pro/desktop/en-us/dashboards_best_practices.htm
+  why: Analytical dashboard layout — lead with the question (which model?), group related controls, keep the
+       availability triage adjacent to the selection. Informs the Card grouping of the champion page.
+- url: https://scikit-learn.org/stable/modules/generated/sklearn.model_selection.TimeSeriesSplit.html
+  why: The split semantics behind SplitConfig (expanding window, n_splits, gap, horizon) — so the advanced
+       form's help text describes folds correctly.
+- url: https://tanstack.com/query/latest/docs/framework/react/guides/queries
+  why: useQuery enabled-gating (only fetch availability once a valid pair exists) + queryKey conventions.
+```
+
+### Current Codebase Tree (relevant)
+
+```bash
+app/features/model_selection/        # MERGED backend slice (issue #353)
+├── __init__.py
+├── models.py            # ModelSelectionRun ORM (NOT touched in Slice A)
+├── schemas.py           # request/response contract  ← ADD catalog response models
+├── ranking.py           # pure ranking (precedent for capabilities.py)
+├── explanations.py      # pure explanations (precedent)
+├── service.py           # ModelSelectionService     ← ADD get_model_catalog()
+├── routes.py            # APIRouter(/model-selection) ← ADD GET /models (before /{selection_id})
+└── tests/               # ← ADD test_capabilities.py; extend test_routes.py
+app/features/forecasting/feature_metadata.py   # model_family_for() — catalog family authority
+frontend/src/
+├── App.tsx                              # ← ADD lazy champion route
+├── lib/{api,constants}.ts               # ← constants: ROUTES.VISUALIZE.CHAMPION + NAV_ITEMS entry
+├── types/api.ts                         # ← ADD "Model Selection" section
+├── hooks/{use-stores,use-products,index}.ts  # ← index: export use-model-selection
+├── pages/visualize/{backtest,batch,...}.tsx  # page-density precedent
+└── components/
+    ├── common/{error-display,loading-state,date-range-picker}.tsx
+    ├── ui/{select,popover,input,card,button,badge,checkbox,table}.tsx
+    └── forecast-intelligence/{model-type-select,batch-matrix-picker}.tsx  # picker precedents
+```
+
+### Desired Codebase Tree (Slice A additions)
+
+```bash
+# Backend
+app/features/model_selection/capabilities.py          # NEW: pure build_model_catalog()
+app/features/model_selection/schemas.py               # MODIFIED: + CandidateModelInfo, ModelCatalogResponse
+app/features/model_selection/service.py               # MODIFIED: + get_model_catalog()
+app/features/model_selection/routes.py                # MODIFIED: + GET /models (before /{selection_id})
+app/features/model_selection/tests/test_capabilities.py   # NEW: pure catalog unit tests
+app/features/model_selection/tests/test_routes.py     # MODIFIED: + /models route + ordering tests
+
+# Frontend
+frontend/src/lib/constants.ts                         # MODIFIED: ROUTES.VISUALIZE.CHAMPION + NAV_ITEMS entry
+frontend/src/App.tsx                                  # MODIFIED: lazy ChampionSelectorPage route
+frontend/src/types/api.ts                             # MODIFIED: Model Selection section (full contract)
+frontend/src/hooks/use-model-selection.ts             # NEW: useModelCatalog + usePairAvailability
+frontend/src/hooks/use-model-selection.test.ts        # NEW
+frontend/src/hooks/index.ts                           # MODIFIED: + export
+frontend/src/pages/visualize/champion.tsx             # NEW: the page shell
+frontend/src/components/champion-selector/searchable-entity-select.tsx        # NEW (generic combobox)
+frontend/src/components/champion-selector/searchable-entity-select.test.tsx   # NEW
+frontend/src/components/champion-selector/availability-panel.tsx              # NEW
+frontend/src/components/champion-selector/availability-panel.test.tsx         # NEW
+frontend/src/components/champion-selector/backtest-settings-form.tsx          # NEW
+frontend/src/components/champion-selector/backtest-settings-form.test.tsx     # NEW
+frontend/src/components/champion-selector/candidate-model-picker.tsx          # NEW
+frontend/src/components/champion-selector/candidate-model-picker.test.tsx     # NEW
+frontend/src/components/champion-selector/copy.ts                             # NEW: BIAS_EXPLANATION const (LOCKED #7)
+```
+
+### Known Gotchas & VERIFIED Contracts
+
+```python
+# ── ROUTE ORDERING (LOCKED #1) ────────────────────────────────────────────────
+# Starlette matches routes in DECLARATION ORDER. The literal `GET /models` MUST be declared BEFORE
+# `GET /{selection_id}` or a request to /model-selection/models is captured as selection_id="models"
+# and 404s in the service. The existing `/availability` route (routes.py:41) already sits before
+# `/{selection_id}` (:94) — place `/models` immediately after `/availability`.
+
+# ── CATALOG default_params — VERIFY before hardcoding ─────────────────────────
+# default_params per model must match the forecasting ModelConfig member defaults. Verify with:
+#   uv run python -c "
+#   from pydantic import TypeAdapter
+#   from app.features.forecasting.schemas import ModelConfig
+#   a=TypeAdapter(ModelConfig)
+#   for mt in ['naive','seasonal_naive','moving_average','weighted_moving_average','seasonal_average',
+#              'trend_regression_baseline','regression','prophet_like','random_forest','lightgbm','xgboost']:
+#       try:
+#           m=a.validate_python({'model_type':mt}); d=m.model_dump(); d.pop('model_type',None)
+#           print(mt, d)
+#       except Exception as e:
+#           print(mt, 'NEEDS-PARAMS:', e)"
+# Use the printed defaults as `default_params` in capabilities.py. If a member REQUIRES a param (validation
+# error with only model_type), supply the contract default (seasonal_naive→{'season_length':7},
+# moving_average→{'window_size':7}) — match the backend PRP /run example. Pin these in test_capabilities.py.
+
+# ── feature_aware / requires_extra — VERIFY against forecasting predict() reject ──
+# LOCKED #3 sets feature_aware = {regression, prophet_like, lightgbm, xgboost, random_forest}. Confirm this
+# equals the set ForecastingService.predict() rejects (the backend PRP cites forecasting/service.py:491
+# "rejects feature-aware models"). If the live reject-set differs, the live code wins — update the
+# capabilities set and the test to match, and note the discrepancy in the PR description.
+
+# ── family literal mapping ────────────────────────────────────────────────────
+# model_family_for(mt) returns a ModelFamily enum; serialize via `.value` → "baseline"|"tree"|"additive"
+# which already matches the frontend ModelFamily TS union (types/api.ts:177). Import model_family_for
+# LAZILY inside build_model_catalog() (mirror service.py lazy cross-slice imports).
+
+# ── NO new strict request model ───────────────────────────────────────────────
+# GET /models has no body and no query params → no ConfigDict(strict=True) model, no date fields → the
+# strict-mode policy linter is unaffected. Do NOT add an AvailabilityQuery-style model for /models.
+
+# ── catalog is static/pure ─────────────────────────────────────────────────────
+# build_model_catalog() takes no args and does no I/O — it is unit-testable like ranking.py. get_model_catalog()
+# on the service is a thin pass-through (no db round-trip needed); keep it sync-pure or trivially async.
+```
+
+```typescript
+// ── FRONTEND ────────────────────────────────────────────────────────────────
+// NO combobox/cmdk primitive exists (only select/popover/input/dialog under components/ui). Build the
+// searchable select from <Popover> + <Input> (filter box) + a scrollable list of <button> rows. Filter the
+// already-fetched ≤100 rows CLIENT-SIDE (LOCKED #6). Do NOT add cmdk / a new npm dependency.
+//
+// Stores/products: useStores({page:1,pageSize:100}) / useProducts({page:1,pageSize:100}) (the dimensions
+// endpoints cap page_size at 100 — see backtest.tsx:97-98).
+//
+// IDs are NOT 1-based (memory: seeder-does-not-reset-id-sequences) — never hardcode store_id=1/product_id=1
+// in tests or examples; read real IDs from the dimensions list. selection_id is BACKEND-generated — do NOT
+// call crypto.randomUUID() client-side (memory: showcase-crypto-randomuuid-lan-crash; undefined over LAN HTTP).
+//
+// SplitConfig has NO existing TS type — add it. Mirror backend bounds EXACTLY:
+//   strategy: 'expanding'|'sliding' (def 'expanding'); n_splits 2..20 (def 5); min_train_size >=7 (def 30);
+//   gap 0..30 (def 0); horizon 1..90 (def 14); horizon must be > gap; AND split_config.horizon === forecast_horizon
+//   (the backend ModelSelectionRunRequest validator enforces both — mirror client-side so the assembled
+//   request is always valid for Slice B).
+//
+// Availability fetch is gated: usePairAvailability(storeId, productId, horizon, { enabled: !!storeId && !!productId })
+// — only fire once a pair is chosen (TanStack `enabled`). Mirror useStore(storeId, enabled) gating style.
+//
+// Mixed CRLF/LF line endings exist repo-wide (memory: repo-line-endings-crlf) — run `git diff --stat` before
+// committing to avoid whole-file noise diffs; keep new files LF.
+//
+// VITE_API_BASE_URL must be http://localhost:8123 for local dogfood (memory/CLAUDE.local.md).
+```
+
+## Implementation Blueprint
+
+### Backend data models (added to `app/features/model_selection/schemas.py`)
+
+```python
+# Response-only (plain BaseModel — no strict needed). Place after the existing response models.
+class CandidateModelInfo(BaseModel):
+    """One selectable forecasting model in the capability catalog."""
+    model_type: str
+    label: str
+    family: Literal["baseline", "tree", "additive"]
+    feature_aware: bool
+    requires_extra: bool          # lightgbm/xgboost — opt-in extra may be absent at runtime
+    default_params: dict[str, Any]
+    supports_auto_predict: bool   # False for feature-aware models (predict() rejects them)
+    description: str
+
+class ModelCatalogResponse(BaseModel):
+    """GET /model-selection/models — backend-owned candidate catalog."""
+    models: list[CandidateModelInfo]
+    default_candidate_model_types: list[str]
+```
+
+`app/features/model_selection/capabilities.py` (pure):
+
+```python
+# CRITICAL details only — not full code.
+# _CATALOG: an ORDERED dict/list keyed by model_type with (label, default_params, description) — keys MUST
+#   equal the ModelType Literal members (asserted in test_capabilities.py).
+# _FEATURE_AWARE = frozenset({"regression","prophet_like","lightgbm","xgboost","random_forest"})  # LOCKED #3
+# _REQUIRES_EXTRA = frozenset({"lightgbm","xgboost"})
+# DEFAULT_CANDIDATE_MODEL_TYPES = ["naive","seasonal_naive","moving_average","regression","prophet_like"]
+#
+# def build_model_catalog() -> ModelCatalogResponse:
+#     from app.features.forecasting.feature_metadata import model_family_for   # lazy cross-slice
+#     models = []
+#     for model_type, meta in _CATALOG.items():
+#         family = model_family_for(model_type).value          # "baseline"|"tree"|"additive"
+#         feature_aware = model_type in _FEATURE_AWARE
+#         models.append(CandidateModelInfo(
+#             model_type=model_type, label=meta.label, family=family,
+#             feature_aware=feature_aware, requires_extra=model_type in _REQUIRES_EXTRA,
+#             default_params=meta.default_params, supports_auto_predict=not feature_aware,
+#             description=meta.description))
+#     return ModelCatalogResponse(models=models, default_candidate_model_types=DEFAULT_CANDIDATE_MODEL_TYPES)
+```
+
+### Implementation Tasks (dependency-ordered)
+
+```yaml
+# ───────────────────────── BACKEND ─────────────────────────
+Task 1 — Catalog schemas:
+  MODIFY app/features/model_selection/schemas.py:
+    - ADD CandidateModelInfo + ModelCatalogResponse (plain BaseModel; reuse existing Literal/Any imports).
+
+Task 2 — Pure catalog builder:
+  CREATE app/features/model_selection/capabilities.py:
+    - MIRROR ranking.py module style (pure, no DB/IO, `from __future__ import annotations`).
+    - _CATALOG ordered map (label/default_params/description per model_type) — RUN the verification one-liner
+      (Known Gotchas) and pin default_params to the printed forecasting defaults.
+    - build_model_catalog() per blueprint; lazy-import model_family_for.
+
+Task 3 — Service delegate:
+  MODIFY app/features/model_selection/service.py:
+    - ADD get_model_catalog(self) -> ModelCatalogResponse  (thin: `return build_model_catalog()`).
+      (Keep it on the service for symmetry with availability/run; no db arg needed.)
+    - Import build_model_catalog + ModelCatalogResponse (module scope is fine — same slice, no cycle).
+
+Task 4 — Route (ORDER MATTERS):
+  MODIFY app/features/model_selection/routes.py:
+    - ADD `@router.get("/models", response_model=ModelCatalogResponse, status_code=200)` IMMEDIATELY AFTER the
+      `/availability` handler and BEFORE `GET /{selection_id}` (LOCKED #1).
+    - Handler: `service = ModelSelectionService(); return service.get_model_catalog()`  (wrap in the same
+      try/except SQLAlchemyError→DatabaseError shell only if it touches db; catalog is static so a bare return
+      is fine — but keep the import of the response model).
+
+Task 5 — Backend tests:
+  CREATE app/features/model_selection/tests/test_capabilities.py:
+    - test_catalog_model_types_match_literal  (keys == ModelType.__args__)
+    - test_catalog_families_are_valid_literals (each family in {baseline,tree,additive})
+    - test_requires_extra_flags_lightgbm_xgboost_only
+    - test_feature_aware_models_do_not_support_auto_predict
+    - test_default_candidate_model_types_are_the_default_five
+    - test_default_params_match_forecasting_defaults  (seasonal_naive season_length=7, moving_average window_size=7)
+  MODIFY app/features/model_selection/tests/test_routes.py:
+    - test_get_models_returns_catalog_200  (ASGITransport; assert models non-empty + default list)
+    - test_models_route_not_captured_by_selection_id  (GET /model-selection/models ≠ a 404 "selection run models
+      not found"; assert it returns the catalog shape, proving literal-before-param ordering)
+
+# ───────────────────────── FRONTEND ─────────────────────────
+Task 6 — TS contract:
+  MODIFY frontend/src/types/api.ts:
+    - ADD a "// === Model Selection (Champion Selector) ===" section. Declare the FULL workflow contract so
+      Slices B/C inherit it:
+      SplitConfig, CandidateModelConfig, RankingPolicy, ModelSelectionRunRequest, SelectionWindow,
+      CandidateModelInfo, ModelCatalogResponse, PairAvailability (mirror PairAvailabilityResponse),
+      ModelRankEntry, WinnerSummary, ChartData, ForecastSummary, ModelSelectionRunResponse.
+    - family field reuses the existing ModelFamily union; status uses 'pending'|'running'|'completed'|'partial'|'failed'.
+    - Mark with a comment which types Slice A CONSUMES (ModelCatalogResponse, PairAvailability, SplitConfig)
+      vs which are DECLARED-FOR-LATER (run request/response, ranking, chart).
+
+Task 7 — Query hooks:
+  CREATE frontend/src/hooks/use-model-selection.ts:
+    - useModelCatalog(): useQuery(['model-selection','models'], () => api<ModelCatalogResponse>('/model-selection/models'))
+      with staleTime long (catalog is static).
+    - usePairAvailability(storeId, productId, forecastHorizon, enabled): useQuery keyed on the triple, calling
+      api<PairAvailability>('/model-selection/availability', { params: { store_id, product_id, forecast_horizon } }),
+      enabled: enabled && storeId>0 && productId>0  (MIRROR useStore gating).
+  MODIFY frontend/src/hooks/index.ts: ADD `export * from './use-model-selection'` (alpha order).
+  CREATE frontend/src/hooks/use-model-selection.test.ts:
+    - MIRROR use-batches.test.ts (vi.stubGlobal('fetch',...), QueryClient wrapper, renderHook+waitFor).
+    - assert /model-selection/models URL + parsed catalog; assert availability URL carries the 3 query params;
+      assert availability query is DISABLED when storeId/productId absent (fetch not called).
+
+Task 8 — Shared copy + searchable select:
+  CREATE frontend/src/components/champion-selector/copy.ts:
+    - export const BIAS_EXPLANATION = "Positive bias means the model under-forecasts (risk of stockouts); "
+      + "negative bias means it over-forecasts (risk of overstock)."   # LOCKED #7
+    - export const RANKING_TIE_BREAK = "Ranked by WAPE, then sMAPE, then |bias|, then MAE."   # LOCKED #8
+  CREATE frontend/src/components/champion-selector/searchable-entity-select.tsx:
+    - Generic: props { items: {id:number; primary:string; secondary?:string}[]; value:number|null;
+      onChange:(id:number)=>void; placeholder; loading?; emptyLabel? }.
+    - Popover + trigger Button (shows selected primary/secondary) + Input filter (client-side, case-insensitive
+      over primary+secondary) + scrollable list of <button> rows. data-testid="searchable-entity-select".
+  CREATE searchable-entity-select.test.tsx: render, type a filter, assert filtered rows; click selects + calls onChange.
+
+Task 9 — Availability panel:
+  CREATE frontend/src/components/champion-selector/availability-panel.tsx:
+    - props { availability?: PairAvailability; isLoading; isError }.
+    - LoadingState while loading; EmptyState ("Not enough data to model this pair") when status==='unusable' OR
+      observed_days===0; otherwise a Card with a status Badge (ready=default, limited=secondary/amber,
+      unusable=destructive) + metric tiles (observed_days, coverage_ratio %, zero_sale_days, promotion_days
+      [or "—" when null], average_daily_demand) + a "Recommended split" summary (strategy, n_splits, min_train,
+      gap, horizon). Render warnings[] as muted lines.
+  CREATE availability-panel.test.tsx: ready→tiles render; unusable→EmptyState; null promotion_days→"—".
+
+Task 10 — Backtest settings form (simple/advanced):
+  CREATE frontend/src/components/champion-selector/backtest-settings-form.tsx:
+    - props { value: SplitConfig; rankingMetric: RankingMetric; forecastHorizon:number;
+      onChange:(next:SplitConfig)=>void; onRankingMetricChange:(m)=>void; recommended?:SplitConfig }.
+    - "Simple" view shows recommended split read-only + a "Use recommended" button; an "Advanced" toggle reveals
+      n_splits / min_train_size / gap / strategy inputs (bounds per SplitConfig). horizon is DERIVED from
+      forecastHorizon (kept equal — LOCKED Gotcha) and shown read-only with a note.
+    - ranking-metric Select (wape default / smape / mae / bias) with help text = RANKING_TIE_BREAK + BIAS_EXPLANATION.
+    - client-side validation surfaces inline errors (n_splits 2-20, min_train>=7, gap 0-30, gap<horizon).
+  CREATE backtest-settings-form.test.tsx: advanced toggle reveals inputs; invalid n_splits shows error; "Use
+    recommended" calls onChange with the recommended config.
+
+Task 11 — Candidate-model picker:
+  CREATE frontend/src/components/champion-selector/candidate-model-picker.tsx:
+    - props { catalog?: ModelCatalogResponse; selected:string[]; onChange:(types:string[])=>void; isLoading }.
+    - MIRROR batch-matrix-picker: checkbox per catalog model (grouped by family), opt-in-extra models show a
+      "extra" Badge, feature-aware models show a small "feature-aware" hint; cap selection at 10 (backend
+      candidate_models max_length=10) with a "max reached" Badge. Pre-select default_candidate_model_types on
+      first catalog load (controlled by the page). data-testid per model.
+  CREATE candidate-model-picker.test.tsx: toggling a model calls onChange; cap at 10 disables further adds;
+    extra Badge present for lightgbm/xgboost.
+
+Task 12 — Page shell:
+  CREATE frontend/src/pages/visualize/champion.tsx (default export):
+    - MIRROR backtest.tsx layout density. State: storeId, productId, dateRange, forecastHorizon, splitConfig,
+      rankingMetric, selectedModels.
+    - useStores/useProducts ({page:1,pageSize:100}) → feed two SearchableEntitySelect (store primary=`code · name`,
+      product primary=`sku · name`, secondary=category). useModelCatalog() → CandidateModelPicker (pre-select
+      defaults on load). usePairAvailability(storeId,productId,forecastHorizon, enabled=valid pair) → AvailabilityPanel.
+    - Keep splitConfig.horizon === forecastHorizon (sync on horizon change); seed splitConfig from
+      availability.recommended_split_config when it arrives (only if the user hasn't edited — simplest: a
+      "Use recommended" button rather than auto-overwrite).
+    - Assemble a typed `ModelSelectionRunRequest` (store_id, product_id, selection_window from dateRange,
+      forecast_horizon, ranking_metric, split_config, candidate_models=[{model_type, params:{}}...], V1 defaults).
+      Set `auto_train_winner: false` and `auto_predict: false` explicitly: the async run path (Slice B `POST /runs`)
+      treats both as NO-OPS, and training/prediction happen later via Slice C's explicit `train-winner`/`train-selected`/
+      `predict` actions — so these two request fields are effectively dead in the UI flow (set false, never surfaced).
+      Render a DISABLED "Run comparison" Button with help text "Model comparison runs in the next update"
+      (LOCKED #5). Gate en/disable purely on form validity; never call POST.
+    - EmptyState when no pair chosen; LoadingState while catalog loads; getErrorMessage on query errors.
+  MODIFY frontend/src/lib/constants.ts:
+    - ROUTES.VISUALIZE.CHAMPION = '/visualize/champion'
+    - NAV_ITEMS Visualize group: add { label: 'Champion Selector', href: ROUTES.VISUALIZE.CHAMPION }
+  MODIFY frontend/src/App.tsx:
+    - const ChampionSelectorPage = lazy(() => import('@/pages/visualize/champion'))
+    - <Route path={ROUTES.VISUALIZE.CHAMPION} element={<Suspense fallback={<PageLoader/>}><ChampionSelectorPage/></Suspense>} />
+```
+
+### Integration Points
+
+```yaml
+ROUTES (backend):
+  - app/features/model_selection/routes.py: GET /models added BEFORE /{selection_id} (no app/main.py change —
+    the router is already wired).
+ROUTES (frontend):
+  - constants.ts ROUTES.VISUALIZE.CHAMPION + NAV_ITEMS entry; App.tsx lazy <Route>.
+CONFIG: none (no settings, no .env var, no migration).
+OBSERVABILITY: catalog endpoint may log `model_selection.catalog_served` (optional; mirror existing logger.info
+  events) — not required.
+```
+
+## Validation Loop
+
+### Level 1 — Backend syntax & policy
+
+```bash
+uv run ruff check app/features/model_selection
+uv run ruff format --check app/features/model_selection
+uv run mypy app/features/model_selection
+uv run pyright app/features/model_selection
+uv run pytest app/core/tests/test_strict_mode_policy.py -v   # must stay green (no new strict date model)
+```
+
+### Level 2 — Backend unit tests
+
+```bash
+uv run pytest app/features/model_selection/tests/test_capabilities.py app/features/model_selection/tests/test_routes.py -v -m "not integration"
+```
+
+### Level 3 — Frontend gates
+
+```bash
+cd frontend && pnpm tsc --noEmit && pnpm lint && pnpm test --run
+```
+
+Expected: type-check clean; lint clean (react-refresh only-export-components — keep non-component exports like
+`copy.ts` constants in `.ts` files, not `.tsx`); new component + hook tests pass.
+
+### Level 4 — Full gates (must be green before PR)
+
+```bash
+uv run ruff check . && uv run ruff format --check .
+uv run mypy app/ && uv run pyright app/
+uv run pytest -v -m "not integration"
+cd frontend && pnpm tsc --noEmit && pnpm lint && pnpm test --run
+```
+
+> Known-local-noise: mypy/pyright report pre-existing `lightgbm`/`xgboost` optional-dep import errors in
+> `forecasting/`+`registry/` (CI installs the extras). Do NOT "fix" them — and remember a green LOCAL mypy can
+> MASK errors that only surface once the extras resolve types (memory: the #355 finalizer cast).
+
+### Manual dogfood probe (discover REAL ids first — IDs are NOT 1-based)
+
+```bash
+uv run uvicorn app.main:app --port 8123 &
+# 0) catalog
+curl -s http://localhost:8123/model-selection/models | python3 -m json.tool | head -40
+# 1) confirm /models is NOT captured by /{selection_id} (should be the catalog, not a 404)
+curl -s -o /dev/null -w "%{http_code}\n" http://localhost:8123/model-selection/models   # 200
+# 2) discover real ids, then availability
+curl -s "http://localhost:8123/dimensions/stores?page=1&page_size=5" | python3 -m json.tool | grep '"id"'
+curl -s "http://localhost:8123/dimensions/products?page=1&page_size=5" | python3 -m json.tool | grep '"id"'
+curl -s "http://localhost:8123/model-selection/availability?store_id=<ID>&product_id=<ID>&forecast_horizon=14" | python3 -m json.tool
+# 3) frontend: VITE_API_BASE_URL=http://localhost:8123; pnpm dev (or ./node_modules/.bin/vite --host 0.0.0.0);
+#    dogfood /visualize/champion over http://localhost:5173 (NOT a LAN IP — crypto/secure-context memory).
+```
+
+Expected: catalog 200 with 11 models + default-five list; availability renders ready/limited/unusable on the
+page; the "Run comparison" CTA is visibly disabled; no console call to `POST /model-selection/run`.
+
+## Final Validation Checklist
+
+- [ ] `GET /model-selection/models` returns 200 with 11 models + default-five list; declared BEFORE `/{selection_id}`.
+- [ ] `capabilities.build_model_catalog()` is pure; its model_type set == the slice `ModelType` Literal (tested).
+- [ ] `family` derives from `forecasting.feature_metadata.model_family_for` (lazy import); values lowercase.
+- [ ] `requires_extra`/`feature_aware`/`supports_auto_predict` flags verified against forecasting's predict-reject set.
+- [ ] No new strict request model; strict-mode policy test green; no migration; no new mutation/agent surface.
+- [ ] `/visualize/champion` route + Visualize nav entry render; page lazy-loaded like its siblings.
+- [ ] Searchable store/product selects filter client-side (no new npm dep); secondary descriptor line shown.
+- [ ] Availability auto-fetches for a valid pair; ready/limited/unusable + metrics + recommended split; empty
+      state for unusable/empty; null promotion_days renders "—".
+- [ ] Settings form mirrors SplitConfig bounds and keeps split_config.horizon === forecast_horizon.
+- [ ] Candidate picker sourced from the catalog; default five pre-selected; opt-in extras flagged; cap 10.
+- [ ] "Run comparison" CTA present but disabled; Slice A makes NO `POST /run` (or any mutation) call.
+- [ ] All Level-4 gates pass; `gh issue view <N>` confirms the tracking issue is open.
+- [ ] `git diff --stat` shows no whole-file CRLF noise; `docker-compose.lan.yml` NOT staged.
+
+## Anti-Patterns to Avoid
+
+- ❌ Don't implement Slice B (the comparison run, progress/cancel, ranking table, charts) or Slice C
+  (train/predict/business summary/manual override/promotion) — Slice A is selection + capability + availability ONLY.
+- ❌ Don't call `POST /model-selection/run` or any `/{selection_id}*` endpoint from Slice A.
+- ❌ Don't add a backend endpoint outside the `/model-selection` namespace, and don't put the catalog in the
+  forecasting slice (it stays slice-local — Option 1).
+- ❌ Don't re-derive the model catalog in TypeScript or refactor/delete the existing `model-type-utils.ts`
+  (other pages still use it). The champion page consumes the backend catalog.
+- ❌ Don't add `cmdk`/a combobox dependency — build the searchable select from existing Popover+Input+list.
+- ❌ Don't declare `GET /models` after `GET /{selection_id}` (it would be captured as a selection_id).
+- ❌ Don't hardcode store_id=1/product_id=1 in tests or probes (IDs aren't 1-based).
+- ❌ Don't call `crypto.randomUUID()` client-side (LAN secure-context crash); selection_id is backend-owned.
+- ❌ Don't add a new strict request model with date fields without `Field(strict=False)` (none is needed here).
+- ❌ Don't auto-overwrite a user-edited split config with the recommended one — offer a "Use recommended" button.
+
+## Confidence Score
+
+**8.5/10** for one-pass implementation success. The backend foundation is merged and its contract is read
+verbatim; every frontend convention (routing, nav, lazy page, query hooks, hook/component test harness, common
+components, available shadcn primitives) is verified against live files; the one new backend endpoint is a small
+pure-catalog read with a precise route-ordering rule and verification one-liners for the only data-shape risks
+(`default_params`, the `feature_aware` set). Residual risk (the 1.5): (a) the searchable-select UX is hand-built
+from primitives (no combobox to mirror), so its tests need care; (b) the Slice-A/Slice-B boundary on the disabled
+"Run comparison" CTA must be respected to avoid scope bleed; (c) this is the first frontend slice in this
+workflow, so the `react-refresh/only-export-components` lint rule (keep constants in `copy.ts`, components in
+`.tsx`) and CRLF noise are the most likely friction points — both are called out explicitly above.
diff --git a/PRPs/forecast-champion-selector-slice-b-async-comparison-results.md b/PRPs/forecast-champion-selector-slice-b-async-comparison-results.md
new file mode 100644
index 00000000..dbf03bfd
--- /dev/null
+++ b/PRPs/forecast-champion-selector-slice-b-async-comparison-results.md
@@ -0,0 +1,1010 @@
+name: "Forecast Champion Selector — Slice B: Async Comparison + Results Visualization"
+description: |
+  Convert the synchronous champion-comparison into a real DB-backed long-running
+  operation (LRO) and build the results-visualization half of the UI. Adds an
+  async submit endpoint (202 + Location/Retry-After/monitor_url/cancel_url), a
+  polling read with live per-candidate progress, cooperative honest cancellation,
+  a new per-candidate execution table, and the frontend progress panel + ranking
+  table + winner card + comparison charts + model detail drawer + partial-state
+  handling. Slice B STOPS before final-model decisioning: it does NOT train the
+  winner, generate a forecast, render a business summary beyond the existing
+  deterministic `business_summary`, do manual winner override, or promote/register
+  a champion — those are Slice C.
+
+**Created:** 2026-06-01 · **Slice:** B of 3 (A → B → C)
+**Current repo base observed:** `dev` @ `6c3f8d4` (Merge PR #354 — `model_selection` backend merged)
+**Backend foundation (source of truth):** `PRPs/forecast-champion-selector-backend.md` (issue #353, MERGED) +
+the live slice `app/features/model_selection/` (schemas/service/routes/ranking/explanations/models verified 2026-06-01).
+**Slice A (FIXED upstream dependency):** `PRPs/forecast-champion-selector-slice-a-selection-capability.md` —
+owns `/visualize/champion` page, `hooks/use-model-selection.ts`, `types/api.ts` "Model Selection" section,
+`components/champion-selector/*`, the `GET /model-selection/models` catalog, and the assembled
+`ModelSelectionRunRequest`. Slice B EXTENDS these; it MUST NOT redefine Slice A contracts.
+**Async precedent (source of truth):** `app/features/batch/` (runner/routes/models/service) +
+`PRPs/ai_docs/asyncio-taskgroup-cancellation.md` (the repo's own, runtime-verified, asyncio LRO doc).
+**Working-tree caveat:** `docker-compose.lan.yml` is an untracked local dogfood override; do NOT commit it.
+**Tracking issue:** create before implementation, suggested title
+`feat(api,db,ui): forecast champion selector slice B — async comparison & results`.
+**Suggested branch:** `feat/champion-selector-slice-b` (off `dev`, per `.claude/rules/branch-naming.md`).
+**Commit scope:** `api` (async endpoints + runner + service), `db` (child table + additive columns migration),
+`ui` (results page/components/hooks/types). One migration. Every commit references the tracking issue.
+
+---
+
+## VALIDATE — What exists vs. what Slice B adds
+
+### Already merged (the foundation Slice B builds on)
+
+- **`POST /model-selection/run` is SYNCHRONOUS and blocking.** `ModelSelectionService.run_selection`
+  (`app/features/model_selection/service.py:211`) loops candidates **sequentially in-process**
+  (`for candidate in request.candidate_models:` :274), runs each `BacktestingService().run_backtest`
+  (:279), ranks (`rank_candidates` :308), builds chart data (`build_chart_data` :370), and flips the
+  single `model_selection_run` row to a terminal status **before the request returns 200**. There is
+  **no progress, no per-candidate status rows, no cancellation**. The `PENDING`/`RUNNING` enum values
+  exist (`models.py:36-40`) but the row is only ever observed in its terminal state by any reader.
+- **Pure logic Slice B REUSES unchanged:** `ranking.rank_candidates` / `ranking.build_chart_data`
+  (`ranking.py:116,250`), `explanations.explain_winner` (`explanations.py`), and the service mappers
+  `_shape_candidate` / `_shape_failed_candidate` / `_forecast_summary` / `_response` (`service.py:468-568`).
+- **The stable contract Slice A's TS types mirror:** `ModelSelectionRunResponse` (`schemas.py:267`),
+  `ModelRankEntry` (:195), `WinnerSummary` (:216), `ChartData` (:225), `RankingResult` (:207),
+  `CandidateResult`+`FoldChart` (:178,169), `PairAvailabilityResponse` (:239).
+- **The proven async LRO pattern lives in `app/features/batch/`** — but in another slice, so it cannot
+  be imported (vertical-slice rule). It is the TEMPLATE Slice B mirrors slice-locally.
+
+### Slice B's gaps to fill
+
+1. **No true async run.** Batch's own `POST` `await`s the run to completion inline
+   (`batch/service.py:178` `await runner.run_batch(...)`; `batch/routes.py:52` returns the *settled*
+   parent) — a 202-shaped but client-blocking call. Slice B needs **fire-and-forget**: POST returns
+   202 *immediately* with `status=running`, the work continues in a detached task, the client polls.
+2. **No per-candidate execution records** — needed for live progress + audit of failed/cancelled candidates.
+3. **No cancellation** — no cooperative cancel, drain, or `cancelled` terminal state.
+4. **No results UI** — no progress panel, ranking table, winner card, comparison charts, detail drawer,
+   or partial-state rendering. Slice A ships only the selection shell with a DISABLED "Run comparison" CTA.
+
+---
+
+## BRAINSTORM / RERANK — Chosen packaging
+
+Three packaging alternatives for the async conversion were scored (user value / repo fit / implementation
+clarity / risk control / dependency isolation, each 1–5; total /25):
+
+| # | Option | User | Repo fit | Clarity | Risk | Isolation | **Total** |
+|---|--------|:----:|:--------:|:-------:|:----:|:---------:|:---------:|
+| **A** | **Fire-and-forget LRO: new `POST /runs` (202, immediate) + `model_selection_candidate` child table + slice-local TaskGroup runner + additive progress on GET + `DELETE` cancel/drain. Reuse all existing pure logic at settle.** | 5 | 5 | 4 | 4 | 5 | **23 ✅** |
+| C | New `/runs` + child table but **sequential** (concurrency=1, plain background task, no Semaphore/TaskGroup) | 3 | 3 | 5 | 5 | 5 | 21 |
+| B | **Convert `/run` in place** to async + reuse the parent's JSONB `candidate_results` for progress (no child table) | 4 | 2 | 3 | 2 | 2 | 13 |
+
+**Chosen: Option A.** It matches the brief exactly (parallel fan-out, true progress, honest cancel,
+rich results), mirrors the merged `batch` precedent (lowest novel-code risk), and keeps the legacy
+synchronous `POST /run` + the entire Slice A contract intact (additive only). Option C is the honest
+fallback — and is **one config away** from A: setting `model_selection_global_max_parallel=1` makes the
+Semaphore degenerate to sequential, so A *subsumes* C with no redesign. Option B is rejected: concurrent
+candidate tasks writing the SAME parent row's `candidate_results` JSONB is a read-modify-write lost-update
+race (the very reason batch uses child rows), and converting `/run` in place mutates a contract Slice A's
+types + the backend tests lock — higher blast radius for no gain.
+
+**One deliberate divergence from batch:** batch `await`s the runner inline; Slice B **detaches** the
+runner via `asyncio.create_task` so POST returns 202 before the work finishes (see LOCKED #2 + Known
+Gotchas). Everything else — the per-child-session runner internals, `CancelHandle` registry, drain→504,
+settle-then-`mark_completed` ordering — is mirrored verbatim.
+
+**Non-goals (Slice C, do NOT build here):** winner train/predict from this run, forecast summary/chart/daily
+table, safety-stock heuristic, manual winner override, champion/alias promotion, user-guide docs,
+end-to-end dogfood of the full journey. Slice B may surface the EXISTING deterministic `business_summary`
+JSONB read-only, but adds no new business-interpretation logic.
+
+---
+
+## Goal
+
+**Feature Goal:** Turn champion comparison into a genuine long-running operation a user can submit, watch
+progress on, cancel, and read rich comparison results from — wired into the Slice A `/visualize/champion`
+page so the previously-disabled "Run comparison" CTA now launches an async run and streams a live progress
+panel that resolves into a ranking table, winner card, comparison charts, and a per-model detail drawer.
+
+**Deliverable:**
+- **Backend:** `POST /model-selection/runs` (202, immediate, fire-and-forget) + `DELETE /model-selection/{selection_id}`
+  (cooperative cancel + drain) + additive progress fields on the existing `GET /model-selection/{selection_id}`;
+  a new `model_selection_candidate` child table + additive `model_selection_run` columns + one Alembic
+  migration; a slice-local `runner.py` (TaskGroup + Semaphore + `CancelHandle` registry, mirror of
+  `batch/runner.py`); new `Settings.model_selection_global_max_parallel` + `model_selection_cancel_drain_timeout_seconds`.
+- **Frontend (extends Slice A):** new mutation/poll hooks in `hooks/use-model-selection.ts`
+  (`useSubmitSelectionRun`, `useSelectionRun` polling, `useCancelSelectionRun`); a results component family
+  under `components/champion-selector/results/` (progress panel, ranking table, winner card, comparison
+  charts, model-detail drawer, partial-state empty/error); the `/visualize/champion` page wires the CTA →
+  submit → poll → results; additive types in the Slice-A `types/api.ts` "Model Selection" section.
+
+**Success Definition:**
+1. `POST /model-selection/runs` (same `ModelSelectionRunRequest` body Slice A assembles) returns **202**
+   within ~tens of ms, with a `selection_id`, `status="running"`, a `Location`/`monitor_url`
+   (`/model-selection/{id}`), a `cancel_url` (`/model-selection/{id}`), and a `Retry-After` header — BEFORE
+   any backtest finishes.
+2. `GET /model-selection/{selection_id}` returns live progress while running (counts + a per-candidate
+   list with `pending|running|completed|failed|cancelled`), and on terminal status returns the SAME
+   `ranking`/`winner`/`chart_data`/`business_summary` shape the legacy sync `/run` produces today.
+3. `DELETE /model-selection/{selection_id}` cooperatively cancels: pending candidates skip, running ones
+   stop at the next safe yield (sklearn/LightGBM mid-fit may finish first — honest), no candidate is left
+   `running` after drain; returns 200 (settled), 404 (missing), 409 (already terminal), or 504 (drain timeout).
+4. The `/visualize/champion` page CTA submits, shows a live progress panel, then renders a ranking table,
+   winner card, WAPE/MAE/sMAPE/bias + fold-stability + actual-vs-predicted charts, a per-model detail
+   drawer, and a clear partial-success / all-failed / cancelled state. Failed candidates stay visible.
+5. All Slice B validation gates pass (backend Level-1..4 incl. migration up/down + integration; frontend
+   `tsc`/`lint`/`test`).
+
+## Why
+
+- A multi-fold backtest across up to 10 candidates is genuinely long on a laptop; a blocking request gives
+  no feedback and cannot be stopped. Users need progress and an honest cancel.
+- The brief mandates a **true DB-backed LRO** (not FastAPI BackgroundTasks for heavy fits) with cooperative
+  cancellation and **one AsyncSession per concurrent candidate** — the batch slice already proves this on
+  this exact host/runtime, so Slice B inherits a de-risked pattern.
+- Slice A delivered the configuration half; Slice B delivers the *answer* half (which model won, by how
+  much, how stable across folds) — the payoff that makes the selector worth using.
+- Keeps the single-host architecture: no queue, no broker, no cloud SDK — just asyncio + Postgres.
+
+## What
+
+### New / changed endpoints (all under the existing `APIRouter(prefix="/model-selection")`)
+
+```http
+POST   /model-selection/runs            # NEW — async submit, 202 immediate, fire-and-forget
+GET    /model-selection/{selection_id}  # EXISTING — additive progress fields (no breaking change)
+DELETE /model-selection/{selection_id}  # NEW — cooperative cancel + drain
+# UNCHANGED & KEPT: GET /availability, GET /models (Slice A), POST /run (legacy sync), GET /{id}/ranking
+# Slice C owns: POST /{id}/train-winner, POST /{id}/predict (already present; Slice B does NOT call them)
+```
+
+`POST /model-selection/runs` 202 response (additive superset of `ModelSelectionRunResponse`):
+
+```json
+{
+  "selection_id": "9f3c…",
+  "status": "running",
+  "store_id": 5, "product_id": 8,
+  "monitor_url": "/model-selection/9f3c…",
+  "cancel_url": "/model-selection/9f3c…",
+  "progress": { "total": 5, "pending": 5, "running": 0, "completed": 0, "failed": 0, "cancelled": 0 },
+  "candidate_progress": [
+    { "candidate_id": "a1…", "model_type": "naive", "status": "pending", "ordinal": 0,
+      "error": null, "started_at": null, "completed_at": null, "duration_ms": null }
+  ],
+  "ranking": [], "winner": null, "chart_data": null, "business_summary": null,
+  "created_at": "…", "started_at": "…", "completed_at": null
+}
+```
+Headers: `Location: /model-selection/9f3c…`, `Retry-After: 2`.
+
+### LOCKED Slice-B decisions
+
+1. **New async endpoint is `POST /model-selection/runs`** (plural), distinct from the legacy synchronous
+   `POST /run` (singular), which is **kept unchanged** (existing tests + Slice A's typed `/run` notes
+   remain valid). The request body is the EXISTING `ModelSelectionRunRequest` verbatim (Slice A already
+   assembles it). Declare `/runs` BEFORE `GET /{selection_id}` is irrelevant for method collision (POST vs
+   GET), but for consistency declare all literal routes before path-param routes.
+   **Note:** the UI calls `POST /runs` (async); after Slice B the legacy `POST /run` (sync) has **no frontend
+   caller** — it is retained only for back-compat + the merged backend tests. Do NOT wire `/run` into the
+   frontend (and do NOT delete it).
+2. **Fire-and-forget, NOT await-inline.** The `POST /runs` handler: (a) inserts the parent (`status=running`,
+   `started_at=now`) + N `model_selection_candidate` child rows (`status=pending`) using the REQUEST session
+   and commits; (b) launches the worker as a **detached** `asyncio.create_task`, holding a reference (GC
+   foot-gun — see Gotchas); (c) returns 202 immediately. The worker uses its OWN sessions via
+   `get_session_maker()` (`app/core/database.py:33`) — NEVER the request `db` (it closes when the request
+   returns). This is the ONE divergence from `batch/service.py:178` (which `await`s inline).
+3. **Per-candidate execution rows, never JSONB-in-parent for progress.** Each candidate is a
+   `model_selection_candidate` row carrying `status`, `result` (the full `CandidateResult` JSONB incl.
+   folds, written on success), `error_message`/`error_type`, `started_at`/`completed_at`/`duration_ms`,
+   `ordinal`. Concurrent tasks write their OWN child rows in their OWN sessions — no shared-row write race
+   (the reason Option B was rejected). Live progress on GET is a `GROUP BY status` over children (race-free);
+   final counts are cached on the parent at settle.
+4. **Bounded parallel via a slice-local runner.** `app/features/model_selection/runner.py` mirrors
+   `app/features/batch/runner.py`: a module-level `_ACTIVE_SELECTIONS: dict[str, CancelHandle]` registry,
+   `asyncio.TaskGroup` + `asyncio.Semaphore(min(req-cap, global-cap))`, one `AsyncSession` per child from
+   the shared `session_maker`, fast-cancel checks before/after the semaphore + a `CancelledError` branch.
+   Concurrency cap = `Settings.model_selection_global_max_parallel` (default 4; setting it to 1 ⇒ sequential
+   = Option C). Do NOT import the batch runner (cross-slice rule) — mirror it. (Follow-up issue: promote the
+   shared runner to `app/shared/` so batch + model_selection dedupe — out of scope for B.)
+5. **Honest cooperative cancellation + drain.** `DELETE /{selection_id}`: 404 if missing, 409 if already
+   terminal, else set the `CancelHandle.cancel_event` + `task.cancel()` each child, `await_drain` up to
+   `Settings.model_selection_cancel_drain_timeout_seconds` (default 30) → 200 settled or **504** on timeout.
+   sklearn/LightGBM fits are uncancellable mid-call — an in-flight candidate may COMPLETE before observing
+   cancel; that is acceptable and must be surfaced honestly (the candidate ends `completed`, not `cancelled`).
+   The invariant: **no candidate row left in `running` after settle**. (See `asyncio-taskgroup-cancellation.md`
+   § "sklearn / LightGBM ignore CancelledError mid-fit".)
+6. **`cancelled` is an ADDITIVE status** (not a redefinition). Add `CANCELLED = "cancelled"` to
+   `ModelSelectionStatus`, extend the `model_selection_run` status CheckConstraint, extend the response
+   `SelectionStatusLiteral`, and (frontend) add `'cancelled'` to the Slice-A TS `SelectionStatus` union.
+   The child status enum is `pending|running|completed|failed|cancelled`. Terminal-status rule at settle
+   (mirror `batch/service.py:_settle`): all-cancelled-and-none-ran ⇒ `cancelled`; ≥1 completed & ≥1
+   failed/cancelled ⇒ `partial`; all completed ⇒ `completed`; all failed (and none completed) ⇒ `failed`.
+7. **Ranking/chart/business computed ONCE at settle, reusing existing pure logic.** When all children are
+   terminal, the worker loads each child's `result` JSONB → `list[CandidateResult]` (cancelled children →
+   an excluded entry, mirroring `_shape_failed_candidate` with `error="cancelled"`), then calls the
+   UNCHANGED `rank_candidates(...)`, `build_chart_data(...)`, `explain_winner(...)` and persists
+   `ranking_result` / `chart_data` / `winner_*` / `business_summary` into the SAME JSONB columns the sync
+   path uses — so the terminal GET response is byte-compatible with today's `/run`.
+8. **Slice B does NOT train, predict, override, or promote.** `auto_train_winner` / `auto_predict` on the
+   request are treated as **no-ops** by the `/runs` worker (comparison + ranking only). The existing
+   `POST /{id}/train-winner` + `POST /{id}/predict` endpoints stay as-is; Slice C wires the UI for them.
+   Slice B's results UI may show the deterministic `business_summary` read-only but adds no new
+   interpretation, no safety stock, no manual winner override.
+   **Coordination (ownership of "Explain Winner"):** `business_summary` is computed ONCE by the backend
+   (`explanations.explain_winner`, unchanged). Slice B's winner-card renders it read-only (headline /
+   confidence / reasons / `BIAS_EXPLANATION`); Slice C's business-interpretation-panel renders the SAME
+   `business_summary` read-only and ADDS only the decision-layer fields (bias-risk text + labeled safety
+   stock from `decision.py`). Neither slice re-derives explanation text or duplicates the other's panel.
+9. **WAPE stays the default ranking metric; tie-break WAPE → sMAPE → |bias| → MAE is unchanged** (it lives
+   in `ranking.py:96` `_sort_key` — Slice B does not touch ranking math). Bias copy wherever surfaced:
+   *"Positive bias means the model under-forecasts (risk of stockouts); negative bias means it over-forecasts
+   (risk of overstock)."* — reuse the Slice-A `BIAS_EXPLANATION` constant (`components/champion-selector/copy.ts`).
+
+### Success Criteria
+
+- [ ] `POST /model-selection/runs` returns 202 + `Location`/`Retry-After` headers + a `running` body
+      BEFORE any candidate finishes (assert via a slow/mocked backtest in a unit test).
+- [ ] Detached worker uses `get_session_maker()` sessions, never the request `db`; a held task reference
+      prevents GC; the run completes after the response returned.
+- [ ] `model_selection_candidate` rows track per-candidate `pending→running→{completed,failed,cancelled}`;
+      `result` JSONB carries the full `CandidateResult`; failed/cancelled candidates remain visible.
+- [ ] `GET /{selection_id}` returns live `progress` (GROUP BY children) + `candidate_progress` while running,
+      and the existing `ranking`/`winner`/`chart_data`/`business_summary` once terminal.
+- [ ] `DELETE /{selection_id}`: 404/409/200/504 per LOCKED #5; no candidate left `running` after a clean drain.
+- [ ] Concurrency is capped by the Semaphore; one `AsyncSession` per candidate; `global_max_parallel=1`
+      degrades to sequential without code change.
+- [ ] `cancelled` added additively to ORM enum + CheckConstraint + response Literal + TS union; strict-mode
+      policy test stays green (no new strict request model with date fields beyond the existing ones).
+- [ ] Migration creates `model_selection_candidate` + adds `model_selection_run` columns + alters the status
+      CheckConstraint; `downgrade` reverses cleanly on a fresh DB.
+- [ ] `/visualize/champion` CTA → submit → live progress panel → ranking table + winner card + 4 charts +
+      model detail drawer; partial/all-failed/cancelled states render clearly.
+- [ ] Polling stops on terminal status (`refetchInterval` returns false); cancel button confirms via
+      AlertDialog and invalidates the poll query.
+- [ ] All backend Level-1..4 gates + frontend `pnpm tsc --noEmit && pnpm lint && pnpm test --run` pass.
+
+## All Needed Context
+
+### Documentation & References
+
+```yaml
+# Slice / contract source of truth
+- file: PRPs/forecast-champion-selector-backend.md
+  why: Merged backend foundation — LOCKED #1-#7, the /run + /{id} contract, availability semantics,
+       the verified BacktestingService/ForecastingService signatures, strict-mode + migration gotchas.
+       Slice B reuses this verbatim; do NOT re-derive ranking/availability.
+- file: PRPs/forecast-champion-selector-slice-a-selection-capability.md
+  why: FIXED upstream dependency. Slice A owns the page (pages/visualize/champion.tsx), the hook module
+       (hooks/use-model-selection.ts), the types/api.ts "Model Selection" section (the full workflow
+       contract is DECLARED there — Slice B implements the run/poll/cancel behavior, not the types), the
+       champion-selector component family, and the disabled "Run comparison" CTA. Do NOT redefine these.
+- docfile: PRPs/ai_docs/asyncio-taskgroup-cancellation.md
+  why: THE async LRO reference for this repo — runtime-verified on Python 3.12.13. TaskGroup public surface
+       (only create_task), per-task cancel + cooperative event, semaphore-wraps-work (not scheduling),
+       one AsyncSession per child, ContextVar/request-id inheritance, SQLAlchemy pool bound
+       (size 5 + overflow 10 ⇒ global cap ≤ 12 safe), and the sklearn/LightGBM-uncancellable caveat.
+       Cite its verification commands in Known Gotchas.
+- file: PRPs/templates/prp_base.md
+  why: Base PRP template. NOTE — "PRPs/prp-readme.md.md" does NOT exist (`find PRPs -iname '*readme*'`
+       empty on 2026-06-01); both prior champion PRPs record the same finding.
+
+# Backend async precedent to MIRROR (the batch slice — same runtime, merged, proven)
+- file: app/features/batch/runner.py
+  why: THE runner to mirror slice-locally. run_batch(:74) TaskGroup(:187) + Semaphore(:115) +
+       _ACTIVE_BATCHES registry(:71) + CancelHandle(:47, cancel_event/completed_event/tasks); _child(:126)
+       fast-cancel before(:135)/after(:151) acquire + CancelledError branch(:157,179); cancel_batch(:208),
+       await_drain(:236), mark_completed(:270); _mark_cancelled_skipped(:305)/_mark_cancelled_running(:322)/
+       _mark_failed_unexpected(:353). Slice B reproduces this shape with a model_selection registry.
+- file: app/features/batch/service.py
+  why: submit() lifecycle (:88) — insert parent+children+commit(:137), parent→running(:148), get_session_maker
+       (:159), per-child _exec_one opens OWN session(:168), runner.run_batch(:178), finally settle(:191) +
+       mark_completed(:195). CRITICAL DIVERGENCE: batch AWAITS run_batch inline (:178); Slice B detaches it
+       via asyncio.create_task so POST returns 202 first (LOCKED #2). _settle(:387) terminal-status rule + counts.
+- file: app/features/batch/routes.py
+  why: POST returns 202 (:37); DELETE cancel contract (:75) — 200 drained / 404 / 409 terminal / 504 drain
+       timeout, with the cooperative-drain description (:79-88) to reuse near-verbatim. Mirror error mapping.
+- file: app/features/batch/models.py
+  why: Child-table shape to mirror — BatchJobItem (status String + CheckConstraint, JSONB metrics,
+       error_message/error_type, started_at/completed_at/duration_ms, indexes). BatchStatus/BatchItemStatus
+       enums incl. `cancelled`. TimestampMixin first.
+- file: alembic/versions/c1d2e3f40512_create_batch_tables.py
+  why: Migration template — postgresql.JSONB(astext_type=sa.Text()); named CheckConstraint; op.create_index
+       (op.f for single-col unique, explicit name for composite); FK with ondelete="CASCADE"; downgrade drops
+       indexes THEN table. Slice B's migration ALSO alters an existing CheckConstraint (drop+create).
+- file: app/core/database.py
+  why: get_session_maker() (:33) → async_sessionmaker(expire_on_commit=False) — the OUT-OF-REQUEST session
+       factory the detached worker + each child MUST use. get_engine() (:22). get_db (request-scoped) dep.
+- file: app/core/config.py
+  why: Settings(BaseSettings); batch_global_max_parallel=4 (:131), batch_cancel_drain_timeout_seconds=30
+       (:135) — MIRROR with model_selection_global_max_parallel + model_selection_cancel_drain_timeout_seconds
+       (typed attr + literal default; env var = UPPER_SNAKE; add to .env.example + a config test).
+
+# Live model_selection slice (the contract Slice B extends — verified 2026-06-01)
+- file: app/features/model_selection/service.py
+  why: run_selection (:211) is the SYNC body whose internals (per-candidate backtest :279, _shape_candidate
+       :468, rank_candidates :308, build_chart_data :370, explain_winner :316/:371, _response :526) Slice B
+       REUSES inside the async worker + settle. get_selection(:395)/_load(:513)/_response(:526) extend with
+       progress. Lazy cross-slice imports inside methods (:215-219).
+- file: app/features/model_selection/models.py
+  why: ModelSelectionRun + ModelSelectionStatus (:26). ADD CANCELLED enum value; ADD started_at + count
+       columns; ALTER status CheckConstraint (:82) to include 'cancelled'. ADD the new ModelSelectionCandidate ORM.
+- file: app/features/model_selection/schemas.py
+  why: ModelSelectionRunRequest (:118, REUSE as the /runs body), ModelSelectionRunResponse (:267, ADD
+       additive progress fields), SelectionStatusLiteral (:49, ADD 'cancelled'), CandidateResult (:178)/
+       FoldChart (:169) (persisted per-child), ChartData (:225)/ModelRankEntry (:195)/WinnerSummary (:216)
+       (unchanged). ADD SubmitRunResponse (202 superset), CandidateProgress, SelectionProgress.
+- file: app/features/model_selection/routes.py
+  why: APIRouter(prefix="/model-selection") (:38); error mapping ValueError→BadRequestError,
+       SQLAlchemyError→DatabaseError. ADD POST /runs (202) + DELETE /{selection_id}; extend GET /{id}.
+- file: app/features/model_selection/ranking.py
+  why: rank_candidates(:116)/build_chart_data(:250) — REUSE UNCHANGED at settle. Do NOT touch ranking math.
+- file: app/features/model_selection/tests/test_routes.py + test_routes_integration.py + conftest.py + test_service.py
+  why: ASGITransport + AsyncClient + app.dependency_overrides[get_db]; integration fixture (real engine,
+       prefix-scoped teardown in finally). MIRROR for the async route + drain integration tests.
+- file: app/features/batch/tests/  (test_runner.py, test_routes_cancel.py, test_runner_chaos.py)
+  why: Runner unit tests (fake session_maker, monkeypatched DB helpers, semaphore-cap + cancel-skip/running
+       assertions) + the chaos integration test asserting "no row left running after cancel". MIRROR for
+       app/features/model_selection/tests/test_runner.py + a cancel integration test.
+
+# Frontend examples to MIRROR (verified 2026-06-01)
+- file: frontend/src/pages/visualize/batch.tsx
+  why: THE polling/progress page. refetchInterval returns 2000ms while pending|running else false (via
+       use-batches.ts:44-54); TERMINAL check (:125-127); progress Card + StatusBadge + counts (:294-320);
+       per-item Table (:361-411); AlertDialog cancel confirm (:324-351) — pending skip / running-at-safe-yield
+       copy reusable. The champion results UI mirrors this density.
+- file: frontend/src/hooks/use-batches.ts
+  why: useBatch polling hook (:44-54, refetchInterval fn + enabled gate), useSubmitBatch (:13-25) +
+       useCancelBatch (:30-40) useMutation + queryClient.setQueryData/invalidateQueries. MIRROR for
+       useSubmitSelectionRun / useSelectionRun / useCancelSelectionRun in hooks/use-model-selection.ts.
+- file: frontend/src/hooks/use-batches.test.ts
+  why: Hook test harness — vi.stubGlobal('fetch',...), QueryClient wrapper (retry:false), renderHook +
+       act + waitFor, afterEach(vi.unstubAllGlobals()). MIRROR for the new hooks.
+- file: frontend/src/lib/status-utils.ts
+  why: getStatusVariant(status) → success|info|pending|error|warning (covers completed/running/pending/
+       failed/cancelled). Reuse for candidate + run status badges.
+- file: frontend/src/components/common/status-badge.tsx
+  why: StatusBadge variant component (cva). Reuse for run + per-candidate status.
+- file: frontend/src/components/charts/backtest-folds-chart.tsx
+  why: Bar chart of per-fold metrics — props {title, data: FoldMetric[] = {fold,mae,smape,wape,bias},
+       metricKey, height}. ChartContainer + Recharts BarChart; height via inline style (Tailwind JIT drops
+       dynamic h-[Npx]). Use for fold-stability (per-fold WAPE) of the winner/candidates.
+- file: frontend/src/components/charts/multi-series-chart.tsx
+  why: Multi-line chart — props {title, data: Record<string,number|string>[], series: {key,label}[],
+       xAxisKey, height}. ComposedChart; first line solid, rest dashed. Use for winner actual-vs-predicted
+       overlay (series: actual + predicted, x = date).
+- file: frontend/src/components/charts/  (revenue-bar-chart, time-series-chart, kpi-card, backtest-horizon-buckets-chart)
+  why: Reuse a simple Bar chart pattern for WAPE-by-model + bias-by-model (one bar per candidate). Mirror
+       backtest-folds-chart's ChartContainer/ChartConfig + ResizeObserver test stub.
+- file: frontend/src/components/ui/sheet.tsx
+  why: Sheet primitive (side, SheetContent/Header/Title/Description) — the model-detail DRAWER (no existing
+       drawer-usage precedent in pages; this is the first). Trigger on a ranking-row click.
+- file: frontend/src/components/ui/alert-dialog.tsx
+  why: AlertDialog — the cancel-run confirmation (mirror batch.tsx:324-351). Reuse the pending-skip/
+       running-at-safe-yield copy.
+- file: frontend/src/components/data-table/data-table.tsx  AND  frontend/src/pages/visualize/batch.tsx:366-411
+  why: Two table options — TanStack DataTable (sortable/paginated, manualSorting) for the ranking table, OR
+       a plain shadcn Table (batch.tsx) for a short candidate-progress list. Ranking ≤10 rows → plain Table
+       is sufficient; use DataTable only if sortable columns are wanted.
+- file: frontend/src/components/common/{loading-state,error-display}.tsx
+  why: LoadingState / ErrorDisplay / EmptyState — partial/failed/empty states; getErrorMessage (lib/api.ts:94).
+- file: frontend/src/lib/api.ts
+  why: api<T>(endpoint,{method,body,params}) — POST/DELETE/GET; ApiError + getErrorMessage; 204 handling.
+       NOTE: the 202 body is JSON (api<T> parses it); Location/Retry-After headers are not surfaced by api<T>
+       — the frontend uses the body's monitor_url/cancel_url/selection_id, not the headers (LOCKED note).
+- file: frontend/src/lib/constants.ts  +  frontend/src/App.tsx
+  why: ROUTES.VISUALIZE.CHAMPION + NAV_ITEMS + lazy route are ADDED by Slice A. Slice B does NOT add a new
+       route — it extends the existing champion page. (If Slice A is not yet merged at impl time, see
+       "Dependency on Slice A" below.)
+- file: frontend/src/types/api.ts
+  why: Slice A adds the "// === Model Selection (Champion Selector) ===" section with the full workflow
+       contract. Slice B ADDS (additively, same section): SubmitRunResponse, SelectionProgress,
+       CandidateProgress, and 'cancelled' on the SelectionStatus union. Do NOT duplicate Slice A's types.
+- file: frontend/vitest.config.ts
+  why: jsdom; include src/**/*.test.{ts,tsx}; @→./src. Chart tests need a ResizeObserver beforeAll stub
+       (see backtest-horizon-buckets-chart.test.tsx).
+
+# External official docs (with reasoning)
+- url: https://developer.mozilla.org/en-US/docs/Web/HTTP/Reference/Status/202
+  why: 202 Accepted semantics — the response is a promise, not a result; include a status-monitor pointer.
+       Justifies returning 202 + Location/Retry-After + a monitor_url body field for the running selection.
+- url: https://learn.microsoft.com/en-us/rest/api/fabric/articles/long-running-operation
+  why: Canonical async LRO contract — submit → 202 + Location + Retry-After → poll status → terminal. Shapes
+       SubmitRunResponse (monitor_url/cancel_url) + the GET polling response.
+- url: https://fastapi.tiangolo.com/tutorial/background-tasks/
+  why: FastAPI BackgroundTasks runs AFTER the response but is NOT suited to heavy/long CPU-bound fits and
+       offers no cancellation/progress — the brief forbids it for model fits. Justifies asyncio.create_task
+       (detached) + the DB-backed runner instead.
+- url: https://docs.python.org/3.12/library/asyncio-task.html#asyncio.create_task
+  why: "Save a reference to the result of this function, to avoid a task disappearing mid-execution." The
+       GC foot-gun for the detached worker (LOCKED #2) — hold the task ref (in the CancelHandle or a module set).
+- url: https://docs.python.org/3.12/library/asyncio-task.html#asyncio.TaskGroup
+  why: TaskGroup structured concurrency + except* ExceptionGroup — the runner's child fan-out + cancel absorb.
+- url: https://docs.sqlalchemy.org/en/21/orm/extensions/asyncio.html#using-multiple-asyncio-event-loops
+  why: AsyncSession is NOT concurrency-safe to share across tasks — one session per concurrent candidate
+       (the contract's explicit rule; matches batch _exec_one).
+- url: https://docs.aws.amazon.com/forecast/latest/dg/metrics.html
+  why: WAPE/MAPE/RMSE definitions — so the comparison-chart axis labels + tooltips describe each metric
+       correctly (and the bias under/over-forecast copy stays accurate).
+```
+
+### Current Codebase Tree (relevant)
+
+```bash
+app/features/model_selection/        # MERGED backend (issue #353) — SYNC /run today
+├── models.py        # ModelSelectionRun + ModelSelectionStatus  ← ADD CANCELLED, started_at, counts; ADD ModelSelectionCandidate
+├── schemas.py       # request/response contract                 ← ADD SubmitRunResponse, SelectionProgress, CandidateProgress; +'cancelled'
+├── service.py       # ModelSelectionService (sync run_selection) ← ADD submit_run + worker + settle + cancel; extend _response
+├── ranking.py       # rank_candidates / build_chart_data        ← REUSE UNCHANGED
+├── explanations.py  # explain_winner                            ← REUSE UNCHANGED
+├── routes.py        # APIRouter(/model-selection)               ← ADD POST /runs (202), DELETE /{id}; extend GET /{id}
+└── tests/           # conftest + unit + integration             ← ADD test_runner, test_async_routes, extend integration
+app/features/batch/{runner,service,routes,models}.py  # the async LRO TEMPLATE to mirror (do NOT import)
+app/core/{database,config}.py        # get_session_maker; Settings (mirror batch_* keys)
+alembic/versions/                     # head observed 6c3f8d4-era; run `uv run alembic heads` at impl time
+frontend/src/
+├── pages/visualize/champion.tsx      # Slice A page                ← WIRE CTA → submit → poll → results
+├── hooks/use-model-selection.ts      # Slice A catalog/availability ← ADD useSubmitSelectionRun/useSelectionRun/useCancelSelectionRun
+├── types/api.ts                      # Slice A Model Selection sect ← ADD progress/submit types additively
+├── components/champion-selector/     # Slice A selection components ← ADD results/ subfamily
+├── components/charts/{backtest-folds-chart,multi-series-chart}.tsx
+├── components/ui/{sheet,alert-dialog,table,card,badge,progress}.tsx
+└── components/common/{status-badge,loading-state,error-display}.tsx
+```
+
+### Desired Codebase Tree (Slice B additions)
+
+```bash
+# Backend
+app/features/model_selection/runner.py                        # NEW: slice-local TaskGroup+Semaphore runner (mirror batch/runner.py)
+app/features/model_selection/models.py                        # MOD: + ModelSelectionCandidate; +CANCELLED; +started_at/counts; alter CheckConstraint
+app/features/model_selection/schemas.py                       # MOD: + SubmitRunResponse, SelectionProgress, CandidateProgress; +'cancelled' literal
+app/features/model_selection/service.py                       # MOD: + submit_run / _run_in_background / _execute_candidate / _settle / cancel_run; extend _response/get_selection
+app/features/model_selection/routes.py                        # MOD: + POST /runs (202), + DELETE /{id}; extend GET /{id}
+app/core/config.py                                            # MOD: + model_selection_global_max_parallel, model_selection_cancel_drain_timeout_seconds
+.env.example                                                  # MOD: + the two new env vars (UPPER_SNAKE + comment)
+alembic/versions/<rev>_add_model_selection_candidate_and_progress.py   # NEW migration
+app/features/model_selection/tests/test_runner.py            # NEW: runner unit (semaphore cap, cancel skip/running)
+app/features/model_selection/tests/test_async_routes.py      # NEW: 202 immediacy, progress GET, DELETE 404/409/200/504
+app/features/model_selection/tests/test_models.py            # MOD: + ModelSelectionCandidate constraints
+app/features/model_selection/tests/test_schemas.py           # MOD: + progress/submit schema cases
+app/features/model_selection/tests/test_service.py           # MOD: + worker/settle/cancel unit (mock backtest)
+app/features/model_selection/tests/test_routes_integration.py# MOD: + async run + cancel-drain integration (no row left running)
+app/core/tests/test_config.py                                # MOD: + the two new settings defaults (Settings(_env_file=None))
+
+# Frontend (extends Slice A — no new route)
+frontend/src/types/api.ts                                    # MOD: + SubmitRunResponse, SelectionProgress, CandidateProgress; +'cancelled'
+frontend/src/hooks/use-model-selection.ts                    # MOD: + useSubmitSelectionRun, useSelectionRun (poll), useCancelSelectionRun
+frontend/src/hooks/use-model-selection.test.ts               # MOD: + submit/poll/cancel hook tests
+frontend/src/pages/visualize/champion.tsx                    # MOD: CTA enabled → submit → poll → results section
+frontend/src/components/champion-selector/results/run-progress-panel.tsx        # NEW (+ .test.tsx)
+frontend/src/components/champion-selector/results/ranking-table.tsx             # NEW (+ .test.tsx)
+frontend/src/components/champion-selector/results/winner-card.tsx               # NEW (+ .test.tsx)
+frontend/src/components/champion-selector/results/comparison-charts.tsx         # NEW (+ .test.tsx)  (WAPE/bias bars + fold-stability + actual-vs-predicted)
+frontend/src/components/champion-selector/results/model-detail-drawer.tsx       # NEW (+ .test.tsx)  (Sheet)
+frontend/src/components/champion-selector/results/cancel-run-dialog.tsx         # NEW (+ .test.tsx)  (AlertDialog)
+```
+
+### Known Gotchas & VERIFIED Contracts
+
+```python
+# ── FIRE-AND-FORGET vs BATCH'S AWAIT-INLINE (the core divergence — LOCKED #2) ──
+# batch/service.py:178 does `await runner.run_batch(...)` INSIDE the POST handler, so batch's POST blocks
+# to completion and returns the SETTLED parent (batch/routes.py:52). That is a 202-shaped SYNC call —
+# unusable for Slice B's poll/progress/Retry-After brief. Slice B MUST detach:
+#   task = asyncio.create_task(self._run_in_background(selection_id, request_snapshot))
+#   _BACKGROUND_TASKS.add(task); task.add_done_callback(_BACKGROUND_TASKS.discard)   # hold a ref!
+#   return SubmitRunResponse(...)   # 202 immediately
+# GC FOOT-GUN: asyncio only keeps a WEAK ref to the task; without a strong ref it can be GC'd mid-run
+#   (https://docs.python.org/3.12/library/asyncio-task.html#asyncio.create_task). Hold it in a module-level
+#   set (and/or the CancelHandle.tasks). The CancelHandle in _ACTIVE_SELECTIONS also keeps the runner's
+#   child task refs (mirror batch CancelHandle.tasks).
+
+# ── THE DETACHED WORKER MUST NOT USE THE REQUEST SESSION ───────────────────────
+# Depends(get_db) closes when the POST handler returns. The detached worker outlives the request, so EVERY
+# DB touch in _run_in_background / _execute_candidate / _settle opens its OWN session from get_session_maker()
+# (app/core/database.py:33), exactly like batch _exec_one (batch/service.py:168). Sharing the request db = a
+# closed-session error (or worse, a use-after-free of the connection). One AsyncSession per concurrent child.
+
+# ── NO SHARED-ROW WRITE RACE — child rows, atomic where needed ─────────────────
+# Concurrent candidate tasks write their OWN model_selection_candidate rows (per LOCKED #3). NEVER have two
+# tasks read-modify-write the same parent JSONB (Option B's bug). Live progress on GET = a GROUP BY status
+# over children (race-free). If you cache live counts on the parent, use atomic SQL `col = col + 1` UPDATEs
+# (mirror batch _bump_running) — but the SIMPLER, recommended path is: derive counts on read, write FINAL
+# counts only once at settle. Prefer the latter (no live parent writes at all from children).
+
+# ── COOPERATIVE + HONEST CANCEL (LOCKED #5) ───────────────────────────────────
+# Mirror batch/runner.py exactly: fast-cancel check BEFORE sem acquire (skip) + AFTER acquire (skip) +
+# `except asyncio.CancelledError: mark child cancelled_running; raise`. cancel_run() sets cancel_event +
+# task.cancel() per child. await_drain waits CancelHandle.completed_event up to the drain timeout → 504.
+# mark_completed() pops the registry AFTER settle commits (never before — else DELETE's drain races settle).
+# sklearn/LightGBM fits are sync C — uncancellable mid-call: an in-flight candidate may COMPLETE (status
+# completed, not cancelled). That is correct/honest. Invariant: NO candidate left `running` after settle
+# (assert in the chaos integration test, mirror batch/tests/test_runner_chaos.py).
+
+# ── TaskGroup absorbs CancelledError; the runner returns normally ──────────────
+# `async with asyncio.TaskGroup() as tg:` ... `except* asyncio.CancelledError: pass` — cancellation does NOT
+# propagate out of run_selection_candidates; the worker proceeds to settle the parent to its observed state
+# (mirror batch/runner.py:186-205). Verified TaskGroup surface: only `create_task`
+# (PRPs/ai_docs/asyncio-taskgroup-cancellation.md:13-16). Re-verify on upgrade:
+#   uv run python -c "import asyncio; print([m for m in dir(asyncio.TaskGroup) if not m.startswith('_')])"  # ['create_task']
+
+# ── CONCURRENCY CAP / POOL BOUND ──────────────────────────────────────────────
+# effective = min(req.split-derived cap?, Settings.model_selection_global_max_parallel). There is NO per-run
+# max_parallel field on ModelSelectionRunRequest (Slice A did not add one) — use the GLOBAL setting as the
+# cap (a future PRP may add a per-run field). SQLAlchemy pool default size 5 + overflow 10 ⇒ keep the global
+# cap ≤ 12 (asyncio-taskgroup-cancellation.md:170-191). Default 4 is safe. Verify pool:
+#   uv run python -c "from sqlalchemy.ext.asyncio import create_async_engine; e=create_async_engine('postgresql+asyncpg://x:x@h:5433/x'); print(e.pool.size(), e.pool._max_overflow)"  # 5 10
+
+# ── ADDITIVE 'cancelled' STATUS (LOCKED #6) ───────────────────────────────────
+# Add CANCELLED='cancelled' to ModelSelectionStatus; the migration must DROP+CREATE the named CheckConstraint
+# ck_model_selection_run_valid_status to include 'cancelled' (forward-only). Extend SelectionStatusLiteral
+# (schemas.py:49) and the TS SelectionStatus union. The child status enum literal is
+# pending|running|completed|failed|cancelled with its own CheckConstraint on model_selection_candidate.
+
+# ── REUSE THE PURE LOGIC AT SETTLE (LOCKED #7) ────────────────────────────────
+# Do NOT rewrite ranking/chart/business. At settle: load children, build list[CandidateResult]
+#   (success child → CandidateResult.model_validate(child.result); cancelled child → an excluded result with
+#    failed=True, error="cancelled"; failed child → failed=True, error=child.error_message), then call the
+# UNCHANGED rank_candidates(results, policy, ranking_metric, availability.status), build_chart_data(results,
+# ranking), explain_winner(ranking, availability). Persist into the SAME JSONB columns the sync path writes
+# so terminal GET output is byte-compatible (service.py:307-389 is the reference for which columns).
+
+# ── ROUTE ORDERING / METHOD COLLISION ─────────────────────────────────────────
+# POST /runs (literal) vs GET/DELETE /{selection_id} (path-param) are different METHODS — no Starlette
+# collision. Still, declare literal routes before path-param routes for consistency (mirror /availability
+# before /{selection_id}). DELETE /{selection_id} is a NEW method on the existing path-param.
+
+# ── STRICT-MODE POLICY (unchanged) ────────────────────────────────────────────
+# No NEW strict request model with date fields is added (the /runs body is the EXISTING
+# ModelSelectionRunRequest). SubmitRunResponse/SelectionProgress/CandidateProgress are RESPONSE models
+# (plain BaseModel — no strict). app/core/tests/test_strict_mode_policy.py stays green.
+
+# ── VERIFIED INTERNAL SIGNATURES (from the merged backend, do NOT re-derive) ──
+# BacktestingService().run_backtest(db, store_id, product_id, start_date, end_date, BacktestConfig(...))
+#   -> BacktestResponse  (service.py:279 call site; LOCKED #4 in backend PRP: include_baselines=False,
+#   store_fold_details=True). _shape_candidate(candidate, backtest) -> CandidateResult (service.py:468).
+# TypeAdapter(ModelConfig).validate_python({"model_type": c.model_type, **c.params}) — FLATTEN params
+#   (service.py:276). lightgbm/xgboost may ImportError → that candidate becomes failed (caught per-candidate).
+```
+
+```typescript
+// ── FRONTEND ────────────────────────────────────────────────────────────────
+// POLLING: useSelectionRun(selectionId) mirrors useBatch (use-batches.ts:44-54):
+//   refetchInterval: (q) => { const s = q.state.data?.status; return s==='running'||s==='pending' ? 2000 : false }
+//   enabled: !!selectionId. A TERMINAL_SELECTION_STATES set = {completed,failed,partial,cancelled}.
+// SUBMIT: useSubmitSelectionRun -> api<SubmitRunResponse>('/model-selection/runs',{method:'POST',body:req}).
+//   onSuccess: setQueryData(['model-selection','run', data.selection_id], data) so polling starts warm.
+// CANCEL: useCancelSelectionRun -> api(`/model-selection/${id}`,{method:'DELETE'}); onSuccess invalidate the
+//   run query. Confirm via AlertDialog (mirror batch.tsx:324-351) — reuse the pending-skip/running-yield copy.
+// api<T> (lib/api.ts) parses the JSON body but does NOT expose Location/Retry-After headers — drive the UI
+//   from the body's selection_id/monitor_url/cancel_url, NOT the headers.
+// selection_id is BACKEND-generated — never crypto.randomUUID() client-side (memory:
+//   showcase-crypto-randomuuid-lan-crash — undefined over LAN HTTP). Dogfood over http://localhost:5173.
+// CHARTS need a ResizeObserver beforeAll stub in jsdom (backtest-horizon-buckets-chart.test.tsx pattern);
+//   pass height via inline style (Tailwind JIT drops dynamic h-[Npx]).
+// react-refresh/only-export-components: keep non-component constants (TERMINAL_SELECTION_STATES) in a .ts
+//   file (reuse Slice A's copy.ts or a results/constants.ts), not exported from a .tsx component.
+// Mixed CRLF/LF repo-wide (memory: repo-line-endings-crlf) — `git diff --stat` before committing; new files LF.
+// IDs are NOT 1-based (memory: seeder-does-not-reset-id-sequences) — never hardcode store_id=1/product_id=1.
+```
+
+## Implementation Blueprint
+
+### Backend data models
+
+`app/features/model_selection/models.py` — additions:
+
+```python
+# ModelSelectionStatus: ADD  CANCELLED = "cancelled"
+# ModelSelectionRun: ADD
+#   started_at: Mapped[datetime | None] = mapped_column(DateTime(timezone=True), nullable=True)
+#   total_candidates / completed_candidates / failed_candidates / cancelled_candidates: Mapped[int]
+#     = mapped_column(Integer, default=0, server_default="0")   # FINAL counts cached at settle
+#   ALTER __table_args__ CheckConstraint to: status IN ('pending','running','completed','partial','failed','cancelled')
+
+class CandidateStatus(str, Enum):
+    PENDING = "pending"; RUNNING = "running"; COMPLETED = "completed"
+    FAILED = "failed"; CANCELLED = "cancelled"
+
+class ModelSelectionCandidate(TimestampMixin, Base):
+    __tablename__ = "model_selection_candidate"
+    id: Mapped[int] = mapped_column(Integer, primary_key=True)
+    candidate_id: Mapped[str] = mapped_column(String(32), unique=True, index=True)
+    selection_id: Mapped[str] = mapped_column(
+        String(32), ForeignKey("model_selection_run.selection_id", ondelete="CASCADE"), index=True)
+    ordinal: Mapped[int] = mapped_column(Integer)          # submit order, stable display
+    model_type: Mapped[str] = mapped_column(String(40))
+    params: Mapped[dict[str, Any]] = mapped_column(JSONB)
+    status: Mapped[str] = mapped_column(String(20), default=CandidateStatus.PENDING.value, index=True)
+    result: Mapped[dict[str, Any] | None] = mapped_column(JSONB, nullable=True)   # full CandidateResult on success
+    error_message: Mapped[str | None] = mapped_column(String(2000), nullable=True)
+    error_type: Mapped[str | None] = mapped_column(String(100), nullable=True)
+    started_at: Mapped[datetime | None] = mapped_column(DateTime(timezone=True), nullable=True)
+    completed_at: Mapped[datetime | None] = mapped_column(DateTime(timezone=True), nullable=True)
+    duration_ms: Mapped[int | None] = mapped_column(Integer, nullable=True)
+    __table_args__ = (
+        CheckConstraint("status IN ('pending','running','completed','failed','cancelled')",
+                        name="ck_model_selection_candidate_valid_status"),
+        Index("ix_model_selection_candidate_selection_status", "selection_id", "status"),
+    )
+```
+
+`app/features/model_selection/schemas.py` — additive response models (plain BaseModel):
+
+```python
+class CandidateProgress(BaseModel):
+    candidate_id: str; ordinal: int; model_type: str
+    status: Literal["pending","running","completed","failed","cancelled"]
+    error: str | None = None
+    started_at: datetime | None = None
+    completed_at: datetime | None = None
+    duration_ms: int | None = None
+
+class SelectionProgress(BaseModel):
+    total: int; pending: int; running: int; completed: int; failed: int; cancelled: int
+
+# ADD 'cancelled' to SelectionStatusLiteral (line 49).
+# EXTEND ModelSelectionRunResponse additively:
+#   started_at: datetime | None
+#   progress: SelectionProgress | None
+#   candidate_progress: list[CandidateProgress]   (default_factory=list)
+
+class SubmitRunResponse(ModelSelectionRunResponse):  # 202 superset
+    monitor_url: str
+    cancel_url: str
+```
+
+### Backend runner (`app/features/model_selection/runner.py`)
+
+```python
+# MIRROR app/features/batch/runner.py 1:1, renaming batch→selection:
+#   _ACTIVE_SELECTIONS: dict[str, CancelHandle]
+#   @dataclass CancelHandle(cancel_event, completed_event, tasks)
+#   async def run_selection_candidates(*, selection_id, candidate_ids, max_parallel, global_max_parallel,
+#                                      session_maker, execute_candidate) -> int
+#     effective = min(max_parallel, global_max_parallel); sem = Semaphore(effective)
+#     handle = _ACTIVE_SELECTIONS.setdefault(selection_id, CancelHandle())
+#     async def _child(cid):
+#         async with session_maker() as session:
+#             if handle.cancel_event.is_set(): await _mark_cancelled_skipped(session, cid); return
+#             acquired=False
+#             try:
+#                 async with sem:
+#                     acquired=True
+#                     if handle.cancel_event.is_set(): await _mark_cancelled_skipped(session, cid); return
+#                     try: await execute_candidate(cid)
+#                     except asyncio.CancelledError: await _mark_cancelled_running(session, cid); raise
+#                     except Exception: await _mark_failed_unexpected(session, cid)   # do NOT re-raise (don't kill siblings)
+#             except asyncio.CancelledError:
+#                 if not acquired: await _mark_cancelled_skipped(session, cid)
+#                 raise
+#     try:
+#         async with asyncio.TaskGroup() as tg:
+#             for cid in candidate_ids:
+#                 handle.tasks.append(tg.create_task(_child(cid), name=f"model_selection:{selection_id}:{cid}"))
+#     except* asyncio.CancelledError: pass
+#     return effective
+#   def cancel_selection(selection_id) -> bool   # set cancel_event + task.cancel() each; False if not registered
+#   async def await_drain(selection_id, timeout_seconds) -> bool   # wait completed_event; mirror batch
+#   def mark_completed(selection_id) -> None      # set completed_event + pop registry (AFTER settle)
+#   helpers _mark_cancelled_skipped/_mark_cancelled_running/_mark_failed_unexpected — UPDATE the candidate row
+#     status + completed_at + duration_ms in the child's own session (mirror batch helpers).
+# The runner does NOT bump parent counters (counts derived on read; final counts at settle).
+```
+
+### Backend service (`app/features/model_selection/service.py`)
+
+```python
+# ADD (sync run_selection stays for legacy POST /run):
+async def submit_run(self, db, request) -> SubmitRunResponse:
+    # 1) availability gate (REUSE get_availability). If unusable → persist failed row, raise BadRequestError (LOCKED #2 parity).
+    # 2) insert parent (status=running, started_at=now, total_candidates=N, snapshots) + N ModelSelectionCandidate
+    #    rows (status=pending, ordinal=i) using REQUEST db; await db.commit().
+    # 3) snapshot the request into a plain dict / re-validated request (the worker must NOT close over the
+    #    request session). Launch detached:
+    #        task = asyncio.create_task(self._run_in_background(selection_id))
+    #        _BACKGROUND_TASKS.add(task); task.add_done_callback(_BACKGROUND_TASKS.discard)
+    # 4) re-read the parent (or build from known fields) and return SubmitRunResponse(..., status="running",
+    #    monitor_url=f"/model-selection/{sid}", cancel_url=f"/model-selection/{sid}", progress=all-pending).
+
+async def _run_in_background(self, selection_id) -> None:
+    session_maker = get_session_maker()
+    # load parent + children + the persisted request snapshot via a fresh session.
+    async def _exec(cid):
+        async with session_maker() as s:
+            cand = await s.scalar(select(ModelSelectionCandidate).where(...candidate_id==cid))
+            cand.status = RUNNING; cand.started_at = now; await s.commit()
+            try:
+                cfg = TypeAdapter(ModelConfig).validate_python({"model_type": cand.model_type, **cand.params})  # lazy import
+                bt = await BacktestingService().run_backtest(s, store_id, product_id, start, end,
+                         BacktestConfig(split_config=..., model_config_main=cfg, include_baselines=False, store_fold_details=True))
+                result = self._shape_candidate(CandidateModelConfig(model_type=cand.model_type, params=cand.params), bt)
+                cand.result = result.model_dump(mode="json"); cand.status = COMPLETED
+            except Exception as exc:
+                cand.status = FAILED; cand.error_message = str(exc)[:2000]; cand.error_type = type(exc).__name__
+            cand.completed_at = now; cand.duration_ms = ...; await s.commit()
+    try:
+        await runner.run_selection_candidates(selection_id=selection_id, candidate_ids=[...],
+            max_parallel=self.settings.model_selection_global_max_parallel,
+            global_max_parallel=self.settings.model_selection_global_max_parallel,
+            session_maker=session_maker, execute_candidate=_exec)
+    finally:
+        await self._settle(selection_id, session_maker)     # ranking/chart/business + terminal status + counts
+        runner.mark_completed(selection_id)
+
+async def _settle(self, selection_id, session_maker) -> None:
+    async with session_maker() as s:
+        # load parent + all children; build list[CandidateResult] (LOCKED #7 mapping);
+        # availability = PairAvailabilityResponse.model_validate(parent.availability_snapshot)
+        # ranking = rank_candidates(results, policy_from_snapshot, parent.ranking_metric, availability.status)
+        # if ranking.winner: chart = build_chart_data(results, ranking); winner_* set
+        # business = explain_winner(ranking, availability)
+        # counts from children; terminal status per LOCKED #6 rule; completed_at=now; commit.
+
+async def cancel_run(self, db, selection_id) -> ModelSelectionRunResponse:
+    # load parent (404). If status terminal → ConflictError (409). 
+    # fired = runner.cancel_selection(selection_id); if not fired → ConflictError (race: settled). 
+    # drained = await runner.await_drain(selection_id, self.settings.model_selection_cancel_drain_timeout_seconds)
+    # if not drained → GatewayTimeoutError (504). reload + return _response.
+
+# EXTEND get_selection/_response to attach progress:
+#   progress = SelectionProgress(**counts_from_groupby_or_cached); candidate_progress = [CandidateProgress(...) per child]
+#   (a run created by the legacy sync /run has NO children → progress=None, candidate_progress=[]).
+```
+
+`app/core/exceptions.py` already provides `ConflictError` (409, :130) and `GatewayTimeoutError` (504, :203);
+`batch/routes.py:18` imports both for its DELETE drain. Reuse those exact classes — no new exception needed.
+
+### Backend routes (`app/features/model_selection/routes.py`)
+
+```python
+@router.post("/runs", response_model=SubmitRunResponse, status_code=status.HTTP_202_ACCEPTED)
+async def submit_run(request: ModelSelectionRunRequest, response: Response, db = Depends(get_db)):
+    service = ModelSelectionService()
+    try:
+        result = await service.submit_run(db, request)
+        response.headers["Location"] = result.monitor_url
+        response.headers["Retry-After"] = "2"
+        return result
+    except ValueError as exc: raise BadRequestError(message=str(exc)) from exc
+    except SQLAlchemyError as exc: raise DatabaseError(message="Failed to submit selection run", details={"error": str(exc)}) from exc
+
+@router.delete("/{selection_id}", response_model=ModelSelectionRunResponse, status_code=200,
+               description="Cooperative cancel + drain. 200 settled / 404 missing / 409 terminal / 504 drain timeout.")
+async def cancel_run(selection_id: str, db = Depends(get_db)):
+    service = ModelSelectionService()
+    try: return await service.cancel_run(db, selection_id)
+    except SQLAlchemyError as exc: raise DatabaseError(message="Failed to cancel selection run", details={"error": str(exc)}) from exc
+    # NotFoundError(404)/ConflictError(409)/GatewayTimeoutError(504) raised in-service bubble to the global handler.
+# GET /{selection_id} unchanged signature — service now attaches progress.
+```
+
+### Implementation Tasks (dependency-ordered)
+
+```yaml
+# ───────────────────────── BACKEND ─────────────────────────
+Task 1 — Config:
+  MODIFY app/core/config.py: ADD model_selection_global_max_parallel: int = 4 ;
+    model_selection_cancel_drain_timeout_seconds: int = 30  (mirror batch_* placement/typing).
+  MODIFY .env.example: ADD MODEL_SELECTION_GLOBAL_MAX_PARALLEL / MODEL_SELECTION_CANCEL_DRAIN_TIMEOUT_SECONDS (+comments).
+  MODIFY app/core/tests/test_config.py: assert the two defaults via Settings(_env_file=None).
+
+Task 2 — ORM + migration:
+  MODIFY app/features/model_selection/models.py: +CANCELLED enum; +started_at/count columns on ModelSelectionRun;
+    ALTER status CheckConstraint to include 'cancelled'; +ModelSelectionCandidate + CandidateStatus (blueprint).
+  RUN: uv run alembic heads   # chain down_revision to the LIVE head
+  CREATE alembic/versions/<rev>_add_model_selection_candidate_and_progress.py:
+    - create_table model_selection_candidate (mirror c1d2e3f40512 JSONB/index/FK ondelete=CASCADE style)
+    - add_column started_at + the four count columns to model_selection_run (server_default "0" / NULL)
+    - DROP+CREATE ck_model_selection_run_valid_status to include 'cancelled'
+    - downgrade(): reverse (recreate old constraint, drop columns, drop indexes+table)
+  MODIFY tests/test_models.py: candidate constraint + CRUD; run status accepts 'cancelled'.
+
+Task 3 — Schemas:
+  MODIFY app/features/model_selection/schemas.py: +'cancelled' on SelectionStatusLiteral; +CandidateProgress,
+    SelectionProgress; EXTEND ModelSelectionRunResponse (started_at/progress/candidate_progress, all additive
+    with safe defaults); +SubmitRunResponse(ModelSelectionRunResponse){monitor_url, cancel_url}.
+  MODIFY tests/test_schemas.py: progress/submit models validate; existing-response back-compat (defaults).
+
+Task 4 — Runner (pure-ish concurrency module):
+  CREATE app/features/model_selection/runner.py: MIRROR batch/runner.py (registry, CancelHandle,
+    run_selection_candidates, cancel_selection, await_drain, mark_completed, the 3 mark_* helpers).
+  CREATE tests/test_runner.py: MIRROR batch/tests/test_runner.py — semaphore caps concurrency (peak==effective),
+    cancel-before-start → skipped, cancel-mid-flight → cancelled_running; fake session_maker + monkeypatched
+    DB helpers (NO real DB; not @integration).
+
+Task 5 — Service:
+  MODIFY app/features/model_selection/service.py: ADD submit_run, _run_in_background, _execute_candidate (inline
+    _exec), _settle, cancel_run; module-level _BACKGROUND_TASKS set; EXTEND get_selection/_response with progress.
+    REUSE _shape_candidate/rank_candidates/build_chart_data/explain_winner UNCHANGED. Lazy import services + runner.
+  MODIFY tests/test_service.py: mock BacktestingService (patch the lazy target); assert submit_run returns
+    running+children pending; worker settles completed/partial/failed; cancel mapping; all reuse the pure logic.
+
+Task 6 — Routes:
+  MODIFY app/features/model_selection/routes.py: ADD POST /runs (202 + Location/Retry-After) + DELETE /{id}
+    (404/409/200/504); GET /{id} now carries progress (no signature change). Mirror error mapping.
+  CREATE tests/test_async_routes.py: 202 immediacy (mock backtest to block; assert response returns first +
+    status 'running' + Location header + body monitor_url/cancel_url); GET shows progress; DELETE 404/409/200.
+
+Task 7 — Integration:
+  MODIFY tests/test_routes_integration.py (@pytest.mark.integration, real engine, prefix-scoped teardown):
+    - submit /runs → poll GET until terminal → ranking/winner present; failed candidate stays visible.
+    - cancel mid-flight → no model_selection_candidate left status='running' after drain (mirror
+      batch/tests/test_runner_chaos.py); 504 path optional (hard to force deterministically — document, may skip).
+
+# ───────────────────────── FRONTEND (extends Slice A) ─────────────────────────
+Task 8 — Types:
+  MODIFY frontend/src/types/api.ts (Model Selection section): +SubmitRunResponse, SelectionProgress,
+    CandidateProgress; +'cancelled' on the SelectionStatus union; ADD TERMINAL_SELECTION_STATES set in a .ts
+    (results/constants.ts) NOT a component file. Do NOT redefine Slice A's types.
+
+Task 9 — Hooks:
+  MODIFY frontend/src/hooks/use-model-selection.ts: +useSubmitSelectionRun (POST /runs, seed query cache on
+    success), +useSelectionRun(selectionId) (poll, refetchInterval false on terminal, enabled gate),
+    +useCancelSelectionRun (DELETE, invalidate run query). MIRROR use-batches.ts.
+  MODIFY hooks/use-model-selection.test.ts: submit posts to /model-selection/runs; poll stops on terminal;
+    cancel DELETEs /model-selection/{id}; query disabled without id (fetch not called). MIRROR use-batches.test.ts.
+
+Task 10 — Results components (under components/champion-selector/results/):
+  CREATE run-progress-panel.tsx (+test): StatusBadge + counts + per-candidate Table (mirror batch.tsx:294-411).
+  CREATE ranking-table.tsx (+test): rows from response.ranking (ModelRankEntry); winner highlighted; excluded
+    rows show exclusion_reason; row click → onSelectModel (opens drawer). Plain shadcn Table (≤10 rows).
+  CREATE winner-card.tsx (+test): winner model_type + metrics + recommendation_confidence + confidence_reasons
+    + BIAS_EXPLANATION (Slice A copy.ts). Null-safe when no winner (failed/cancelled run).
+  CREATE comparison-charts.tsx (+test): WAPE-by-model + bias-by-model bar charts (from chart_data), fold-stability
+    (backtest-folds-chart style, per-fold WAPE), winner actual-vs-predicted (multi-series-chart: actual+predicted
+    by date from chart_data.winner_actual_vs_predicted). ResizeObserver beforeAll stub in tests.
+  CREATE model-detail-drawer.tsx (+test): Sheet showing one candidate's metrics + per-fold table + error/exclusion.
+  CREATE cancel-run-dialog.tsx (+test): AlertDialog (mirror batch.tsx:324-351); confirm → useCancelSelectionRun.
+
+Task 11 — Page wiring:
+  MODIFY frontend/src/pages/visualize/champion.tsx: ENABLE the "Run comparison" CTA (gated on form validity);
+    onClick → useSubmitSelectionRun(request); on submit store selection_id; render RunProgressPanel while
+    running (useSelectionRun polling) + CancelRunDialog; on terminal render WinnerCard + RankingTable +
+    ComparisonCharts + ModelDetailDrawer; partial/all-failed/cancelled → EmptyState/ErrorDisplay with failed
+    candidates still listed. Do NOT add train/predict/promote UI (Slice C).
+```
+
+### Integration Points
+
+```yaml
+DATABASE:
+  - migration: + model_selection_candidate (FK CASCADE to model_selection_run.selection_id); + started_at +
+    {total,completed,failed,cancelled}_candidates on model_selection_run; alter status CheckConstraint (+cancelled).
+CONFIG:
+  - app/core/config.py: model_selection_global_max_parallel (4), model_selection_cancel_drain_timeout_seconds (30);
+    add to .env.example (UPPER_SNAKE) + a config test.
+ROUTES:
+  - app/features/model_selection/routes.py only (router already wired in app/main.py — no app/main.py change).
+FRONTEND:
+  - No new ROUTE/NAV (Slice A added /visualize/champion); Slice B extends the page + hooks + types only.
+OBSERVABILITY (structlog, mirror existing model_selection.* + batch.* events):
+  - model_selection.run_submitted / .candidate_started / .candidate_completed / .candidate_failed /
+    .candidate_cancelled / .run_settled / .run_cancel_requested / .run_cancel_drained.
+```
+
+## Validation Loop
+
+### Level 1 — Backend syntax & policy
+
+```bash
+uv run ruff check app/features/model_selection app/core/config.py alembic/versions
+uv run ruff format --check app/features/model_selection app/core/config.py alembic/versions
+uv run mypy app/features/model_selection app/core/config.py
+uv run pyright app/features/model_selection app/core/config.py
+uv run pytest app/core/tests/test_strict_mode_policy.py -v   # must stay green (no new strict date model)
+```
+
+### Level 2 — Backend unit tests
+
+```bash
+uv run pytest app/features/model_selection/tests -v -m "not integration"
+```
+Required new test names (additive to the backend foundation suite):
+- `test_submit_run_returns_202_before_backtests_finish` (block a mocked backtest; assert response returns first)
+- `test_submit_run_inserts_running_parent_and_pending_candidates`
+- `test_worker_settles_completed_when_all_candidates_succeed`
+- `test_worker_settles_partial_when_some_candidates_fail`
+- `test_worker_settles_failed_when_all_candidates_fail` (winner None, 200-shaped GET, status failed)
+- `test_settle_reuses_rank_candidates_and_build_chart_data` (terminal output byte-compatible with sync /run)
+- `test_runner_semaphore_caps_concurrency` / `test_runner_cancel_before_start_skips` / `test_runner_cancel_mid_flight_marks_cancelled`
+- `test_cancel_run_404_when_missing` / `test_cancel_run_409_when_terminal` / `test_cancel_run_returns_settled_on_drain`
+- `test_get_selection_attaches_live_progress_groupby` / `test_legacy_sync_run_has_no_progress_children`
+- `test_run_status_literal_accepts_cancelled`
+
+### Level 3 — Migration & integration
+
+```bash
+docker compose up -d
+uv run alembic upgrade head
+uv run pytest app/features/model_selection/tests -v -m integration
+uv run alembic downgrade -1 && uv run alembic upgrade head   # round-trips cleanly
+```
+Integration expectations: `model_selection_candidate` exists with FK CASCADE + indexes; `/runs` → poll →
+terminal with a winner; a cancel mid-flight leaves NO candidate row in `running`; failed candidate visible.
+
+### Level 4 — Full gates (must be green before PR)
+
+```bash
+uv run ruff check . && uv run ruff format --check .
+uv run mypy app/ && uv run pyright app/
+uv run pytest -v -m "not integration"
+cd frontend && pnpm tsc --noEmit && pnpm lint && pnpm test --run
+```
+> Known-local-noise: mypy/pyright report pre-existing lightgbm/xgboost optional-dep import errors in
+> forecasting/+registry/ (CI installs the extras). Do NOT "fix" them; a green LOCAL mypy can MASK errors that
+> only surface once the extras resolve types (memory: the #355 finalizer cast). Reset the DB
+> (`docker compose down -v && up -d && alembic upgrade head`) before any Level-3 integration run.
+
+### Manual dogfood probe (discover REAL ids first — IDs are NOT 1-based)
+
+```bash
+uv run uvicorn app.main:app --port 8123 &
+curl -s "http://localhost:8123/dimensions/stores?page=1&page_size=5" | python3 -m json.tool | grep '"id"'
+curl -s "http://localhost:8123/dimensions/products?page=1&page_size=5" | python3 -m json.tool | grep '"id"'
+# submit (note Location/Retry-After + immediate 202 running)
+curl -s -D - -X POST http://localhost:8123/model-selection/runs -H "Content-Type: application/json" -d '{
+  "store_id": <ID>, "product_id": <ID>,
+  "selection_window": {"start_date":"2026-01-01","end_date":"2026-05-31"},
+  "forecast_horizon": 14,
+  "split_config": {"strategy":"expanding","n_splits":5,"min_train_size":30,"gap":0,"horizon":14},
+  "candidate_models": [{"model_type":"naive","params":{}},{"model_type":"seasonal_naive","params":{"season_length":7}},
+    {"model_type":"moving_average","params":{"window_size":7}},{"model_type":"regression","params":{}},
+    {"model_type":"prophet_like","params":{}}]}' | head -40
+# poll (watch progress → terminal)
+curl -s "http://localhost:8123/model-selection/<selection_id>" | python3 -m json.tool | grep -E 'status|progress|winner'
+# cancel a fresh run mid-flight
+curl -s -o /dev/null -w "%{http_code}\n" -X DELETE "http://localhost:8123/model-selection/<selection_id>"   # 200/409
+# frontend: VITE_API_BASE_URL=http://localhost:8123; dogfood /visualize/champion over http://localhost:5173 (NOT a LAN IP).
+```
+
+## Final Validation Checklist
+
+- [ ] `POST /model-selection/runs` returns 202 + Location + Retry-After + `status="running"` BEFORE any backtest finishes.
+- [ ] Detached worker uses `get_session_maker()` (never the request `db`); a held task ref prevents GC.
+- [ ] `model_selection_candidate` rows track pending→running→{completed,failed,cancelled}; `result` JSONB on success.
+- [ ] GET attaches live `progress` (GROUP BY children) + `candidate_progress`; terminal output byte-compatible with sync `/run`.
+- [ ] `DELETE /{id}`: 404/409/200/504; no candidate row left `running` after a clean drain (integration-proven).
+- [ ] Concurrency Semaphore-capped; one AsyncSession per candidate; `global_max_parallel=1` ⇒ sequential.
+- [ ] `cancelled` added additively (ORM enum + CheckConstraint + response Literal + TS union); strict-mode test green.
+- [ ] Migration up/down round-trips on a fresh DB; FK CASCADE + indexes present.
+- [ ] Ranking/chart/business at settle REUSE `rank_candidates`/`build_chart_data`/`explain_winner` UNCHANGED.
+- [ ] Frontend CTA → submit → progress panel → ranking table + winner card + 4 charts + detail drawer; partial/
+      all-failed/cancelled states render; failed candidates stay visible; polling stops on terminal.
+- [ ] No train/predict/override/promote UI (Slice C); no new npm dependency; no Slice A contract redefinition.
+- [ ] All Level-1..4 gates pass; `gh issue view <N>` confirms the tracking issue is open; `git diff --stat`
+      shows no CRLF whole-file noise; `docker-compose.lan.yml` NOT staged.
+
+## Anti-Patterns to Avoid
+
+- ❌ Don't `await` the runner inline in the POST handler (batch's pattern) — Slice B must detach via
+  `asyncio.create_task` and return 202 first, or there is no progress/poll/cancel.
+- ❌ Don't use the request `Depends(get_db)` session in the detached worker — it's closed; open fresh ones from `get_session_maker()`.
+- ❌ Don't `asyncio.create_task` without holding a reference — the task can be GC'd mid-run.
+- ❌ Don't write per-candidate progress into one shared parent JSONB from concurrent tasks (lost-update race) — use child rows.
+- ❌ Don't import `app/features/batch/runner.py` — mirror it slice-locally (cross-slice rule).
+- ❌ Don't rewrite ranking/chart/business at settle — reuse the existing pure modules.
+- ❌ Don't pretend a mid-fit candidate cancelled when sklearn/LightGBM completed it — surface the honest outcome.
+- ❌ Don't drop partial/failed/cancelled candidates — keep them visible in `ranking` + `candidate_progress`.
+- ❌ Don't train, predict, override, or promote (Slice C). Don't add safety stock (Slice C; must not affect ranking).
+- ❌ Don't redefine Slice A's types/page/route/catalog — extend additively. Don't break the legacy sync `POST /run`.
+- ❌ Don't crypto.randomUUID() client-side; don't hardcode store_id=1/product_id=1; don't add a per-run max_parallel field (use the global setting).
+
+## Confidence Score
+
+**8.5/10** for one-pass implementation success. The async LRO pattern is fully proven in the merged `batch`
+slice on this exact runtime, the repo ships a runtime-verified `asyncio-taskgroup-cancellation.md`, every
+reused signature (backtest/ranking/chart/explain) is locked by the merged backend PRP, and every frontend
+convention (polling hook, status badge, charts, Sheet drawer, AlertDialog, test harness) is cited to live
+file:line. Residual risk (the 1.5): (a) the **fire-and-forget divergence** from batch (detached
+`create_task` + the GC ref + worker-owns-its-sessions) is the one genuinely novel mechanic — it's spelled
+out with the Python-docs citation, but it's the most likely place to slip; (b) a **process restart mid-run**
+leaves a parent stuck in `running` with no reconcile pass (accepted single-host limitation; note it in the
+PR, do not build crash-recovery here); (c) **504 drain-timeout** is hard to force deterministically in an
+integration test (an in-flight sklearn fit is uncancellable) — unit-test the timeout via a stalled drain and
+document that the integration 504 path may be probe-only.
+
+### Scoring table (packaging brainstorm)
+
+| Option | User value | Repo fit | Impl clarity | Risk control | Dep isolation | Total /25 |
+|--------|:---:|:---:|:---:|:---:|:---:|:---:|
+| **A — Fire-and-forget LRO + child table + slice-local runner (CHOSEN)** | 5 | 5 | 4 | 4 | 5 | **23** |
+| C — New runs + child table, sequential (no fan-out) | 3 | 3 | 5 | 5 | 5 | 21 |
+| B — Convert `/run` in place, JSONB-in-parent progress | 4 | 2 | 3 | 2 | 2 | 13 |
diff --git a/PRPs/forecast-champion-selector-slice-c-forecast-decision-operationalization.md b/PRPs/forecast-champion-selector-slice-c-forecast-decision-operationalization.md
new file mode 100644
index 00000000..8c46d962
--- /dev/null
+++ b/PRPs/forecast-champion-selector-slice-c-forecast-decision-operationalization.md
@@ -0,0 +1,1107 @@
+name: "Forecast Champion Selector — Slice C: Forecast Decision, Business Summary + Operationalization"
+description: |
+  Close the champion-selection workflow after comparison. Slice C adds the
+  *decision* half: accept the recommended winner OR manually override to another
+  candidate (with an explicit non-recommended warning + audit), train the chosen
+  model, generate its forecast, surface a business-readable interpretation
+  (why it won, expected demand, bias risk, a clearly-labeled safety-stock
+  heuristic, confidence caveats), and — through an explicit, approval-gated,
+  audited path — promote the trained champion to a registry alias. It ships the
+  user-guide page and an end-to-end dogfood that closes the full journey.
+
+  Slice C builds on (does NOT redefine) Slice A (selection shell + capability
+  catalog) and Slice B (async run + per-candidate progress + ranking/winner/
+  chart results). It reuses the ALREADY-MERGED `POST /{id}/train-winner` and
+  `POST /{id}/predict` endpoints verbatim and ADDS: `POST /{id}/train-selected`
+  (override), an optional forecast-decision body on predict, and
+  `POST /{id}/promote` (the future approval-gated promotion the backend
+  foundation PRP explicitly deferred).
+
+**Created:** 2026-06-01 · **Slice:** C of 3 (A → B → C)
+**Current repo base observed:** `dev` @ `6c3f8d4` (Merge PR #354 — `model_selection` backend merged); alembic head `b667d321603c`.
+**Backend foundation (source of truth):** `PRPs/forecast-champion-selector-backend.md` (issue #353, MERGED) + the live slice
+`app/features/model_selection/{models,schemas,service,routes,ranking,explanations}.py` (verified 2026-06-01).
+**Slice A (FIXED upstream):** `PRPs/forecast-champion-selector-slice-a-selection-capability.md` — owns `/visualize/champion`
+page, `hooks/use-model-selection.ts`, `types/api.ts` "Model Selection" section, `components/champion-selector/*`,
+`GET /model-selection/models` catalog (incl. `supports_auto_predict`), the `BIAS_EXPLANATION`/`RANKING_TIE_BREAK`
+copy constants. Slice C EXTENDS these.
+**Slice B (FIXED upstream):** `PRPs/forecast-champion-selector-slice-b-async-comparison-results.md` — owns `POST /runs`
+(202 async), `model_selection_candidate` child table, `DELETE /{id}` cancel, the live progress + ranking table +
+winner card + comparison charts + model-detail drawer, the `cancelled` status, `SubmitRunResponse`/`SelectionProgress`/
+`CandidateProgress`. Slice C consumes a terminal run's `winner`/`ranking`/`business_summary` and adds the decision layer
+BELOW the results. Slice C MUST NOT redefine Slice B's run/progress/cancel/results contracts.
+**Working-tree caveat:** `docker-compose.lan.yml` is an untracked local dogfood override; do NOT commit it. `uv.lock` (M) is pre-existing — do NOT stage.
+**Tracking issue:** create before implementation, suggested title
+`feat(api,db,ui): forecast champion selector slice C — forecast decision, business summary & promotion`.
+**Suggested branch:** `feat/champion-selector-slice-c` (off `dev`, per `.claude/rules/branch-naming.md`).
+**Commit scope:** `api` (override-train + predict-decision + promote endpoints, decision module, service), `db` (one
+migration: additive decision/promotion columns on `model_selection_run`), `ui` (decision components/hooks/types),
+`docs` (user-guide page). Every commit references the tracking issue.
+
+---
+
+## VALIDATE — Scope vs. backend foundation, Slice A, Slice B
+
+### Already merged (the foundation Slice C builds on — verified 2026-06-01)
+
+- **`POST /model-selection/{selection_id}/train-winner`** EXISTS (`routes.py:132`, `service.train_winner` `service.py:405`).
+  It trains `ranking.winner` ONLY (no override), writes `row.final_model_path`, returns
+  `TrainWinnerResponse{selection_id, model_type, model_path}` (`schemas.py:291`). It takes **no request body**.
+- **`POST /model-selection/{selection_id}/predict`** EXISTS (`routes.py:154`, `service.predict_winner` `service.py:442`).
+  Requires a trained model (`row.final_model_path`, else `BadRequestError`), calls
+  `ForecastingService().predict(...)`, returns `PredictWinnerResponse{selection_id, forecast: ForecastSummary}`
+  (`schemas.py:299`). It takes **no request body**.
+- **`ForecastingService().predict()` REJECTS feature-aware models** (`forecasting/service.py:491`):
+  `if bundle.model.requires_features: raise ValueError("Feature-aware models forecast through POST /scenarios/simulate …")`.
+  The reject set is `regression`, `prophet_like`, `lightgbm`, `xgboost`, `random_forest`. Slice A's catalog already
+  encodes this as `supports_auto_predict = not feature_aware`.
+- **`ForecastSummary`** (`schemas.py:258`) = `{points, total_demand, average_demand, horizon}` — has **no peak/low day**.
+- **`business_summary`** (built by `explanations.explain_winner`, `explanations.py:26`) = `{headline, winner{model_type,
+  summary}, recommendation_confidence, confidence_reasons, comparison{runner_up…}, data_notes, caveats}` — has **no
+  bias-risk wording, no safety stock, no expected-demand-from-forecast**.
+- **`ModelSelectionRun` ORM** (`models.py:43`) has `final_model_path: str|None` but **no registry `run_id` linkage, no
+  `trained_model_type`/override columns, no promotion/alias columns**.
+- **Forecasting `train_model` does NOT register a registry run** (verified `forecasting/service.py:247` — writes a joblib
+  bundle to `./artifacts/models`, returns `TrainResponse.model_path`; **no `run_id`**). Therefore promotion must itself
+  orchestrate the registry: `RegistryService.create_run` → `update_run`(→SUCCESS w/ artifact) → `create_alias`.
+- **Registry promotion mechanics** (`registry/service.py`): `create_run(db, RunCreate) -> RunResponse` (`:183`, PENDING,
+  generates `run_id`); `update_run(db, run_id, RunUpdate) -> RunResponse|None` (`:368`, state machine
+  PENDING→RUNNING→SUCCESS); `create_alias(db, AliasCreate) -> AliasResponse` (`:432`) with the **hard precondition**
+  "Only SUCCESS runs can be aliased" (`service.py:457`). `AliasCreate.alias_name` regex `^[a-z0-9][a-z0-9\-_]*$`
+  (`registry/schemas.py:224`). Artifact storage: `LocalFSProvider.save(source_path, artifact_uri) -> (sha256, size)`
+  (`registry/storage.py:169`); `compute_hash` (`:106`).
+- **Backend foundation PRP Non-Goals** (`forecast-champion-selector-backend.md:65`):
+  *"No alias auto-promotion (the selector may recommend a winner; alias mutation is a **future approval-gated PRP**)."*
+  **Slice C IS that PRP** — promotion lands here, explicitly approval-gated + audited (never auto).
+
+### Slice C's gaps to fill
+
+1. **Manual winner override** — there is no way to train a user-chosen non-winner candidate. Need `train-selected` +
+   override audit + a non-recommended warning contract.
+2. **Forecast decision enrichment** — peak/low day, a labeled safety-stock heuristic, bias-risk interpretation, and
+   expected demand are absent. Deterministic, not LLM-dependent. Safety stock must NOT influence ranking.
+3. **Capability-limited forecast state** — a feature-aware winner cannot auto-predict; today predict 400s with a raw
+   error. The UI must show an explicit blocked/unsupported state (driven by Slice A's `supports_auto_predict`).
+4. **Approval-gated, audited promotion** — no promote path exists. Need a single orchestrated, explicitly-approved,
+   recorded promotion to a registry alias (the deferred future PRP).
+5. **Decision UI + user guide + dogfood** — no decision components, no guide page, no end-to-end dogfood of the journey.
+
+---
+
+## BRAINSTORM / RERANK — Chosen packaging
+
+Three packaging alternatives (the brief's expected three), scored on user value / repo fit / implementation clarity /
+risk control / dependency isolation (each 1–5; total /25):
+
+| # | Option | User | Repo fit | Clarity | Risk | Isolation | **Total** |
+|---|--------|:----:|:--------:|:-------:|:----:|:---------:|:---------:|
+| **1** | **Extend `model_selection` with decision endpoints (`train-selected` override, optional decision body on `predict`, `POST /{id}/promote` orchestrating registry) + a pure `decision.py` + a `components/champion-selector/decision/*` UI family. Backend owns capability + audit.** | 5 | 5 | 4 | 4 | 4 | **22 ✅** |
+| 3 | Forecast output only (override/train/predict/summary/chart/table/business/safety-stock) and **defer promotion + governance** to a later PRP | 2 | 4 | 5 | 5 | 5 | 21 |
+| 2 | Reuse `/forecasting` + `/registry` endpoints **directly from the frontend**; no new `model_selection` orchestration endpoints (TS orchestrates train→register→alias) | 4 | 2 | 2 | 2 | 2 | 12 |
+
+**Chosen: Option 1.** It is the only option that delivers the brief's full operationalization (override + train +
+forecast + business interpretation + safety stock + **promotion with approval/audit** + docs + dogfood) while keeping
+capability **backend-owned** (coordination contract) and respecting the vertical-slice rule (the service already
+lazy-imports `BacktestingService`/`ForecastingService`; Slice C lazy-imports `RegistryService` the same way). It matches
+the merged slice's pattern, the governance doc's promotion-decision-record, and the existing
+`promote-confirmation-dialog.tsx` UX precedent.
+
+**Option 3 is the de-risking fallback, not a rival.** Promotion (Task set 5) is the LAST, separable task; if its registry
+artifact-registration mechanic proves heavier than budgeted, the slice can ship Option-3 scope (everything except
+`POST /{id}/promote` + the promote dialog) and a follow-up issue, still passing all gates. Its low user-value score
+reflects that it drops a *required* Slice-C deliverable. **Option 2 is rejected:** it bypasses the merged backend-owned
+`train-winner`/`predict`, pushes a fragile multi-step registry write (artifact copy + hash + alias) into TypeScript with
+no audit record, and violates "backend-owned model capability metadata is preferred over frontend hardcoding."
+
+**Non-goals (NOT built here):** re-running comparison / async progress / cancel / ranking math (Slice B); the selection
+shell / catalog / availability (Slice A); feature-aware *auto*-predict (explicitly unsupported — surfaced as a capability
+limitation, NOT faked); any agent tool / `agent_require_approval` entry (promotion is a user REST flow, not an agent
+mutation); batch model-zoo; multi-tenant/cloud anything.
+
+---
+
+## Goal
+
+**Feature Goal:** Let a user, after a champion comparison run (Slice B) finishes with a winner, **decide and operate**:
+accept the recommended model or override to another candidate (warned + audited), train it, generate and read its
+forecast (summary with peak/low, chart, daily table), understand it in business terms (why it won, expected demand,
+bias risk, a labeled safety-stock heuristic, confidence caveats), and — only on explicit approval — promote the trained
+champion to a registry alias with a recorded decision. All deterministic, no LLM.
+
+**Deliverable:**
+- **Backend (additive to the `model_selection` slice):**
+  - `POST /model-selection/{selection_id}/train-selected` — train a user-chosen candidate (override); persists
+    `trained_model_type` / `is_override` / `override_reason`; returns a `TrainWinnerResponse` + `override_warning`.
+  - `POST /model-selection/{selection_id}/predict` — KEEP existing behavior; ADD an **optional** `ForecastDecisionParams`
+    body (`lead_time_days`, `service_level`); response gains peak/low (on `ForecastSummary`) + a `decision: ForecastDecision`.
+  - `POST /model-selection/{selection_id}/promote` — approval-gated, audited orchestration: register a registry
+    `model_run`, transition it to SUCCESS with the verified artifact + winner metrics, create the alias; persist a
+    `promotion_decision` audit + `champion_run_id` + `promoted_alias`. Returns `PromoteResponse`.
+  - A pure `app/features/model_selection/decision.py` (mirrors `ranking.py`/`explanations.py`): forecast peak/low,
+    safety-stock heuristic (deterministic z-table, King formula), bias-risk text, expected demand.
+  - One Alembic migration: additive columns on `model_selection_run`.
+- **Frontend (extends the Slice A/B `/visualize/champion` page):** decision hooks
+  (`useTrainWinner`/`useTrainSelected`/`usePredictWinner`/`usePromoteChampion`), a
+  `components/champion-selector/decision/*` family (override panel, train/forecast actions with the capability-limited
+  state, forecast summary card, forecast chart, daily forecast table, business-interpretation panel, safety-stock panel,
+  promote dialog), and additive types in the Slice-A "Model Selection" section.
+- **Docs:** `docs/user-guide/champion-selector-guide.md` + a row in any guide index.
+- **Dogfood:** an end-to-end manual probe (select → run → decide → train → forecast → promote) over `localhost`.
+
+**Success Definition:**
+1. `POST /{id}/train-selected` trains a chosen candidate; an override to a non-winner returns `override_warning` and
+   persists `is_override=true` + `override_reason`; an unknown/non-candidate `model_type` → RFC 7807 400.
+2. `POST /{id}/predict` returns the forecast PLUS peak/low day and a `decision` block (safety stock, expected demand,
+   bias-risk text, caveats); the safety-stock value never feeds ranking; a feature-aware winner returns a clear 400 and
+   the UI shows a blocked/unsupported state instead of calling predict.
+3. `POST /{id}/promote` requires `approved_by` (and explicit ack for a non-recommended model), creates a SUCCESS
+   registry run + alias, and persists a `promotion_decision` audit; promoting before training → 422; a bad `alias_name`
+   → 422; promoting a non-recommended model without ack → 422.
+4. The `/visualize/champion` page, after a terminal winning run, renders the decision section: accept/override → train →
+   forecast (summary + chart + daily table) → business interpretation (incl. safety stock + bias risk) → gated promote.
+5. All Slice C validation gates pass (backend Level-1..4 incl. migration up/down + integration; frontend `tsc`/`lint`/
+   `test`); the new guide page exists; the dogfood journey completes.
+
+## Why
+
+- Comparison answers "which model is best?"; operationalization answers "now what?" — train it, see the forecast, judge
+  its business impact, and (deliberately, with a record) put it into service. Without Slice C the selector stops at a
+  ranking table and never produces a usable forecast or a promoted champion.
+- Promotion must be **explicit + audited** (governance doc + foundation PRP): the app may *recommend* a champion, but a
+  human approves and the decision is recorded. This is the controlled counterpart to the recommendation.
+- A labeled safety-stock heuristic + bias-risk wording turn raw metrics into an inventory decision a planner can act on,
+  while staying honest (heuristic, correlation-not-causation caveats, never influences ranking).
+- Keeps the single-host architecture: deterministic Python + Postgres + the existing registry; no new dependency,
+  no queue, no cloud SDK, no LLM in the decision path.
+
+## What
+
+### New / changed endpoints (all under the existing `APIRouter(prefix="/model-selection")`)
+
+```http
+POST /model-selection/{selection_id}/train-winner    # EXISTING (unchanged) — train the ranked winner
+POST /model-selection/{selection_id}/train-selected  # NEW — train a chosen candidate (override + audit)
+POST /model-selection/{selection_id}/predict         # EXISTING — ADD optional ForecastDecisionParams body + decision in response
+POST /model-selection/{selection_id}/promote         # NEW — approval-gated, audited registry promotion
+# UNCHANGED & KEPT: GET /availability, GET /models (A); POST /run, POST /runs, DELETE /{id}, GET /{id}, GET /{id}/ranking (A/B)
+```
+
+`POST /{id}/train-selected` request `TrainSelectedRequest` (strict):
+```json
+{ "model_type": "seasonal_naive", "override_reason": "domain seasonality outweighs WAPE lead" }
+```
+Response = `TrainWinnerResponse` superset: `{ selection_id, model_type, model_path, is_override, override_warning }`.
+
+`POST /{id}/predict` optional body `ForecastDecisionParams` (strict; all JSON-native → no `Field(strict=False)` needed):
+```json
+{ "lead_time_days": 7, "service_level": 0.95 }
+```
+Response `PredictWinnerResponse` (additive): `forecast: ForecastSummary` (now incl. `peak_date/peak_demand/low_date/low_demand`)
++ `decision: ForecastDecision`.
+
+`POST /{id}/promote` request `PromoteRequest` (strict):
+```json
+{ "alias_name": "champion-store5-prod8", "approved_by": "gabor", "acknowledge_non_recommended": false, "description": "Q3 champion" }
+```
+Response `PromoteResponse`: `{ selection_id, alias_name, run_id, run_status, model_type, is_override, promoted_at }`.
+
+### LOCKED Slice-C decisions
+
+1. **Override is a NEW sibling endpoint `POST /{id}/train-selected`, NOT a change to `train-winner`.** `train-winner`
+   stays byte-for-byte as merged (Slice B treats it as fixed; its tests must not break). `train-selected` validates that
+   `model_type` is one of the run's `candidate_models` AND appears as a ranking entry; trains it via the SAME
+   `ForecastingService.train_model` call `train_winner` uses; sets `final_model_path`, `trained_model_type`,
+   `is_override = (model_type != ranking.winner.model_type)`, `override_reason`. If `is_override`, the response carries
+   `override_warning` (deterministic copy naming the recommended model + the chosen model's WAPE gap). A model_type not in
+   the candidate set → `BadRequestError` (400). `train-winner` ALSO now persists `trained_model_type=winner`,
+   `is_override=False` (one tiny additive write in the existing method — its response shape is unchanged; the new columns
+   are nullable so this is back-compatible).
+2. **Predict gains an OPTIONAL decision body + an additive `decision` block.** The body is
+   `ForecastDecisionParams{lead_time_days: int = 7 (ge=1, le=365), service_level: float = 0.95 (ge=0.5, lt=1.0)}`. Declare
+   the route param so an empty body still works (`request: ForecastDecisionParams | None = Body(default=None)`; treat
+   `None` as defaults). `ForecastSummary` gains `peak_date/peak_demand/low_date/low_demand` (all `Optional`, default
+   `None` → back-compatible with Slice B's reuse of `ForecastSummary`). `PredictWinnerResponse` gains
+   `decision: ForecastDecision | None`. The existing `predict_winner` still 400s for an untrained model and for a
+   feature-aware model (the `ForecastingService.predict` `ValueError`).
+3. **Safety stock is a pure, deterministic heuristic in `decision.py`, CLEARLY LABELED, and NEVER touches ranking.**
+   `compute_forecast_decision(points, average_demand, lead_time_days, service_level) -> ForecastDecision`. Formula
+   (King 2011, demand-variability-only, constant lead time):
+   `safety_stock = z(service_level) * sigma_daily * sqrt(lead_time_days)`, `sigma_daily = stdev(daily forecast values)`,
+   `expected_demand_over_lead_time = average_demand * lead_time_days`,
+   `reorder_point = expected_demand_over_lead_time + safety_stock`. `z` from a fixed lookup (NO scipy): `0.90→1.2816,
+   0.95→1.6449, 0.975→1.9600, 0.99→2.3263`; nearest-key fallback for in-between levels (documented). Every `ForecastDecision`
+   field carries a `method="heuristic"` marker and a caveat string; the UI labels the panel "Safety stock (heuristic)".
+   `rank_candidates`/`build_chart_data` are NOT touched and never receive safety-stock inputs.
+4. **Bias-risk wording is locked and reuses Slice A's `BIAS_EXPLANATION` constant.** Wherever bias is surfaced (business
+   interpretation panel + `decision.bias_risk_text`): *"Positive bias means the model under-forecasts (risk of stockouts);
+   negative bias means it over-forecasts (risk of overstock)."* The backend `decision.py` returns the same sentence
+   (single source) plus the winner's bias sign read from `winner_metrics["bias"]`.
+5. **Feature-aware winners are a CAPABILITY LIMITATION, not a faked forecast.** The UI reads the winner's
+   `supports_auto_predict` from the Slice-A catalog (`GET /model-selection/models`); when `false` it renders a blocked
+   "Forecast not available for feature-aware models — use the What-If Planner (`/scenarios`)" state and does NOT call
+   `POST /{id}/predict`. The backend keeps `predict`'s clean 400 as a server-side guard (the `ForecastingService.predict`
+   `ValueError` message is already explicit). Do NOT add a scenarios call here (out of slice).
+6. **Promotion is approval-gated, audited, and orchestrates the registry — never auto.** `POST /{id}/promote`:
+   (a) load run; require `final_model_path` + `trained_model_type` (else 422 "train the model first");
+   (b) if `is_override` (a non-recommended model was trained) and `acknowledge_non_recommended` is `False` → 422;
+   (c) `RegistryService.create_run(db, RunCreate(model_type=trained_model_type, model_config_data=<trained params>,
+       data_window_start=row.start_date, data_window_end=row.end_date, store_id, product_id,
+       runtime_info_extras={"feature_frame_version": row.feature_frame_version}))` → PENDING `run_id`
+       — pass the **REAL persisted** `feature_frame_version` (V1 or V2) read off the run row, NEVER a hardcoded literal
+       (see LOCKED #7 for the column + run-creation persistence, and Known Gotchas for the V2 fidelity rule);
+   (d) `update_run(db, run_id, RunUpdate(status=RUNNING))`;
+   (e) register the artifact: copy the bundle at `row.final_model_path` into registry storage via the provider's
+       `save(Path(final_model_path), artifact_uri) -> (hash, size)` (see Known Gotchas — VERIFY the exact
+       artifact-registration call before coding);
+   (f) `update_run(db, run_id, RunUpdate(status=SUCCESS, metrics=row.winner_metrics, artifact_uri, artifact_hash=hash,
+       artifact_size_bytes=size))`;
+   (g) `create_alias(db, AliasCreate(alias_name=request.alias_name, run_id=run_id, description=request.description))`
+       — alias only attaches to a SUCCESS run (guaranteed by step f);
+   (h) persist on `model_selection_run`: `champion_run_id=run_id`, `promoted_alias=alias_name`, and a `promotion_decision`
+       JSONB = `{decision_id, alias, champion_run_id, approved_by, approved_at, decision:"promoted", reason,
+       trained_model_type, is_override}` (governance-doc decision-record shape).
+   `alias_name` is validated against the registry regex `^[a-z0-9][a-z0-9\-_]*$` at the schema layer (422 on violation).
+   **Compare and promote stay separate** — promote performs NO ranking/comparison; it only registers + aliases the
+   already-trained champion.
+7. **One migration, additive only (seven columns).** `model_selection_run` gains: `trained_model_type VARCHAR(40)`
+   (nullable), `is_override BOOLEAN NOT NULL DEFAULT false` (server_default `'false'`), `override_reason VARCHAR(2000)`
+   (nullable), `champion_run_id VARCHAR(32)` (nullable), `promoted_alias VARCHAR(100)` (nullable), `promotion_decision
+   JSONB` (nullable), and **`feature_frame_version INTEGER NOT NULL server_default '1'`** (M1 — V2-promotion support).
+   The `'1'` server_default backfills pre-existing rows only; it is NOT a code hardcode. **Run-creation persists the
+   real value:** Slice C ADDS `row.feature_frame_version = request.feature_frame_version` to BOTH `run_selection` (sync,
+   merged) AND `submit_run` (async, Slice B's) so every new run records what the user configured (V1 or V2); this is an
+   additive column write, not a redefinition of Slice B's run contract. No table drop, no CheckConstraint change. Chain
+   `down_revision` off the LIVE head at impl time (Slice B's migration must land first; run `uv run alembic heads`).
+   `downgrade` drops all seven columns.
+8. **WAPE stays default; tie-break unchanged; ranking math untouched.** Slice C reads `winner_metrics`/`ranking` as
+   produced by Slice A/B; it does not re-rank, re-derive confidence, or alter `ranking.py`/`explanations.py`.
+   **Coordination (ownership of "Explain Winner"):** `business_summary` is computed ONCE by the backend
+   (`explanations.explain_winner`, unchanged here). Slice B's winner-card already renders it read-only; Slice C's
+   business-interpretation-panel renders the SAME `business_summary` read-only and ADDS only the decision-layer fields
+   (bias-risk text + labeled safety stock from `decision.py`). Slice C does NOT re-derive explanation text or duplicate
+   Slice B's winner-card — it renders the decision section BELOW it.
+9. **No new strict request model carries a date/datetime/UUID/Decimal field.** `TrainSelectedRequest`,
+   `ForecastDecisionParams`, `PromoteRequest` are all `str`/`int`/`float`/`bool` only → `ConfigDict(strict=True)` with
+   NO `Field(strict=False)` needed; `app/core/tests/test_strict_mode_policy.py` stays green. `promoted_at`/`approved_at`
+   are server-set, never request fields.
+
+### Success Criteria
+
+- [ ] `POST /{id}/train-selected` trains a chosen candidate; non-candidate `model_type` → 400; override persists
+      `is_override=true` + `override_reason` and returns `override_warning`; `train-winner` still passes its existing tests.
+- [ ] `POST /{id}/predict` (with or without a body) returns `forecast` incl. `peak_date/peak_demand/low_date/low_demand`
+      and a `decision` block; safety stock is labeled heuristic; ranking output is unchanged by the decision call.
+- [ ] A feature-aware winner: `predict` returns a clean 400; the UI shows the blocked state and never calls predict.
+- [ ] `POST /{id}/promote` requires `approved_by`; non-recommended without ack → 422; before-train → 422; bad alias_name
+      → 422; on success creates a SUCCESS registry run + alias and persists `champion_run_id`/`promoted_alias`/
+      `promotion_decision`; a re-promote with the same alias_name updates the alias (registry upsert semantics).
+- [ ] Migration adds the seven columns (incl. `feature_frame_version`) and `downgrade` removes them cleanly on a fresh DB; strict-mode policy test green.
+- [ ] `decision.py` is pure (no DB/IO); its z-table + safety-stock + peak/low + bias-risk text are unit-tested deterministically.
+- [ ] `/visualize/champion` decision section renders after a terminal winning run: accept/override → train → forecast
+      (summary card + chart + daily table) → business interpretation (bias risk + labeled safety stock + caveats) →
+      gated promote dialog (alias name + approver + non-recommended ack); feature-aware → blocked forecast state.
+- [ ] `docs/user-guide/champion-selector-guide.md` exists and documents the full journey incl. the promotion-is-audited rule.
+- [ ] All backend Level-1..4 gates + frontend `pnpm tsc --noEmit && pnpm lint && pnpm test --run` pass; dogfood completes.
+
+## All Needed Context
+
+### Documentation & References
+
+```yaml
+# Slice / contract source of truth
+- file: PRPs/forecast-champion-selector-backend.md
+  why: Merged foundation. Non-Goals (:61-67) defer alias promotion to a "future approval-gated PRP" — THIS slice.
+       The /train-winner + /predict endpoint contract (:106-107). Do NOT re-derive ranking/availability.
+- file: PRPs/forecast-champion-selector-slice-a-selection-capability.md
+  why: FIXED upstream. Owns the page, hooks module, types/api.ts "Model Selection" section, champion-selector/*,
+       GET /models catalog (supports_auto_predict = not feature_aware), and the BIAS_EXPLANATION / RANKING_TIE_BREAK
+       constants in components/champion-selector/copy.ts. Slice C REUSES BIAS_EXPLANATION and the catalog flag.
+- file: PRPs/forecast-champion-selector-slice-b-async-comparison-results.md
+  why: FIXED upstream. Owns POST /runs, the child table, DELETE cancel, the results UI (winner card/ranking table/
+       charts/detail drawer) + 'cancelled' status. Slice C renders the decision section BELOW Slice B's results and
+       reuses winner/ranking/business_summary read-only. Do NOT redefine these.
+- file: PRPs/templates/prp_base.md
+  why: Base template. NOTE — "PRPs/prp-readme.md.md" does NOT exist (find PRPs -iname '*readme*' empty 2026-06-01);
+       all three prior champion PRPs record the same.
+
+# Live model_selection slice (the contract Slice C extends — verified 2026-06-01)
+- file: app/features/model_selection/service.py
+  why: train_winner (:405) + predict_winner (:442) are the methods Slice C extends/mirrors. _load (:513), _load_ranking
+       (:521), _forecast_summary (:505), _response (:526). Lazy cross-slice imports of ForecastingService inside methods
+       (:410, :444) — MIRROR that for the lazy RegistryService import in promote. train_winner builds the winner
+       ModelConfig via TypeAdapter(ModelConfig).validate_python({"model_type":…, **params}) (:417) — reuse for selected.
+- file: app/features/model_selection/schemas.py
+  why: ForecastSummary (:258) — ADD peak/low (Optional). TrainWinnerResponse (:291)/PredictWinnerResponse (:299) — ADD
+       fields. ModelType Literal (:34). ConfigDict(strict=True) on request bodies; SelectionWindow uses Field(strict=False)
+       ONLY for its dates (:64) — the new request bodies need NO strict=False (no date/uuid/decimal fields). ADD
+       TrainSelectedRequest, ForecastDecisionParams, ForecastDecision, PromoteRequest, PromoteResponse.
+- file: app/features/model_selection/models.py
+  why: ModelSelectionRun (:43) — ADD the seven columns: six decision/promotion + feature_frame_version (LOCKED #7). The status CheckConstraint
+       (:82) is NOT changed by Slice C (it is by Slice B). final_model_path (:73) is the trained-bundle path promote copies.
+- file: app/features/model_selection/routes.py
+  why: APIRouter(prefix="/model-selection") (:38); train_winner (:132) + predict_winner (:154) handlers + error mapping
+       (ValueError→BadRequestError, SQLAlchemyError→DatabaseError). ADD POST /train-selected, /promote; extend predict body.
+- file: app/features/model_selection/ranking.py
+  why: rank_candidates/build_chart_data — Slice C does NOT touch ranking. Read-only awareness only.
+- file: app/features/model_selection/explanations.py
+  why: explain_winner (:26) builds business_summary; decision.py is the SECOND pure module (mirror its style/imports).
+       Slice C does NOT change explain_winner; the bias-risk/safety-stock additions live in decision.py + the UI panel.
+- file: app/features/model_selection/tests/conftest.py
+  why: client fixture (:226 — app.dependency_overrides[get_db]=yield db_session; ASGITransport+AsyncClient) and the
+       integration db_session fixture (:191 — real engine, prefix-scoped teardown deleting ModelSelectionRun by store_id).
+- file: app/features/model_selection/tests/test_routes.py
+  why: _client() route harness (:32 — override get_db with AsyncMock; ASGITransport). MIRROR for /train-selected,
+       /predict-with-body, /promote route tests.
+- file: app/features/model_selection/tests/test_service.py
+  why: monkeypatch target for ForecastingService is the STRING "app.features.forecasting.service.ForecastingService"
+       (:176). For promote, monkeypatch "app.features.registry.service.RegistryService" the same way.
+
+# Forecasting + registry (services Slice C orchestrates via lazy import — verified 2026-06-01)
+- file: app/features/forecasting/service.py
+  why: train_model(db, store_id, product_id, train_start, train_end, config, *, feature_frame_version=1,
+       feature_groups=None) -> TrainResponse{model_path,…} (:247) — NO registry write. predict(store_id, product_id,
+       horizon, model_path) -> PredictResponse (:402); REJECTS feature-aware at :491 (ValueError). ForecastPoint has
+       {date, forecast, lower_bound, upper_bound}.
+- file: app/features/forecasting/feature_metadata.py
+  why: model_family_for(model_type) (:57) — only needed if you ever derive feature_aware backend-side; Slice C prefers
+       Slice A's catalog flag. Reject set = requires_features models (regression/lightgbm/xgboost/random_forest/prophet_like).
+- file: app/features/registry/service.py
+  why: create_run(db, RunCreate) -> RunResponse (:183, PENDING, generates run_id); update_run(db, run_id, RunUpdate)
+       -> RunResponse|None (:368, state machine); create_alias(db, AliasCreate) -> AliasResponse (:432) — "Only SUCCESS
+       runs can be aliased" (:457). These are the three calls promote() orchestrates (lazy import RegistryService()).
+- file: app/features/registry/schemas.py
+  why: RunCreate (:71 — model_type, model_config_data[alias model_config], data_window_start/end, store_id, product_id;
+       optional runtime_info_extras), RunUpdate (:116 — status/metrics/artifact_uri/artifact_hash/artifact_size_bytes),
+       AliasCreate (:219 — alias_name regex ^[a-z0-9][a-z0-9\-_]*$, run_id, description), RunStatus (:30), RunResponse
+       (:129), AliasResponse (:229).
+- file: app/features/registry/storage.py
+  why: LocalFSProvider.save(source_path: Path, artifact_uri: str) -> (sha256, size) (:169); compute_hash (:106);
+       load (:201). The artifact-registration step in promote() (LOCKED #6e) uses this — VERIFY the exact call/URI
+       convention against how ops/demo register artifacts before coding (see Known Gotchas).
+- file: app/core/config.py
+  why: forecast_model_artifacts_dir = "./artifacts/models" (:100); registry_artifact_root = "./artifacts/registry" (:112).
+       The trained bundle lives under forecast_model_artifacts_dir; promote copies it into the registry root.
+- file: app/core/exceptions.py
+  why: BadRequestError(400, :152), NotFoundError(404, :64), ConflictError(409, :130), UnprocessableEntityError(422, :174),
+       DatabaseError(500, :108). Use UnprocessableEntityError for "train first" / "ack required" / bad-alias states; the
+       schema regex already 422s a bad alias_name at validation.
+
+# Frontend examples to MIRROR (verified 2026-06-01)
+- file: frontend/src/components/forecast-intelligence/promote-confirmation-dialog.tsx
+  why: THE gated-promotion UX (props open/onOpenChange/run/currentChampion/defaultAliasName/onConfirm(aliasName)/
+       isPromoting; alias-name input; verify-artifact gate; worse-WAPE + version-mismatch checkbox acknowledgements).
+       MIRROR its structure for promote-champion-dialog.tsx (alias name + approver + non-recommended ack), but call the
+       NEW usePromoteChampion hook (POST /model-selection/{id}/promote), not useCreateAlias.
+- file: frontend/src/components/forecast-intelligence/champion-compatibility-badge.tsx
+  why: Compatibility signalling (Comparable/Not comparable badge from grain+window+feature-frame). Use read-only in the
+       promote dialog if showing champion-vs-current context; do NOT make promote perform the comparison (keep separate).
+- file: frontend/src/pages/visualize/forecast.tsx
+  why: Forecast rendering pattern — TimeSeriesChart usage (:448, predictedKey="forecast", showInterval + lower/upper_bound)
+       and CSV export. NOTE: there is NO daily-table pattern here (it CSV-exports) — Slice C BUILDS the daily table.
+- file: frontend/src/components/charts/time-series-chart.tsx
+  why: The forecast curve chart (ComposedChart; actual/predicted lines + optional interval band). Props data + predictedKey
+       + lowerKey/upperKey + showInterval. ResizeObserver beforeAll stub needed in jsdom tests.
+- file: frontend/src/components/charts/kpi-card.tsx
+  why: KPI metric tile — for the forecast summary card (total demand / average / peak day / low day / horizon).
+- file: frontend/src/components/data-table/data-table.tsx  AND  frontend/src/components/ui/table.tsx
+  why: The daily forecast table — a plain shadcn Table (date, forecast, lower, upper) is sufficient; DataTable only if
+       sortable columns are wanted. Mirror the batch.tsx plain-Table usage from Slice B.
+- file: frontend/src/pages/explorer/run-compare.tsx
+  why: Champion-vs-challenger side-by-side + DeltaCell pattern — reference for any compatibility/delta display in the
+       promote dialog (read-only context only; promote ≠ compare).
+- file: frontend/src/hooks/use-runs.ts
+  why: useCreateAlias (:136 — POST /registry/aliases) + useVerifyArtifact patterns. Slice C does NOT reuse these for
+       promotion (promotion is a single model_selection endpoint) but mirrors their useMutation + invalidate shape.
+- file: frontend/src/hooks/use-model-selection.ts
+  why: Slice A/B module. Slice C ADDS useTrainWinner/useTrainSelected/usePredictWinner/usePromoteChampion (useMutation,
+       invalidate the run query so Slice B's poll/GET reflects the new final_model_path/forecast/promotion). Do NOT
+       redefine Slice A/B hooks.
+- file: frontend/src/lib/api.ts
+  why: api<T>(endpoint,{method,body,params}) (:23); 202 (:79) / 204 (:44) handling; getErrorMessage (:95). POST bodies
+       are JSON; promote/train/predict are plain POSTs returning JSON 200.
+- file: frontend/src/types/api.ts
+  why: ModelFamily union (:177), ForecastPoint (:102 — date/forecast/lower_bound/upper_bound), Alias (:276),
+       RunCompareResponse (:286). ADD (additive, Model Selection section) TrainSelectedRequest, ForecastDecisionParams,
+       ForecastDecision, PromoteRequest, PromoteResponse; EXTEND ForecastSummary (peak/low) + the train/predict response types.
+- file: frontend/src/lib/constants.ts
+  why: ROUTES.VISUALIZE.CHAMPION + the Visualize NAV entry are added by Slice A — Slice C adds NO route/nav.
+- file: frontend/vitest.config.ts
+  why: jsdom; include src/**/*.test.{ts,tsx}; @→./src. Chart tests need a ResizeObserver beforeAll stub.
+
+# Governance / external docs (with reasoning)
+- file: docs/optional-features/09-model-champion-challenger-governance.md
+  why: The promotion-decision-record shape (decision_id, alias, champion_run_id, challenger_run_id, gate_results,
+       approved_by, approved_at, decision, reason) + the "require approval and record the decision" rule. Slice C's
+       promotion_decision JSONB mirrors this (challenger_run_id/gate_results omitted in this slice — compare is separate).
+- file: docs/user-guide/  (advanced-forecasting-guide.md, agents-and-rag-guide.md, dashboard-guide.md, feature-reference.md,
+        getting-started.md, showcase-manual-demo-guide.md, showcase-walkthrough.md)
+  why: Naming convention `{feature}-guide.md`. ADD champion-selector-guide.md; cross-link from feature-reference.md.
+- url: https://www.mlflow.org/docs/latest/ml/model-registry/workflow/
+  why: Alias/champion registry workflow — confirms the "register a versioned model, then move a named alias to it"
+       pattern Slice C's promote() implements (create_run → success → create_alias). Aliases are mutable pointers; the
+       run/version is immutable.
+- url: https://web.mit.edu/course/2/2.810/www/files/readings/King_SafetyStock.pdf
+  why: Safety-stock formula reference. Slice C uses the demand-variability-only form SS = z·σ_D·√L (constant lead time);
+       the doc's z-from-service-level table grounds the z lookup in decision.py. Cite as the heuristic's source in the UI.
+- url: https://otexts.com/fpp2/accuracy.html
+  why: Forecast-accuracy metric definitions (WAPE/MAE/bias) — so the business-interpretation copy describes each metric
+       correctly and the bias under/over-forecast wording stays accurate.
+- url: https://cloud.google.com/vertex-ai/docs/evaluation/introduction
+  why: Model-evaluation framing (a recommended model is a recommendation, not an automatic deployment) — supports the
+       explicit-approval gate on promotion.
+- url: https://fastapi.tiangolo.com/tutorial/bigger-applications/#apirouter
+  why: APIRouter route registration — the new /train-selected + /promote handlers follow the slice's existing pattern.
+```
+
+### Current Codebase Tree (relevant)
+
+```bash
+app/features/model_selection/        # MERGED (issue #353) — train-winner + predict already present
+├── models.py        # ModelSelectionRun                 ← ADD trained_model_type/is_override/override_reason/champion_run_id/promoted_alias/promotion_decision
+├── schemas.py       # request/response contract          ← ADD TrainSelectedRequest, ForecastDecisionParams, ForecastDecision, PromoteRequest, PromoteResponse; EXTEND ForecastSummary + train/predict responses
+├── service.py       # train_winner/predict_winner present ← ADD train_selected, promote; EXTEND predict_winner (decision); persist trained_model_type in train_winner
+├── ranking.py       # rank_candidates / build_chart_data  ← UNCHANGED
+├── explanations.py  # explain_winner                      ← UNCHANGED (decision.py is the new pure module)
+├── routes.py        # APIRouter(/model-selection)         ← ADD POST /train-selected, POST /promote; extend POST /predict body
+└── tests/           # conftest + unit + integration       ← ADD test_decision; extend test_routes/test_service/test_models/test_routes_integration
+app/features/forecasting/service.py  # train_model / predict (feature-aware reject)   — orchestrated, not changed
+app/features/registry/{service,schemas,storage}.py  # create_run/update_run/create_alias + LocalFSProvider.save — orchestrated, not changed
+app/core/{config,exceptions}.py
+alembic/versions/                     # head b667d321603c today; Slice B adds one; chain Slice C off the live head at impl time
+frontend/src/
+├── pages/visualize/champion.tsx      # Slice A/B page          ← ADD the decision section below Slice B's results
+├── hooks/use-model-selection.ts      # Slice A/B hooks          ← ADD useTrainWinner/useTrainSelected/usePredictWinner/usePromoteChampion
+├── types/api.ts                      # Model Selection section  ← ADD decision/promote types; EXTEND ForecastSummary
+├── components/champion-selector/     # Slice A/B components      ← ADD decision/ subfamily
+├── components/charts/{time-series-chart,kpi-card}.tsx
+├── components/ui/{table,dialog,alert-dialog,input,select,checkbox,card,badge}.tsx
+└── components/forecast-intelligence/{promote-confirmation-dialog,champion-compatibility-badge}.tsx  # promotion-UX precedents
+docs/user-guide/                      # ADD champion-selector-guide.md
+```
+
+### Desired Codebase Tree (Slice C additions)
+
+```bash
+# Backend
+app/features/model_selection/decision.py                       # NEW: pure forecast-decision (peak/low, z-table, safety stock, bias-risk text)
+app/features/model_selection/models.py                         # MOD: + 6 nullable decision/promotion columns
+app/features/model_selection/schemas.py                        # MOD: + TrainSelectedRequest, ForecastDecisionParams, ForecastDecision, PromoteRequest, PromoteResponse; EXTEND ForecastSummary + TrainWinnerResponse + PredictWinnerResponse
+app/features/model_selection/service.py                        # MOD: + train_selected, promote; EXTEND predict_winner; train_winner persists trained_model_type
+app/features/model_selection/routes.py                         # MOD: + POST /train-selected, POST /promote; predict gains optional body
+alembic/versions/<rev>_add_model_selection_decision_promotion.py  # NEW migration (additive columns)
+app/features/model_selection/tests/test_decision.py            # NEW: pure decision unit tests (z-table, safety stock, peak/low, bias text)
+app/features/model_selection/tests/test_routes.py              # MOD: + train-selected, predict-with-body, promote route tests
+app/features/model_selection/tests/test_service.py             # MOD: + train_selected/promote/predict-decision unit (mock Forecasting + Registry services)
+app/features/model_selection/tests/test_models.py              # MOD: + new columns CRUD/default
+app/features/model_selection/tests/test_schemas.py             # MOD: + new request/response schema cases (alias regex 422, defaults)
+app/features/model_selection/tests/test_routes_integration.py  # MOD: + train-selected → predict → promote integration (real registry run + alias)
+
+# Frontend (extends Slice A/B — no new route/nav)
+frontend/src/types/api.ts                                      # MOD: + decision/promote types; EXTEND ForecastSummary
+frontend/src/hooks/use-model-selection.ts                      # MOD: + useTrainWinner/useTrainSelected/usePredictWinner/usePromoteChampion
+frontend/src/hooks/use-model-selection.test.ts                 # MOD: + train/predict/promote hook tests
+frontend/src/pages/visualize/champion.tsx                      # MOD: render decision section after a terminal winning run
+frontend/src/components/champion-selector/decision/winner-decision-panel.tsx       # NEW (+test): accept winner OR override (candidate select + non-recommended warning AlertDialog)
+frontend/src/components/champion-selector/decision/train-forecast-actions.tsx      # NEW (+test): train + forecast buttons; capability-limited (feature-aware) blocked state
+frontend/src/components/champion-selector/decision/forecast-summary-card.tsx       # NEW (+test): total/avg/peak/low/horizon KPI tiles
+frontend/src/components/champion-selector/decision/forecast-chart.tsx              # NEW (+test): TimeSeriesChart wrapper
+frontend/src/components/champion-selector/decision/daily-forecast-table.tsx        # NEW (+test): shadcn Table (date, forecast, lower, upper)
+frontend/src/components/champion-selector/decision/business-interpretation-panel.tsx # NEW (+test): why-won + expected demand + bias risk (BIAS_EXPLANATION) + caveats
+frontend/src/components/champion-selector/decision/safety-stock-panel.tsx          # NEW (+test): lead_time/service_level inputs → safety stock (labeled heuristic)
+frontend/src/components/champion-selector/decision/promote-champion-dialog.tsx     # NEW (+test): alias name + approver + non-recommended ack (mirror promote-confirmation-dialog.tsx)
+
+# Docs
+docs/user-guide/champion-selector-guide.md                     # NEW: full journey + promotion-is-audited rule
+docs/user-guide/feature-reference.md                           # MOD: cross-link the new guide (if it carries an index)
+```
+
+### Known Gotchas & VERIFIED Contracts
+
+```python
+# ── train-winner IS ALREADY PRESENT — DO NOT REWRITE IT ────────────────────────
+# service.train_winner (service.py:405) trains ranking.winner and its tests exist. Slice C ADDS train_selected as a
+# SIBLING and makes ONE additive write inside train_winner: row.trained_model_type = ranking.winner.model_type;
+# row.is_override = False. The TrainWinnerResponse shape is UNCHANGED (new fields go on TrainSelectedResponse-superset,
+# or set defaults on the shared response model — keep train-winner's response back-compatible).
+
+# ── OVERRIDE VALIDATION ────────────────────────────────────────────────────────
+# train_selected must reject a model_type not in the run's candidate set. The candidates live on the row:
+# row.candidate_models (JSONB list of {model_type, params}). Validate against THAT set — {c["model_type"] for c in
+#   row.candidate_models} — NOT only the included/ranked entries: a candidate that FAILED its backtest is still
+#   override-trainable (training ≠ backtesting), so it must remain selectable. A model never offered as a candidate → 400.
+# Build the ModelConfig the SAME way train_winner does:
+#   TypeAdapter(ModelConfig).validate_python({"model_type": mt, **params})  (lazy import ModelConfig).
+# is_override = (mt != ranking.winner.model_type). The override_warning text names the recommended model + the WAPE gap
+# read from ranking entries (deterministic; no LLM). NOTE: if the chosen candidate failed backtesting it has no ranked
+# metrics — the warning then states the model was not successfully evaluated rather than quoting a WAPE gap.
+
+# ── PREDICT OPTIONAL BODY (FastAPI) ────────────────────────────────────────────
+# predict currently takes NO body. To stay backward-compatible, declare:
+#   request: ForecastDecisionParams | None = Body(default=None)
+# and treat None as ForecastDecisionParams() defaults. A single Pydantic-model param without Body(default=...) is a
+# REQUIRED body in FastAPI — that would break empty-body callers. VERIFY the empty-body path in a route test
+# (POST with no body returns 200 + decision computed from defaults).
+# RETURN CONTRACT: predict_winner now returns tuple[ForecastSummary, ForecastDecision | None]; the ROUTE (not the
+#   service) builds PredictWinnerResponse(selection_id, forecast, decision). Do NOT have the service return the
+#   response model — keep it a pure (forecast, decision) tuple so the existing happy-path service tests stay simple and
+#   the route owns the HTTP shape (mirrors the merged routes.py:168 which already builds the response in the route).
+
+# ── ForecastSummary EXTENSION IS REUSED BY SLICE A/B — KEEP IT ADDITIVE ─────────
+# ForecastSummary is serialized by the sync /run auto_predict path AND Slice B. ADD peak_date/peak_demand/low_date/
+# low_demand as Optional (default None) so old JSONB snapshots still validate (forecast_result reload at service.py:535).
+
+# ── SAFETY STOCK MUST NOT TOUCH RANKING (LOCKED #3) ────────────────────────────
+# decision.py is called only by predict_winner (and the UI). rank_candidates / build_chart_data NEVER receive
+# safety-stock inputs. z-table is a fixed dict (NO scipy): {0.90:1.2816, 0.95:1.6449, 0.975:1.9600, 0.99:2.3263}.
+# sigma_daily = statistics.pstdev([p["forecast"] for p in points]) (population stdev; 0.0 for a flat/1-point forecast →
+# safety_stock 0.0 — that is honest). Verify the z math with:
+#   uv run python -c "import statistics as s; pts=[10,12,8,11,9]; z=1.6449; ss=z*s.pstdev(pts)*(7**0.5); print(round(ss,3))"
+# Label every decision field method='heuristic' + a caveat; the UI panel header says 'Safety stock (heuristic)'.
+
+# ── PROMOTION ARTIFACT REGISTRATION IS THE #1 RISK — VERIFY BEFORE CODING ───────
+# Forecasting train writes a joblib to row.final_model_path under ./artifacts/models (NOT registry storage). To make
+# the promoted run's artifact verifiable, promote() must register the artifact into registry storage. There is NO
+# RegistryService.register_artifact wrapper (verified: artifact_uri is set via PATCH; storage.save returns (hash,size)).
+# BEFORE coding promote, grep how existing code registers an artifact + names artifact_uri:
+#   grep -rn "\.save(" app/features/registry app/features/demo app/features/ops scripts | grep -i artifact
+#   grep -rn "artifact_uri=" app/features --include=*.py | grep -v test
+# Then in promote(): construct artifact_uri per that convention, call the provider's save(Path(final_model_path),
+# artifact_uri) -> (hash, size), then update_run(SUCCESS, artifact_uri, artifact_hash=hash, artifact_size_bytes=size).
+# FALLBACK (documented, Option-3 boundary): if artifact registration proves out of budget, ship train/predict/decision
+# WITHOUT promote (a follow-up issue) rather than registering an unverifiable artifact — promotion is the LAST task.
+
+# ── REGISTRY STATE MACHINE ─────────────────────────────────────────────────────
+# create_run → PENDING (run_id = uuid hex). update_run(status=RUNNING) THEN update_run(status=SUCCESS, …). create_alias
+# requires SUCCESS (registry/service.py:457 raises ValueError → map to BadRequestError/422). Do all promote DB work in
+# the REQUEST db session (one transaction); RegistryService takes the same db. Lazy-import RegistryService inside
+# promote() (mirror the ForecastingService lazy import at service.py:410) to avoid an alembic cold-boot import cycle.
+# VERIFIED: create_run/update_run/create_alias each `await db.flush()` (NOT commit) — registry/service.py:260,419,495 —
+#   so the whole promote orchestration is ONE atomic request transaction: any step raising rolls the lot back (no
+#   half-promoted run). Pass the trained params via the field name `model_config_data=` (RunCreate aliases it to
+#   `model_config` with populate_by_name=True, registry/schemas.py:74,77) — do NOT use the `model_config=` alias kwarg,
+#   it shadows Pydantic's own ConfigDict attribute name and reads as a bug.
+
+# ── FEATURE-FRAME-VERSION PERSISTENCE → V2 PROMOTION (LOCKED #7) ───────────────
+# Slice C SUPPORTS V2 promotion by PERSISTING the run's feature_frame_version and carrying it end-to-end — NO hardcoded
+# `1` in code (the only `1` is the column's server_default for legacy rows, and a fallback-error case in tests).
+# WHY a column is required: feature_frame_version is a ModelSelectionRunRequest field consumed at run-creation, but it
+#   is NOT available at train/promote time unless persisted (the merged ORM never stored it). To train the winner as the
+#   user configured (V1 or V2) AND record the true version on the registry run, the value must live on the row.
+# WIRING (all additive, Slice C owns service.py):
+#   1. Migration adds `feature_frame_version INTEGER NOT NULL server_default '1'` to model_selection_run (LOCKED #7).
+#      server_default '1' backfills pre-existing rows ONLY; new rows always carry the real request value.
+#   2. Run-creation writes the real value: ADD `row.feature_frame_version = request.feature_frame_version` to BOTH
+#      run_selection (sync, merged) AND submit_run (async, Slice B's) — both live in service.py which Slice C edits.
+#      This is additive (a new column write), not a redefinition of Slice B's contract.
+#   3. train_winner / train_selected pass `feature_frame_version=row.feature_frame_version` to
+#      ForecastingService.train_model (the merged auto-train path already threads it — mirror that). feature_groups stays
+#      None → forecasting's DEFAULT_V2_GROUPS (the champion-selector UI never exposes per-group selection; a custom-group
+#      V2 run via raw curl would train on default groups — documented limitation, future PRP may persist feature_groups).
+#   4. promote passes `runtime_info_extras={"feature_frame_version": row.feature_frame_version}` (the REAL value).
+# This is load-bearing: the registry's PRP-36 comparable-run / stale-alias logic keys on feature_frame_version
+#   (docs/_base/DOMAIN_MODEL.md; memory feature-frame-version-clamp-1-2) — a wrong value silently corrupts comparability.
+# TEST the REAL propagation: a V2 run → promote records 2 (test_promote_carries_real_feature_frame_version_v2); a
+#   legacy/unset row → the server_default 1 (test_promote_defaults_feature_frame_version_1_for_legacy_run, the ONLY place
+#   the literal 1 appears, as a fallback case).
+
+# ── MIGRATION (LOCKED #7) ──────────────────────────────────────────────────────
+# uv run alembic heads   # chain down_revision off the LIVE head (Slice B's migration must land first).
+# All seven columns are ADDITIVE (is_override + feature_frame_version are NOT NULL with server_defaults 'false'/'1';
+# the rest nullable). No CheckConstraint change.
+# downgrade() drops the seven columns. JSONB import in migration: from sqlalchemy.dialects import postgresql ->
+# postgresql.JSONB(astext_type=sa.Text()).
+
+# ── STRICT-MODE POLICY (LOCKED #9) ─────────────────────────────────────────────
+# TrainSelectedRequest/ForecastDecisionParams/PromoteRequest are ConfigDict(strict=True) with ONLY str/int/float/bool
+# fields → NO Field(strict=False) needed. app/core/tests/test_strict_mode_policy.py stays green. Add a request-body
+# test that exercises Model.model_validate({...}) (the validate_python path) per the security policy.
+
+# ── NO AGENT SURFACE ───────────────────────────────────────────────────────────
+# Promotion is a USER REST flow (approved_by in the body), NOT an agent tool. Do NOT add an agent tool or an entry to
+# agent_require_approval. (Widening the agent mutation surface is out of scope and would require that list update.)
+```
+
+```typescript
+// ── FRONTEND ────────────────────────────────────────────────────────────────
+// Slice C EXTENDS the Slice A/B champion page — it adds NO route/nav. The decision section renders only when a Slice B
+// run is terminal (completed|partial) AND response.winner is non-null. Reuse Slice B's useSelectionRun(selectionId).
+// HOOKS (mirror use-batches.ts / use-runs.ts useMutation shape): useTrainWinner / useTrainSelected / usePredictWinner /
+//   usePromoteChampion all POST to /model-selection/{id}/... and on success invalidate ['model-selection','run',id] so
+//   Slice B's GET reflects the new final_model_path / forecast / promotion. Do NOT redefine Slice A/B hooks.
+// CAPABILITY LIMIT (LOCKED #5): read the winner's supports_auto_predict from useModelCatalog() (Slice A). If false,
+//   render the blocked forecast state ("Forecast not available for feature-aware models — use the What-If Planner") and
+//   DO NOT call usePredictWinner. The Train + Promote actions still work for feature-aware winners.
+// OVERRIDE WARNING: when the user picks a candidate != winner, confirm via AlertDialog before train-selected; carry the
+//   override_reason. Reuse BIAS_EXPLANATION from components/champion-selector/copy.ts (Slice A) for bias wording.
+// PROMOTE DIALOG: mirror forecast-intelligence/promote-confirmation-dialog.tsx — alias-name input (regex
+//   ^[a-z0-9][a-z0-9\-_]*$), approver field (required), a "promote a non-recommended model" checkbox shown only when
+//   is_override; confirm → usePromoteChampion. Promote performs NO comparison (compare is separate).
+// CHARTS need a ResizeObserver beforeAll stub in jsdom (backtest-horizon-buckets-chart.test.tsx pattern); pass chart
+//   height via inline style (Tailwind JIT drops dynamic h-[Npx]).
+// react-refresh/only-export-components: keep any non-component constants in a .ts file (reuse Slice A copy.ts or a
+//   decision/constants.ts), not exported from a .tsx component.
+// IDs are NOT 1-based (memory: seeder-does-not-reset-id-sequences); selection_id is backend-owned — never
+//   crypto.randomUUID() client-side (memory: showcase-crypto-randomuuid-lan-crash). Dogfood over http://localhost:5173.
+// Mixed CRLF/LF repo-wide (memory: repo-line-endings-crlf) — git diff --stat before committing; new files LF.
+```
+
+## Implementation Blueprint
+
+### Backend data models
+
+`app/features/model_selection/models.py` — additive columns on `ModelSelectionRun`:
+
+```python
+trained_model_type: Mapped[str | None] = mapped_column(String(40), nullable=True)
+is_override: Mapped[bool] = mapped_column(Boolean, default=False, server_default="false", nullable=False)
+override_reason: Mapped[str | None] = mapped_column(String(2000), nullable=True)
+champion_run_id: Mapped[str | None] = mapped_column(String(32), nullable=True)        # registry model_run.run_id
+promoted_alias: Mapped[str | None] = mapped_column(String(100), nullable=True)
+promotion_decision: Mapped[dict[str, Any] | None] = mapped_column(JSONB, nullable=True)  # audit record
+feature_frame_version: Mapped[int] = mapped_column(                                   # M1 — V2 promotion support
+    Integer, default=1, server_default="1", nullable=False
+)  # set from request at run-creation (run_selection + submit_run); promote passes the REAL value to the registry
+```
+
+`app/features/model_selection/schemas.py` — additive models:
+
+```python
+class TrainSelectedRequest(BaseModel):
+    model_config = ConfigDict(strict=True)
+    model_type: ModelType
+    override_reason: str | None = Field(default=None, max_length=2000)
+
+# EXTEND TrainWinnerResponse additively (defaults keep train-winner back-compatible):
+#   is_override: bool = False
+#   override_warning: str | None = None
+
+class ForecastDecisionParams(BaseModel):
+    model_config = ConfigDict(strict=True)
+    lead_time_days: int = Field(default=7, ge=1, le=365)
+    service_level: float = Field(default=0.95, ge=0.5, lt=1.0)
+
+class ForecastDecision(BaseModel):                  # plain BaseModel (response)
+    method: Literal["heuristic"] = "heuristic"
+    lead_time_days: int
+    service_level: float
+    z_value: float
+    sigma_daily_demand: float
+    expected_demand_over_lead_time: float
+    safety_stock: float
+    reorder_point: float
+    bias_risk_text: str                              # reuses BIAS_EXPLANATION + the winner's bias sign
+    caveats: list[str]
+
+# EXTEND ForecastSummary additively:
+#   peak_date: date | None = None ; peak_demand: float | None = None
+#   low_date: date | None = None  ; low_demand: float | None = None
+# EXTEND PredictWinnerResponse additively:
+#   decision: ForecastDecision | None = None
+
+class PromoteRequest(BaseModel):
+    model_config = ConfigDict(strict=True)
+    alias_name: str = Field(..., min_length=1, max_length=100, pattern=r"^[a-z0-9][a-z0-9\-_]*$")
+    approved_by: str = Field(..., min_length=1, max_length=100)
+    acknowledge_non_recommended: bool = False
+    description: str | None = Field(default=None, max_length=500)
+
+class PromoteResponse(BaseModel):                    # plain BaseModel (response)
+    selection_id: str
+    alias_name: str
+    run_id: str
+    run_status: str
+    model_type: str
+    is_override: bool
+    promoted_at: datetime
+```
+
+`app/features/model_selection/decision.py` (pure — mirror `explanations.py`):
+
+```python
+# from app.features.model_selection.copy or a local constant: the locked bias sentence (single source).
+_Z_TABLE = {0.90: 1.2816, 0.95: 1.6449, 0.975: 1.9600, 0.99: 2.3263}  # one-sided service-level z (no scipy)
+
+def z_for_service_level(service_level: float) -> float:
+    # exact key, else nearest key (documented heuristic)
+    ...
+
+def compute_forecast_decision(points: list[dict], average_demand: float, lead_time_days: int,
+                              service_level: float, winner_bias: float | None) -> ForecastDecision:
+    import statistics
+    values = [float(p["forecast"]) for p in points]
+    sigma = statistics.pstdev(values) if len(values) > 1 else 0.0
+    z = z_for_service_level(service_level)
+    safety_stock = z * sigma * (lead_time_days ** 0.5)
+    expected_lt = average_demand * lead_time_days
+    bias_dir = "under-forecasts (risk of stockouts)" if (winner_bias or 0) > 0 else \
+               "over-forecasts (risk of overstock)" if (winner_bias or 0) < 0 else "is roughly unbiased"
+    return ForecastDecision(lead_time_days=lead_time_days, service_level=service_level, z_value=z,
+        sigma_daily_demand=sigma, expected_demand_over_lead_time=expected_lt,
+        safety_stock=safety_stock, reorder_point=expected_lt + safety_stock,
+        bias_risk_text=f"{BIAS_EXPLANATION} For this winner, bias {winner_bias:.2f} indicates it {bias_dir}.",
+        caveats=["Safety stock is a deterministic heuristic (demand variability only; constant lead time).",
+                 "Not a substitute for a full inventory-optimisation model."])
+
+def forecast_peak_low(points: list[dict]) -> tuple[date|None, float|None, date|None, float|None]:
+    # max/min over points by 'forecast'; None on empty.
+    ...
+```
+
+### Backend service (`app/features/model_selection/service.py`)
+
+```python
+async def train_selected(self, db, selection_id, model_type, override_reason) -> TrainWinnerResponse:
+    # _load row; _load_ranking.
+    # ELIGIBILITY (LOCKED #1): model_type must be one of the run's CONFIGURED candidates —
+    #   {c["model_type"] for c in row.candidate_models} — else BadRequestError(400). A candidate that FAILED its
+    #   backtest is STILL override-trainable (training is independent of backtesting), so validate against
+    #   candidate_models, NOT only the ranked/included entries. (A model never offered as a candidate → 400.)
+    # build cfg = TypeAdapter(ModelConfig).validate_python({"model_type": model_type, **params_for(model_type)});
+    # train = ForecastingService().train_model(db, store, product, start, end, cfg,
+    #             feature_frame_version=row.feature_frame_version)   # M1 — train as the run was configured (V1/V2)
+    # row.final_model_path = train.model_path; row.trained_model_type = model_type
+    # row.is_override = (model_type != ranking.winner.model_type if ranking.winner else True)
+    # row.override_reason = override_reason; await db.flush()
+    # override_warning = deterministic copy when is_override (names recommended model + WAPE gap), else None
+    # return TrainWinnerResponse(..., is_override=row.is_override, override_warning=warning)
+    # NOTE: train_winner (the merged sibling) likewise threads feature_frame_version=row.feature_frame_version when
+    #   Slice C adds its `row.trained_model_type = winner; row.is_override = False` write (keep its response shape).
+
+# EXTEND predict_winner — PIN THE RETURN CONTRACT.
+#   Live signature today: `predict_winner(db, selection_id) -> ForecastSummary` (service.py:442); the ROUTE builds
+#   `PredictWinnerResponse(selection_id, forecast)` (routes.py:168). Slice C must surface `decision` too, so CHANGE the
+#   service return type to a TUPLE:
+#     async def predict_winner(self, db, selection_id, lead_time_days: int, service_level: float)
+#         -> tuple[ForecastSummary, ForecastDecision | None]
+#   Body: build the ForecastSummary as today; set peak/low via decision.forecast_peak_low; compute
+#   decision = decision.compute_forecast_decision(points, average_demand, lead_time_days, service_level,
+#   winner_bias=row.winner_metrics.get('bias')); persist forecast_result (incl. peak/low) on the row; RETURN
+#   (forecast, decision). The ROUTE (not the service) assembles PredictWinnerResponse(selection_id=…, forecast=…,
+#   decision=…) — see the route blueprint below. The merged train-winner→predict happy-path tests assert only on
+#   `forecast`, so they keep passing; the new `decision` field is additive (PredictWinnerResponse.decision defaults None).
+
+async def promote(self, db, selection_id, req: PromoteRequest) -> PromoteResponse:
+    from app.features.registry.schemas import RunCreate, RunUpdate, AliasCreate, RunStatus  # lazy
+    from app.features.registry.service import RegistryService                                # lazy
+    row = await self._load(db, selection_id)                       # 404
+    if not row.final_model_path or not row.trained_model_type:
+        raise UnprocessableEntityError(message="Train the model before promoting.")
+    if row.is_override and not req.acknowledge_non_recommended:
+        raise UnprocessableEntityError(message="Promoting a non-recommended model requires acknowledge_non_recommended=true.")
+    registry = RegistryService()
+    params = self._params_for_trained(row)                         # from candidate_models / winner_metrics
+    run = await registry.create_run(db, RunCreate(model_type=row.trained_model_type, model_config_data=params,
+            data_window_start=row.start_date, data_window_end=row.end_date, store_id=row.store_id,
+            product_id=row.product_id,
+            runtime_info_extras={"feature_frame_version": row.feature_frame_version}))  # REAL persisted version (LOCKED #7)
+    await registry.update_run(db, run.run_id, RunUpdate(status=RunStatus.RUNNING))
+    artifact_uri, ahash, asize = self._register_artifact(row.final_model_path, run.run_id)   # VERIFY mechanics (Gotchas)
+    await registry.update_run(db, run.run_id, RunUpdate(status=RunStatus.SUCCESS, metrics=row.winner_metrics,
+            artifact_uri=artifact_uri, artifact_hash=ahash, artifact_size_bytes=asize))
+    alias = await registry.create_alias(db, AliasCreate(alias_name=req.alias_name, run_id=run.run_id,
+            description=req.description))
+    promoted_at = datetime.now(UTC)
+    row.champion_run_id = run.run_id; row.promoted_alias = alias.alias_name
+    row.promotion_decision = {"decision_id": uuid.uuid4().hex, "alias": alias.alias_name,
+        "champion_run_id": run.run_id, "approved_by": req.approved_by, "approved_at": promoted_at.isoformat(),
+        "decision": "promoted", "reason": req.description, "trained_model_type": row.trained_model_type,
+        "is_override": row.is_override}
+    await db.flush()
+    return PromoteResponse(selection_id=row.selection_id, alias_name=alias.alias_name, run_id=run.run_id,
+        run_status=alias.run_status, model_type=row.trained_model_type, is_override=row.is_override, promoted_at=promoted_at)
+```
+
+### Backend routes (`app/features/model_selection/routes.py`)
+
+```python
+@router.post("/{selection_id}/train-selected", response_model=TrainWinnerResponse, status_code=200)
+async def train_selected(selection_id: str, request: TrainSelectedRequest, db=Depends(get_db)):
+    try: return await ModelSelectionService().train_selected(db, selection_id, request.model_type, request.override_reason)
+    except ValueError as exc: raise BadRequestError(message=str(exc)) from exc
+    except SQLAlchemyError as exc: raise DatabaseError(message="Failed to train selected model", details={"error": str(exc)}) from exc
+
+# predict gains an optional body; the ROUTE assembles the response from the service tuple (service returns
+# tuple[ForecastSummary, ForecastDecision | None], NOT the response model):
+@router.post("/{selection_id}/predict", response_model=PredictWinnerResponse, status_code=200)
+async def predict_winner(selection_id: str, request: ForecastDecisionParams | None = Body(default=None), db=Depends(get_db)):
+    params = request or ForecastDecisionParams()
+    service = ModelSelectionService()
+    try:
+        forecast, decision = await service.predict_winner(db, selection_id, params.lead_time_days, params.service_level)
+        return PredictWinnerResponse(selection_id=selection_id, forecast=forecast, decision=decision)
+    except ValueError as exc: raise BadRequestError(message=str(exc)) from exc   # feature-aware reject → 400
+    except SQLAlchemyError as exc: raise DatabaseError(message="Failed to forecast with winning model", details={"error": str(exc)}) from exc
+
+@router.post("/{selection_id}/promote", response_model=PromoteResponse, status_code=200)
+async def promote(selection_id: str, request: PromoteRequest, db=Depends(get_db)):
+    try: return await ModelSelectionService().promote(db, selection_id, request)
+    except ValueError as exc: raise BadRequestError(message=str(exc)) from exc   # registry "only SUCCESS runs" → 400
+    except SQLAlchemyError as exc: raise DatabaseError(message="Failed to promote champion", details={"error": str(exc)}) from exc
+# NotFoundError(404)/UnprocessableEntityError(422) raised in-service bubble to the global handler.
+```
+
+### Implementation Tasks (dependency-ordered)
+
+```yaml
+# ───────────────────────── BACKEND ─────────────────────────
+Task 1 — Schemas:
+  MODIFY app/features/model_selection/schemas.py: + TrainSelectedRequest, ForecastDecisionParams, ForecastDecision,
+    PromoteRequest, PromoteResponse; EXTEND ForecastSummary (peak/low Optional), TrainWinnerResponse (is_override,
+    override_warning defaults), PredictWinnerResponse (decision Optional).
+  MODIFY tests/test_schemas.py: alias_name regex 422; service_level bound; back-compat defaults; validate_python path.
+
+Task 2 — Pure decision module:
+  CREATE app/features/model_selection/decision.py: z_for_service_level, compute_forecast_decision, forecast_peak_low
+    (pure, no DB/IO; mirror explanations.py). Reuse the locked bias sentence (single constant).
+  CREATE tests/test_decision.py: z-table exact + nearest; safety_stock=z*pstdev*sqrt(L) (verify one-liner); flat forecast
+    → safety_stock 0.0; peak/low correctness; bias text under/over/neutral.
+
+Task 3 — ORM + migration:
+  MODIFY app/features/model_selection/models.py: + the seven columns (Boolean + Integer imports) — the six
+    decision/promotion columns PLUS feature_frame_version (Integer, NOT NULL, server_default "1", default 1).
+  RUN: uv run alembic heads   # chain off the LIVE head (Slice B migration must precede)
+  CREATE alembic/versions/<rev>_add_model_selection_decision_promotion.py: add_column x7 (server_default 'false' for
+    is_override; server_default '1' for feature_frame_version — backfills legacy rows only); downgrade drops all seven.
+    NO CheckConstraint change.
+  MODIFY tests/test_models.py: defaults (is_override False, feature_frame_version 1); JSONB promotion_decision round-trip.
+
+Task 4 — Service:
+  MODIFY app/features/model_selection/service.py:
+    - PERSIST feature_frame_version at run-creation (M1): ADD `row.feature_frame_version = request.feature_frame_version`
+      in run_selection (sync, merged) AND submit_run (async, Slice B's) — additive column write, both live here.
+    - + train_selected (validate against row.candidate_models incl. failed candidates; thread
+      feature_frame_version=row.feature_frame_version into train_model), + promote (lazy RegistryService import; pass
+      runtime_info_extras={"feature_frame_version": row.feature_frame_version} — the REAL value, never a hardcoded 1).
+    - EXTEND predict_winner → returns tuple[ForecastSummary, ForecastDecision | None] (route assembles the response).
+    - + _params_for_trained, + _register_artifact helper; train_winner additively sets trained_model_type/
+      is_override=False and threads feature_frame_version=row.feature_frame_version into its train_model call.
+      REUSE _load/_load_ranking/_forecast_summary.
+  MODIFY tests/test_service.py: train_selected happy + non-candidate 400 + override warning + failed-candidate still
+    trainable; predict decision math + tuple return; run-creation persists request feature_frame_version; train_selected
+    threads V2 into train_model; promote orchestration with monkeypatched "app.features.registry.service.RegistryService"
+    (create_run/update_run/create_alias) + "app.features.forecasting.service.ForecastingService"; promote carries the
+    REAL feature_frame_version (V2 run → 2); promote-before-train 422; non-recommended-no-ack 422.
+
+Task 5 — Routes:
+  MODIFY app/features/model_selection/routes.py: + POST /train-selected, + POST /promote; predict gains
+    `request: ForecastDecisionParams | None = Body(default=None)`. Mirror error mapping.
+  MODIFY tests/test_routes.py (ASGITransport _client harness): train-selected 200 + 400 (bad model_type);
+    predict no-body 200 (decision from defaults) + with-body 200; promote 200 + 422 (before train / no ack) +
+    422 (bad alias_name via schema); train-winner unchanged (regression).
+
+Task 6 — Integration:
+  MODIFY tests/test_routes_integration.py (@pytest.mark.integration, real engine, prefix-scoped teardown):
+    seed a pair → POST /runs (or legacy /run) to terminal winner → train-selected/train-winner → predict (decision
+    present, peak/low set) → promote → assert a registry model_run (SUCCESS) + alias exist and champion_run_id/
+    promoted_alias/promotion_decision persisted on the selection, and the registry run's runtime_info carries the run's
+    REAL feature_frame_version (a V2-configured run promotes as 2). Teardown must also clean the created registry
+    run/alias (extend the prefix-scoped finally; delete RunAlias + ModelRun by run_id/store_id).
+
+# ───────────────────────── FRONTEND (extends Slice A/B) ─────────────────────────
+Task 7 — Types:
+  MODIFY frontend/src/types/api.ts (Model Selection section): + TrainSelectedRequest, ForecastDecisionParams,
+    ForecastDecision, PromoteRequest, PromoteResponse; EXTEND ForecastSummary (peak/low) + train/predict response types.
+    Do NOT redefine Slice A/B types.
+
+Task 8 — Hooks:
+  MODIFY frontend/src/hooks/use-model-selection.ts: + useTrainWinner, useTrainSelected, usePredictWinner,
+    usePromoteChampion (useMutation; on success invalidate ['model-selection','run', id]). MIRROR use-runs.ts mutation shape.
+  MODIFY hooks/use-model-selection.test.ts: each hook POSTs to the right /model-selection/{id}/... endpoint; cache invalidated.
+
+Task 9 — Decision components (components/champion-selector/decision/):
+  CREATE winner-decision-panel.tsx (+test): show recommended winner; candidate Select to override; AlertDialog warning
+    + override_reason when picking non-winner; calls useTrainWinner / useTrainSelected.
+  CREATE train-forecast-actions.tsx (+test): Train + Forecast buttons; if winner.supports_auto_predict===false (catalog),
+    render the blocked "feature-aware → use What-If Planner" state and disable Forecast.
+  CREATE forecast-summary-card.tsx (+test): KpiCard tiles — total/avg/peak day/low day/horizon (null-safe).
+  CREATE forecast-chart.tsx (+test): TimeSeriesChart wrapper (predictedKey='forecast', interval if bounds).
+  CREATE daily-forecast-table.tsx (+test): shadcn Table — date, forecast, lower, upper.
+  CREATE business-interpretation-panel.tsx (+test): headline/why-won (from business_summary) + expected demand +
+    bias_risk_text (BIAS_EXPLANATION) + caveats.
+  CREATE safety-stock-panel.tsx (+test): lead_time/service_level inputs → re-predict (or recompute) → labeled
+    "Safety stock (heuristic)" with z, sigma, expected demand, reorder point + caveat.
+  CREATE promote-champion-dialog.tsx (+test): alias-name input (regex), approver field, non-recommended ack checkbox
+    (only when is_override) → usePromoteChampion; success toast + show promoted alias. MIRROR promote-confirmation-dialog.tsx.
+
+Task 10 — Page wiring:
+  MODIFY frontend/src/pages/visualize/champion.tsx: when useSelectionRun is terminal AND winner != null, render the
+    decision section (WinnerDecisionPanel → TrainForecastActions → ForecastSummaryCard + ForecastChart + DailyForecastTable
+    → BusinessInterpretationPanel + SafetyStockPanel → PromoteChampionDialog). Gate forecast on supports_auto_predict.
+    Do NOT alter Slice B's progress/results blocks above it.
+
+# ───────────────────────── DOCS + DOGFOOD ─────────────────────────
+Task 11 — User guide:
+  CREATE docs/user-guide/champion-selector-guide.md: the full journey (select → run → results → decide/override → train →
+    forecast → interpret → promote), the WAPE-default + tie-break note, the bias under/over wording, the safety-stock
+    heuristic caveat, and the "promotion requires explicit approval and is recorded" rule. Cross-link from feature-reference.md.
+
+Task 12 — Dogfood (manual; see Validation Loop):
+  Run the end-to-end probe over http://localhost:5173 with REAL discovered ids; confirm train-selected override warning,
+  forecast summary/chart/table, business + safety-stock panels, the feature-aware blocked state, and a gated promote that
+  yields a registry alias. Capture a note in the PR description.
+```
+
+### Integration Points
+
+```yaml
+DATABASE:
+  - migration: + trained_model_type / is_override / override_reason / champion_run_id / promoted_alias /
+    promotion_decision on model_selection_run (all nullable; is_override server_default 'false'). No constraint change.
+CONFIG: none new (reuses forecast_model_artifacts_dir + registry_artifact_root + the registry storage provider).
+ROUTES (backend): app/features/model_selection/routes.py only (+ /train-selected, /promote; predict body) — router
+  already wired in app/main.py.
+CROSS-SLICE (lazy imports inside service methods, mirroring the existing ForecastingService import):
+  - ForecastingService (train_selected); RegistryService + registry schemas (promote). NEVER import another slice's
+    ORM at module scope beyond the sanctioned data_platform read.
+FRONTEND: no new ROUTE/NAV (Slice A added /visualize/champion); extend the page + hooks + types only.
+OBSERVABILITY (structlog, mirror existing model_selection.* events):
+  - model_selection.winner_selected_override / .winner_predicted (extend) / .champion_promoted (approved_by, alias, run_id).
+DOCS: docs/user-guide/champion-selector-guide.md (+ feature-reference.md cross-link).
+```
+
+## Validation Loop
+
+### Level 1 — Backend syntax & policy
+
+```bash
+uv run ruff check app/features/model_selection app/features/model_selection/decision.py alembic/versions
+uv run ruff format --check app/features/model_selection alembic/versions
+uv run mypy app/features/model_selection
+uv run pyright app/features/model_selection
+uv run pytest app/core/tests/test_strict_mode_policy.py -v   # must stay green (no new strict date field)
+```
+
+### Level 2 — Backend unit tests
+
+```bash
+uv run pytest app/features/model_selection/tests -v -m "not integration"
+```
+Required new test names (additive to the A/B suite):
+- `test_train_selected_trains_chosen_candidate` / `test_train_selected_rejects_non_candidate_model_type_400`
+- `test_train_selected_sets_is_override_and_warning_for_non_winner`
+- `test_train_winner_now_persists_trained_model_type_not_override`  (regression: train-winner response shape unchanged)
+- `test_decision_z_table_exact_and_nearest` / `test_safety_stock_formula_matches_z_sigma_sqrt_l` / `test_flat_forecast_safety_stock_zero`
+- `test_forecast_peak_low_picks_max_and_min` / `test_bias_risk_text_under_over_neutral`
+- `test_predict_attaches_decision_and_peak_low` / `test_predict_empty_body_uses_default_lead_time_service_level`
+- `test_promote_requires_trained_model_422` / `test_promote_non_recommended_requires_ack_422`
+- `test_promote_orchestrates_create_run_success_and_alias` (mock RegistryService) / `test_promote_persists_promotion_decision_audit`
+- `test_promote_carries_real_feature_frame_version_v2` (a V2 run → RunCreate.runtime_info_extras["feature_frame_version"] == 2; NOT hardcoded)
+- `test_promote_defaults_feature_frame_version_1_for_legacy_run` (unset/legacy row → server_default 1 — the ONLY fallback case using the literal 1)
+- `test_run_creation_persists_request_feature_frame_version` (run_selection + submit_run write row.feature_frame_version from the request)
+- `test_train_selected_threads_feature_frame_version_into_train_model` (V2 run → train_model called with feature_frame_version=2)
+- `test_promote_bad_alias_name_422` (schema regex)
+
+### Level 3 — Migration & integration
+
+```bash
+docker compose up -d
+uv run alembic upgrade head
+uv run pytest app/features/model_selection/tests -v -m integration
+uv run alembic downgrade -1 && uv run alembic upgrade head   # round-trips cleanly
+```
+Integration expectations: the seven columns exist (incl. feature_frame_version); train-selected → predict (decision + peak/low) → promote produces a
+registry `model_run` in SUCCESS + a `run_alias`, with `champion_run_id`/`promoted_alias`/`promotion_decision` persisted;
+teardown removes the created registry run/alias (extend the prefix-scoped cleanup).
+
+### Level 4 — Full gates (must be green before PR)
+
+```bash
+uv run ruff check . && uv run ruff format --check .
+uv run mypy app/ && uv run pyright app/
+uv run pytest -v -m "not integration"
+cd frontend && pnpm tsc --noEmit && pnpm lint && pnpm test --run
+```
+> Known-local-noise: mypy/pyright report pre-existing lightgbm/xgboost optional-dep import errors in forecasting/+registry/
+> (CI installs the extras). Do NOT "fix" them; a green LOCAL mypy can MASK errors that only surface once the extras resolve
+> types (memory: the #355 finalizer cast). Reset the DB (`docker compose down -v && up -d && alembic upgrade head`) before
+> any Level-3 integration run (memory: integration-suite-shared-state-pollution).
+
+### Manual dogfood probe (discover REAL ids first — IDs are NOT 1-based)
+
+```bash
+uv run uvicorn app.main:app --port 8123 &
+curl -s "http://localhost:8123/dimensions/stores?page=1&page_size=5"  | python3 -m json.tool | grep '"id"'
+curl -s "http://localhost:8123/dimensions/products?page=1&page_size=5" | python3 -m json.tool | grep '"id"'
+# 1) run a comparison (Slice B async, or legacy sync /run) to a terminal winner; capture <selection_id>
+# 2) train the recommended winner (no body) OR override:
+curl -s -X POST "http://localhost:8123/model-selection/<sid>/train-selected" -H "Content-Type: application/json" \
+  -d '{"model_type":"seasonal_naive","override_reason":"seasonality"}' | python3 -m json.tool   # is_override + override_warning
+# 3) forecast with a decision body (baseline winner only — feature-aware → 400):
+curl -s -X POST "http://localhost:8123/model-selection/<sid>/predict" -H "Content-Type: application/json" \
+  -d '{"lead_time_days":7,"service_level":0.95}' | python3 -m json.tool | grep -E 'peak|low|safety_stock|reorder'
+# 4) promote (approval-gated, audited):
+curl -s -X POST "http://localhost:8123/model-selection/<sid>/promote" -H "Content-Type: application/json" \
+  -d '{"alias_name":"champion-test","approved_by":"dogfood","acknowledge_non_recommended":true}' | python3 -m json.tool
+curl -s "http://localhost:8123/registry/aliases/champion-test" | python3 -m json.tool    # alias → SUCCESS run
+# 5) frontend: VITE_API_BASE_URL=http://localhost:8123; dogfood /visualize/champion over http://localhost:5173 (NOT a LAN IP).
+```
+Expected: train-selected returns `override_warning` on a non-winner; predict returns peak/low + a labeled safety-stock
+decision (and 400 for a feature-aware winner, where the UI shows the blocked state); promote returns the alias and a
+registry SUCCESS run; the page renders the full decision section.
+
+## Final Validation Checklist
+
+- [ ] `POST /{id}/train-selected` trains a chosen candidate; non-candidate model_type → 400; override persists
+      `is_override`/`override_reason` + returns `override_warning`; `train-winner` response shape unchanged (regression green).
+- [ ] `POST /{id}/predict` (empty or bodied) returns peak/low + a labeled `decision`; safety stock never feeds ranking;
+      feature-aware winner → clean 400 + UI blocked state (no predict call).
+- [ ] `POST /{id}/promote`: requires `approved_by`; non-recommended-no-ack → 422; before-train → 422; bad alias_name → 422;
+      success creates a SUCCESS registry run + alias and persists `champion_run_id`/`promoted_alias`/`promotion_decision`.
+- [ ] `decision.py` is pure; z-table + safety-stock + peak/low + bias text deterministically unit-tested.
+- [ ] Migration adds seven columns (six decision/promotion + feature_frame_version); promote carries the REAL persisted version (V2 run → 2, never a hardcoded 1); `downgrade` removes them on a fresh DB; strict-mode policy test green.
+- [ ] Ranking math (`ranking.py`/`explanations.py`) UNCHANGED; Slice A/B contracts (page/hooks/types/run/progress/results)
+      NOT redefined.
+- [ ] Frontend decision section renders after a terminal winning run: accept/override → train → forecast (summary/chart/
+      table) → business interpretation (bias + labeled safety stock + caveats) → gated promote; feature-aware → blocked.
+- [ ] `docs/user-guide/champion-selector-guide.md` exists (full journey + promotion-is-audited rule); cross-linked.
+- [ ] All Level-1..4 gates pass; dogfood journey completes; `gh issue view <N>` confirms the tracking issue is open.
+- [ ] `git diff --stat` shows no CRLF whole-file noise; `docker-compose.lan.yml` + `uv.lock` NOT staged.
+
+## Anti-Patterns to Avoid
+
+- ❌ Don't rewrite or change the signature/response of the existing `train-winner` / `predict` (Slice B treats them as
+  fixed) — ADD `train-selected`, an OPTIONAL predict body, and additive response fields only.
+- ❌ Don't let safety stock (or any decision-layer value) flow into `rank_candidates`/`build_chart_data` — it must never
+  affect ranking (LOCKED #3 + coordination contract).
+- ❌ Don't fake a forecast for a feature-aware winner — surface the capability limitation (Slice A's
+  `supports_auto_predict`) and route the user to the What-If Planner.
+- ❌ Don't auto-promote — promotion requires explicit `approved_by` + a recorded `promotion_decision`; a non-recommended
+  model requires `acknowledge_non_recommended=true`.
+- ❌ Don't perform comparison inside promote (compare and promote are separate workflows).
+- ❌ Don't register an unverifiable artifact — register the bundle into registry storage (hash + size) before SUCCESS;
+  if that mechanic is out of budget, ship Option-3 scope (no promote) + a follow-up issue rather than a fake artifact.
+- ❌ Don't import another feature slice's ORM/service at module scope — lazy-import `ForecastingService`/`RegistryService`
+  inside the methods (mirror the existing pattern at `service.py:410`).
+- ❌ Don't add an agent tool or `agent_require_approval` entry (promotion is a user REST flow, not an agent mutation).
+- ❌ Don't hardcode `feature_frame_version=1` in promote — persist the request's real version on `model_selection_run`
+  and pass `row.feature_frame_version` into `runtime_info_extras` (V2 runs must promote as V2). The literal `1` appears
+  ONLY as the column's migration server_default (legacy backfill) and as a fallback-case test.
+- ❌ Don't add a new strict request model with a date/UUID/Decimal field (none is needed) — keeps the strict-mode linter green.
+- ❌ Don't hardcode store_id=1/product_id=1 (IDs aren't 1-based); don't `crypto.randomUUID()` client-side; dogfood over
+  http://localhost:5173, not a LAN IP.
+- ❌ Don't redefine Slice A/B types/page/hooks/route — extend additively; keep the legacy sync `POST /run` and async
+  `POST /runs` untouched.
+
+## Confidence Score
+
+**7.5/10** for one-pass implementation success. The core decision actions are de-risked: `train-winner` and `predict`
+already exist and are read verbatim, every reused contract (forecasting train/predict, registry create_run/update_run/
+create_alias, storage.save, the exception classes, the test harness, the frontend chart/promote-dialog precedents) is
+cited to file:line, and the safety-stock heuristic is a small pure function with a verification one-liner. The score is
+below Slice A/B's 8.5 for three reasons: (a) **promotion orchestration** (register run → register artifact → SUCCESS →
+alias) is genuinely novel for this slice and the *artifact-registration* call is the one mechanic not fully pinned —
+the PRP mandates a grep-verify step + a documented Option-3 fallback before coding it; (b) Slice C has a **hard A→B→C
+dependency** — its frontend extends pages/hooks/types that are still unimplemented PRPs, so it cannot land until A and B
+merge; (c) the **integration test must clean up created registry runs/aliases** (cross-slice teardown), a sharp edge the
+existing prefix-scoped fixture doesn't yet cover. All three are called out with concrete mitigations above. A fourth,
+smaller touch (M1): supporting **V2 promotion** adds a `feature_frame_version` column persisted at run-creation in BOTH
+`run_selection` and `submit_run`, threaded into training, and carried into the registry run's `runtime_info_extras` —
+additive and low-risk, but it means Slice C makes a one-line write inside Slice B's `submit_run` (documented in LOCKED #7).
+
+### Scoring table (packaging brainstorm)
+
+| Option | User value | Repo fit | Impl clarity | Risk control | Dep isolation | Total /25 |
+|--------|:---:|:---:|:---:|:---:|:---:|:---:|
+| **1 — Extend model_selection with decision endpoints + decision.py + decision UI (CHOSEN)** | 5 | 5 | 4 | 4 | 4 | **22** |
+| 3 — Forecast output only; defer promotion/governance (de-risking fallback) | 2 | 4 | 5 | 5 | 5 | 21 |
+| 2 — Frontend reuses /forecasting + /registry directly; no new model_selection endpoints | 4 | 2 | 2 | 2 | 2 | 12 |
diff --git a/alembic/env.py b/alembic/env.py
index 4ce8f0e1..2cadd971 100644
--- a/alembic/env.py
+++ b/alembic/env.py
@@ -18,6 +18,7 @@
 from app.features.data_platform import models as data_platform_models  # noqa: F401
 from app.features.explainability import models as explainability_models  # noqa: F401
 from app.features.jobs import models as jobs_models  # noqa: F401
+from app.features.model_selection import models as model_selection_models  # noqa: F401
 from app.features.rag import models as rag_models  # noqa: F401
 from app.features.registry import models as registry_models  # noqa: F401
 from app.features.scenarios import models as scenarios_models  # noqa: F401
diff --git a/alembic/versions/b667d321603c_create_model_selection_run.py b/alembic/versions/b667d321603c_create_model_selection_run.py
new file mode 100644
index 00000000..e3dcaa2a
--- /dev/null
+++ b/alembic/versions/b667d321603c_create_model_selection_run.py
@@ -0,0 +1,129 @@
+"""create_model_selection_run
+
+Revision ID: b667d321603c
+Revises: c1d2e3f40512
+Create Date: 2026-06-01 05:58:51.986105
+
+Creates the ``model_selection_run`` table for the Forecast Champion Selector
+backend (issue #353). One row per ``POST /model-selection/run`` — an auditable
+record of which candidate models competed for a (store, product) pair, over
+which window/policy, and which model won.
+
+JSONB snapshot columns mirror the ``batch_job`` precedent
+(``c1d2e3f40512_create_batch_tables``): every flexible payload (candidate
+configs, policy, availability, ranking, per-candidate results incl. fold chart
+data, winner metrics, forecast summary, business summary) is JSONB so the
+eventual UI PRP can add keys without a schema migration. ``candidate_results``
+holds the full per-candidate detail (incl. fold actuals/predictions) so a
+``GET`` rebuilds the same ``chart_data`` payload the originating ``/run``
+returned — without it the chart's fold-stability and actual-vs-predicted
+overlays could not be reconstructed.
+"""
+
+from collections.abc import Sequence
+
+import sqlalchemy as sa
+from sqlalchemy.dialects import postgresql
+
+from alembic import op
+
+# revision identifiers, used by Alembic.
+revision: str = "b667d321603c"
+down_revision: str | None = "c1d2e3f40512"
+branch_labels: str | Sequence[str] | None = None
+depends_on: str | Sequence[str] | None = None
+
+
+def upgrade() -> None:
+    """Apply migration."""
+    op.create_table(
+        "model_selection_run",
+        sa.Column("id", sa.Integer(), nullable=False),
+        sa.Column("selection_id", sa.String(length=32), nullable=False),
+        sa.Column("store_id", sa.Integer(), nullable=False),
+        sa.Column("product_id", sa.Integer(), nullable=False),
+        sa.Column("start_date", sa.Date(), nullable=False),
+        sa.Column("end_date", sa.Date(), nullable=False),
+        sa.Column("forecast_horizon", sa.Integer(), nullable=False),
+        sa.Column("ranking_metric", sa.String(length=20), nullable=False),
+        sa.Column("status", sa.String(length=20), nullable=False),
+        sa.Column("candidate_models", postgresql.JSONB(astext_type=sa.Text()), nullable=False),
+        sa.Column("policy_snapshot", postgresql.JSONB(astext_type=sa.Text()), nullable=False),
+        sa.Column("availability_snapshot", postgresql.JSONB(astext_type=sa.Text()), nullable=True),
+        sa.Column("ranking_result", postgresql.JSONB(astext_type=sa.Text()), nullable=True),
+        sa.Column("candidate_results", postgresql.JSONB(astext_type=sa.Text()), nullable=True),
+        sa.Column("chart_data", postgresql.JSONB(astext_type=sa.Text()), nullable=True),
+        sa.Column("winner_model_type", sa.String(length=40), nullable=True),
+        sa.Column("winner_metrics", postgresql.JSONB(astext_type=sa.Text()), nullable=True),
+        sa.Column("final_model_path", sa.String(length=512), nullable=True),
+        sa.Column("forecast_result", postgresql.JSONB(astext_type=sa.Text()), nullable=True),
+        sa.Column("business_summary", postgresql.JSONB(astext_type=sa.Text()), nullable=True),
+        sa.Column("error_message", sa.String(length=2000), nullable=True),
+        sa.Column("completed_at", sa.DateTime(timezone=True), nullable=True),
+        sa.Column(
+            "created_at",
+            sa.DateTime(timezone=True),
+            server_default=sa.text("now()"),
+            nullable=False,
+        ),
+        sa.Column(
+            "updated_at",
+            sa.DateTime(timezone=True),
+            server_default=sa.text("now()"),
+            nullable=False,
+        ),
+        sa.CheckConstraint(
+            "status IN ('pending', 'running', 'completed', 'partial', 'failed')",
+            name="ck_model_selection_run_valid_status",
+        ),
+        sa.PrimaryKeyConstraint("id"),
+    )
+    op.create_index(
+        op.f("ix_model_selection_run_selection_id"),
+        "model_selection_run",
+        ["selection_id"],
+        unique=True,
+    )
+    op.create_index(
+        op.f("ix_model_selection_run_store_id"),
+        "model_selection_run",
+        ["store_id"],
+        unique=False,
+    )
+    op.create_index(
+        op.f("ix_model_selection_run_product_id"),
+        "model_selection_run",
+        ["product_id"],
+        unique=False,
+    )
+    op.create_index(
+        op.f("ix_model_selection_run_status"),
+        "model_selection_run",
+        ["status"],
+        unique=False,
+    )
+    op.create_index(
+        "ix_model_selection_run_store_product_created",
+        "model_selection_run",
+        ["store_id", "product_id", "created_at"],
+        unique=False,
+    )
+    op.create_index(
+        "ix_model_selection_run_status_created",
+        "model_selection_run",
+        ["status", "created_at"],
+        unique=False,
+    )
+
+
+def downgrade() -> None:
+    """Revert migration."""
+    op.drop_index("ix_model_selection_run_status_created", table_name="model_selection_run")
+    op.drop_index(
+        "ix_model_selection_run_store_product_created", table_name="model_selection_run"
+    )
+    op.drop_index(op.f("ix_model_selection_run_status"), table_name="model_selection_run")
+    op.drop_index(op.f("ix_model_selection_run_product_id"), table_name="model_selection_run")
+    op.drop_index(op.f("ix_model_selection_run_store_id"), table_name="model_selection_run")
+    op.drop_index(op.f("ix_model_selection_run_selection_id"), table_name="model_selection_run")
+    op.drop_table("model_selection_run")
diff --git a/alembic/versions/d3e4f5a6b7c8_add_model_selection_candidate_and_progress.py b/alembic/versions/d3e4f5a6b7c8_add_model_selection_candidate_and_progress.py
new file mode 100644
index 00000000..c510c5ef
--- /dev/null
+++ b/alembic/versions/d3e4f5a6b7c8_add_model_selection_candidate_and_progress.py
@@ -0,0 +1,185 @@
+"""add model_selection_candidate and async progress columns
+
+Revision ID: d3e4f5a6b7c8
+Revises: b667d321603c
+Create Date: 2026-06-01 09:30:00.000000
+
+Slice B of the Forecast Champion Selector (issue #360). Converts the selection
+run into a DB-backed async LRO:
+
+- creates ``model_selection_candidate`` (one row per candidate, FK CASCADE to
+  ``model_selection_run.selection_id``) carrying per-candidate status, result
+  JSONB, error, and timing — the live-progress + audit surface;
+- adds ``started_at`` + the four final count columns to ``model_selection_run``;
+- widens the run status CheckConstraint to include ``'cancelled'`` (forward-only
+  drop + recreate of the named constraint).
+
+Mirrors ``c1d2e3f40512_create_batch_tables`` for JSONB / index / FK style.
+"""
+
+from collections.abc import Sequence
+
+import sqlalchemy as sa
+from sqlalchemy.dialects import postgresql
+
+from alembic import op
+
+# revision identifiers, used by Alembic.
+revision: str = "d3e4f5a6b7c8"
+down_revision: str | None = "b667d321603c"
+branch_labels: str | Sequence[str] | None = None
+depends_on: str | Sequence[str] | None = None
+
+_OLD_RUN_STATUS = "status IN ('pending', 'running', 'completed', 'partial', 'failed')"
+_NEW_RUN_STATUS = (
+    "status IN ('pending', 'running', 'completed', 'partial', 'failed', 'cancelled')"
+)
+
+
+def upgrade() -> None:
+    """Apply migration."""
+    # ------------------------------------------------------------------
+    # 1. Widen the run status CheckConstraint to include 'cancelled'.
+    # ------------------------------------------------------------------
+    op.drop_constraint(
+        "ck_model_selection_run_valid_status",
+        "model_selection_run",
+        type_="check",
+    )
+    op.create_check_constraint(
+        "ck_model_selection_run_valid_status",
+        "model_selection_run",
+        _NEW_RUN_STATUS,
+    )
+
+    # ------------------------------------------------------------------
+    # 2. Additive progress columns on the parent run.
+    # ------------------------------------------------------------------
+    op.add_column(
+        "model_selection_run",
+        sa.Column("started_at", sa.DateTime(timezone=True), nullable=True),
+    )
+    op.add_column(
+        "model_selection_run",
+        sa.Column("total_candidates", sa.Integer(), nullable=False, server_default="0"),
+    )
+    op.add_column(
+        "model_selection_run",
+        sa.Column(
+            "completed_candidates", sa.Integer(), nullable=False, server_default="0"
+        ),
+    )
+    op.add_column(
+        "model_selection_run",
+        sa.Column("failed_candidates", sa.Integer(), nullable=False, server_default="0"),
+    )
+    op.add_column(
+        "model_selection_run",
+        sa.Column(
+            "cancelled_candidates", sa.Integer(), nullable=False, server_default="0"
+        ),
+    )
+
+    # ------------------------------------------------------------------
+    # 3. Per-candidate execution child table (FK CASCADE on selection_id).
+    # ------------------------------------------------------------------
+    op.create_table(
+        "model_selection_candidate",
+        sa.Column("id", sa.Integer(), nullable=False),
+        sa.Column("candidate_id", sa.String(length=32), nullable=False),
+        sa.Column("selection_id", sa.String(length=32), nullable=False),
+        sa.Column("ordinal", sa.Integer(), nullable=False),
+        sa.Column("model_type", sa.String(length=40), nullable=False),
+        sa.Column("params", postgresql.JSONB(astext_type=sa.Text()), nullable=False),
+        sa.Column("status", sa.String(length=20), nullable=False),
+        sa.Column("result", postgresql.JSONB(astext_type=sa.Text()), nullable=True),
+        sa.Column("error_message", sa.String(length=2000), nullable=True),
+        sa.Column("error_type", sa.String(length=100), nullable=True),
+        sa.Column("started_at", sa.DateTime(timezone=True), nullable=True),
+        sa.Column("completed_at", sa.DateTime(timezone=True), nullable=True),
+        sa.Column("duration_ms", sa.Integer(), nullable=True),
+        sa.Column(
+            "created_at",
+            sa.DateTime(timezone=True),
+            server_default=sa.text("now()"),
+            nullable=False,
+        ),
+        sa.Column(
+            "updated_at",
+            sa.DateTime(timezone=True),
+            server_default=sa.text("now()"),
+            nullable=False,
+        ),
+        sa.CheckConstraint(
+            "status IN ('pending', 'running', 'completed', 'failed', 'cancelled')",
+            name="ck_model_selection_candidate_valid_status",
+        ),
+        sa.ForeignKeyConstraint(
+            ["selection_id"],
+            ["model_selection_run.selection_id"],
+            ondelete="CASCADE",
+        ),
+        sa.PrimaryKeyConstraint("id"),
+    )
+    op.create_index(
+        op.f("ix_model_selection_candidate_candidate_id"),
+        "model_selection_candidate",
+        ["candidate_id"],
+        unique=True,
+    )
+    op.create_index(
+        op.f("ix_model_selection_candidate_selection_id"),
+        "model_selection_candidate",
+        ["selection_id"],
+        unique=False,
+    )
+    op.create_index(
+        op.f("ix_model_selection_candidate_status"),
+        "model_selection_candidate",
+        ["status"],
+        unique=False,
+    )
+    op.create_index(
+        "ix_model_selection_candidate_selection_status",
+        "model_selection_candidate",
+        ["selection_id", "status"],
+        unique=False,
+    )
+
+
+def downgrade() -> None:
+    """Revert migration."""
+    op.drop_index(
+        "ix_model_selection_candidate_selection_status",
+        table_name="model_selection_candidate",
+    )
+    op.drop_index(
+        op.f("ix_model_selection_candidate_status"),
+        table_name="model_selection_candidate",
+    )
+    op.drop_index(
+        op.f("ix_model_selection_candidate_selection_id"),
+        table_name="model_selection_candidate",
+    )
+    op.drop_index(
+        op.f("ix_model_selection_candidate_candidate_id"),
+        table_name="model_selection_candidate",
+    )
+    op.drop_table("model_selection_candidate")
+
+    op.drop_column("model_selection_run", "cancelled_candidates")
+    op.drop_column("model_selection_run", "failed_candidates")
+    op.drop_column("model_selection_run", "completed_candidates")
+    op.drop_column("model_selection_run", "total_candidates")
+    op.drop_column("model_selection_run", "started_at")
+
+    op.drop_constraint(
+        "ck_model_selection_run_valid_status",
+        "model_selection_run",
+        type_="check",
+    )
+    op.create_check_constraint(
+        "ck_model_selection_run_valid_status",
+        "model_selection_run",
+        _OLD_RUN_STATUS,
+    )
diff --git a/alembic/versions/e4f5a6b7c8d9_add_model_selection_decision_promotion.py b/alembic/versions/e4f5a6b7c8d9_add_model_selection_decision_promotion.py
new file mode 100644
index 00000000..73f2b648
--- /dev/null
+++ b/alembic/versions/e4f5a6b7c8d9_add_model_selection_decision_promotion.py
@@ -0,0 +1,90 @@
+"""add model_selection decision + promotion columns
+
+Revision ID: e4f5a6b7c8d9
+Revises: d3e4f5a6b7c8
+Create Date: 2026-06-01 11:00:00.000000
+
+Slice C of the Forecast Champion Selector (issue #362). Adds the decision +
+operationalization columns to ``model_selection_run`` — all ADDITIVE:
+
+- ``trained_model_type`` / ``is_override`` / ``override_reason`` — which model
+  the final bundle holds and whether it was a non-recommended override;
+- ``champion_run_id`` / ``promoted_alias`` / ``promotion_decision`` — the
+  approval-gated registry handoff (registry ``model_run.run_id``, alias name,
+  and the audited decision record);
+- ``feature_frame_version`` — M1, the request's V (1 or 2) persisted at
+  run-creation so train/promote carry the REAL version end-to-end. The
+  server_default ``'1'`` backfills legacy rows ONLY (not a code hardcode).
+
+No CheckConstraint change. ``downgrade`` drops all seven columns.
+"""
+
+from collections.abc import Sequence
+
+import sqlalchemy as sa
+from sqlalchemy.dialects import postgresql
+
+from alembic import op
+
+# revision identifiers, used by Alembic.
+revision: str = "e4f5a6b7c8d9"
+down_revision: str | None = "d3e4f5a6b7c8"
+branch_labels: str | Sequence[str] | None = None
+depends_on: str | Sequence[str] | None = None
+
+
+def upgrade() -> None:
+    """Apply migration — seven additive columns on model_selection_run."""
+    op.add_column(
+        "model_selection_run",
+        sa.Column("trained_model_type", sa.String(length=40), nullable=True),
+    )
+    op.add_column(
+        "model_selection_run",
+        sa.Column(
+            "is_override",
+            sa.Boolean(),
+            nullable=False,
+            server_default=sa.text("false"),
+        ),
+    )
+    op.add_column(
+        "model_selection_run",
+        sa.Column("override_reason", sa.String(length=2000), nullable=True),
+    )
+    op.add_column(
+        "model_selection_run",
+        sa.Column("champion_run_id", sa.String(length=32), nullable=True),
+    )
+    op.add_column(
+        "model_selection_run",
+        sa.Column("promoted_alias", sa.String(length=100), nullable=True),
+    )
+    op.add_column(
+        "model_selection_run",
+        sa.Column(
+            "promotion_decision",
+            postgresql.JSONB(astext_type=sa.Text()),
+            nullable=True,
+        ),
+    )
+    op.add_column(
+        "model_selection_run",
+        sa.Column(
+            "feature_frame_version",
+            sa.Integer(),
+            nullable=False,
+            server_default=sa.text("1"),
+        ),
+    )
+
+
+def downgrade() -> None:
+    """Revert migration — drop the seven Slice C columns."""
+    op.drop_column("model_selection_run", "feature_frame_version")
+    op.drop_column("model_selection_run", "promotion_decision")
+    op.drop_column("model_selection_run", "promoted_alias")
+    op.drop_column("model_selection_run", "champion_run_id")
+    op.drop_column("model_selection_run", "override_reason")
+    op.drop_column("model_selection_run", "is_override")
+    op.drop_column("model_selection_run", "trained_model_type")
diff --git a/app/core/config.py b/app/core/config.py
index 09a30cfc..e2d76a85 100644
--- a/app/core/config.py
+++ b/app/core/config.py
@@ -134,6 +134,17 @@ class Settings(BaseSettings):
     # are uncancellable mid-call, so a long fit can stall the drain.
     batch_cancel_drain_timeout_seconds: int = 30
 
+    # Model selection (champion selector) async runner (Slice B) — mirrors the
+    # batch runner. Hard upper bound on concurrent candidate backtests across
+    # all active selection runs on this host; sized for the same Postgres pool
+    # (pool_size=5, max_overflow=10). Setting this to 1 makes the runner
+    # sequential. Env override: MODEL_SELECTION_GLOBAL_MAX_PARALLEL=8 (restart).
+    model_selection_global_max_parallel: int = 4
+    # Max seconds DELETE /model-selection/{id} waits for in-flight candidates to
+    # settle before returning RFC 7807 504. In-flight sklearn/LightGBM fits are
+    # uncancellable mid-call, so a long fit can stall the drain.
+    model_selection_cancel_drain_timeout_seconds: int = 30
+
     # RAG Embedding Configuration
     rag_embedding_provider: Literal["openai", "ollama"] = "openai"
     openai_api_key: str = ""
diff --git a/app/core/exceptions.py b/app/core/exceptions.py
index fd5e2b36..1e6279ea 100644
--- a/app/core/exceptions.py
+++ b/app/core/exceptions.py
@@ -10,6 +10,7 @@
 
 from app.core.logging import get_logger
 from app.core.problem_details import (
+    EMBEDDING_AUTH_CODE,
     ERROR_TYPES,
     ProblemDetailResponse,
     problem_response,
@@ -223,6 +224,36 @@ def __init__(
         )
 
 
+class EmbeddingProviderAuthError(ForecastLabError):
+    """502 — the embedding provider rejected the configured credentials.
+
+    Raised when the RAG embedding provider returns an authentication/
+    authorization failure (HTTP 401/403 — an invalid, placeholder, or
+    unauthorized API key) rather than a transient connection/server failure.
+    Keeps the public ``/rag`` status at 502 (an upstream/gateway failure from
+    the caller's perspective) but emits a *machine-readable* ``EMBEDDING_AUTH``
+    problem ``type``/``code`` so consumers — notably the showcase demo
+    pipeline — can classify it and SKIP the knowledge phase gracefully instead
+    of hard-failing (issue #329). Disambiguated from a generic embedding 502
+    (bare ``{"detail": ...}``) via the ``type`` URI in the problem+json body,
+    mirroring the :class:`UnprocessableEntityError` 422 precedent.
+    """
+
+    error_type_uri: str = ERROR_TYPES[EMBEDDING_AUTH_CODE]
+
+    def __init__(
+        self,
+        message: str = "Embedding provider rejected the configured credentials",
+        details: dict[str, Any] | None = None,
+    ) -> None:
+        super().__init__(
+            message=message,
+            code=EMBEDDING_AUTH_CODE,
+            status_code=502,
+            details=details,
+        )
+
+
 # =============================================================================
 # Exception Handlers (RFC 7807)
 # =============================================================================
diff --git a/app/core/problem_details.py b/app/core/problem_details.py
index 7de6e462..f8bba455 100644
--- a/app/core/problem_details.py
+++ b/app/core/problem_details.py
@@ -23,6 +23,12 @@
 # Base URI for error types (relative URIs for portability)
 ERROR_TYPE_BASE = "/errors"
 
+# Machine-readable code for an embedding-provider auth failure (#329). Single
+# source of truth shared by the producer (EmbeddingProviderAuthError, which
+# stamps this as the problem ``code``/``type``) and the consumer (the showcase
+# demo pipeline's classifier) so the marker never drifts between the two.
+EMBEDDING_AUTH_CODE = "EMBEDDING_AUTH"
+
 ERROR_TYPES = {
     "NOT_FOUND": f"{ERROR_TYPE_BASE}/not-found",
     "VALIDATION_ERROR": f"{ERROR_TYPE_BASE}/validation",
@@ -36,6 +42,7 @@
     "BAD_REQUEST": f"{ERROR_TYPE_BASE}/bad-request",
     "SERVICE_UNAVAILABLE": f"{ERROR_TYPE_BASE}/service-unavailable",
     "GATEWAY_TIMEOUT": f"{ERROR_TYPE_BASE}/gateway-timeout",
+    EMBEDDING_AUTH_CODE: f"{ERROR_TYPE_BASE}/embedding-auth",
 }
 
 
diff --git a/app/core/tests/test_config.py b/app/core/tests/test_config.py
index 0dc96733..496c29bb 100644
--- a/app/core/tests/test_config.py
+++ b/app/core/tests/test_config.py
@@ -23,6 +23,15 @@ def test_settings_has_defaults(monkeypatch):
     assert settings.api_port == 8123
 
 
+def test_model_selection_runner_defaults(monkeypatch):
+    """Slice B async-runner settings default to the batch-mirrored values."""
+    monkeypatch.delenv("MODEL_SELECTION_GLOBAL_MAX_PARALLEL", raising=False)
+    monkeypatch.delenv("MODEL_SELECTION_CANCEL_DRAIN_TIMEOUT_SECONDS", raising=False)
+    settings = Settings(_env_file=None)
+    assert settings.model_selection_global_max_parallel == 4
+    assert settings.model_selection_cancel_drain_timeout_seconds == 30
+
+
 def test_settings_is_development_property():
     """is_development should return True for development env."""
     settings = Settings(app_env="development")
diff --git a/app/features/agents/agents/base.py b/app/features/agents/agents/base.py
index f9f4e1a0..4ccd86b3 100644
--- a/app/features/agents/agents/base.py
+++ b/app/features/agents/agents/base.py
@@ -7,12 +7,14 @@
 
 import functools
 import inspect
+import json
 import os
 from collections.abc import Awaitable, Callable
-from typing import Any
+from typing import Any, cast
 
+import httpx
 import structlog
-from pydantic_ai import ModelRetry
+from pydantic_ai import Agent, ModelRetry
 from pydantic_ai.models import Model
 from pydantic_ai.models.fallback import FallbackModel
 from pydantic_ai.models.openai import OpenAIChatModel
@@ -62,6 +64,71 @@ async def wrapper(*args: P.args, **kwargs: P.kwargs) -> ToolReturnT:
     return wrapper
 
 
+def _coerce_null_message_content(body: bytes) -> bytes | None:
+    """Coerce ``messages[*].content: null`` -> ``""`` in a chat-request body.
+
+    Ollama's OpenAI-compatible ``/v1/chat/completions`` rejects any message
+    whose ``content`` is JSON ``null`` and which carries no ``tool_calls`` with
+    ``400 invalid message content type: <nil>`` — stricter than the real OpenAI
+    API, which tolerates it. A weak local model can emit a degenerate empty
+    assistant turn (no text, no tool call); PydanticAI serialises it as
+    ``content: null`` and then *replays* that message on its validation-retry,
+    so every retry 400s and the whole run dies with a ``FallbackExceptionGroup``.
+    Coercing ``null`` -> ``""`` keeps the message OpenAI-spec-valid and lets the
+    retry loop proceed.
+
+    Args:
+        body: The raw outgoing request body bytes.
+
+    Returns:
+        Re-serialised body bytes when a null ``content`` was rewritten, or
+        ``None`` when nothing changed (the common case) so the caller can
+        forward the original request untouched.
+    """
+    try:
+        parsed = json.loads(body)
+    except (ValueError, TypeError):
+        return None
+    if not isinstance(parsed, dict):
+        return None
+    payload = cast("dict[str, Any]", parsed)
+    messages = payload.get("messages")
+    if not isinstance(messages, list):
+        return None
+    message_list: list[Any] = messages
+    changed = False
+    for message in message_list:
+        if isinstance(message, dict) and "content" in message and message["content"] is None:
+            message["content"] = ""
+            changed = True
+    if not changed:
+        return None
+    return json.dumps(payload).encode("utf-8")
+
+
+class _OllamaNullContentTransport(httpx.AsyncHTTPTransport):
+    """httpx transport that null-content-sanitises outgoing Ollama requests.
+
+    See :func:`_coerce_null_message_content` for the Ollama-compat defect this
+    works around. Applied to the ``OllamaProvider``'s HTTP client so the fix
+    covers both the streaming and non-streaming agent paths.
+    """
+
+    async def handle_async_request(self, request: httpx.Request) -> httpx.Response:
+        sanitized = _coerce_null_message_content(request.content)
+        if sanitized is not None:
+            headers = dict(request.headers)
+            headers.pop("content-length", None)  # httpx recomputes from the new body
+            request = httpx.Request(
+                request.method,
+                request.url,
+                headers=headers,
+                content=sanitized,
+                extensions=request.extensions,
+            )
+        return await super().handle_async_request(request)
+
+
 def build_agent_model(identifier: str) -> str | Model:
     """Build the PydanticAI ``model`` argument for an agent identifier.
 
@@ -85,7 +152,17 @@ def build_agent_model(identifier: str) -> str | Model:
     model_name = identifier.split(":", 1)[1]
     # CRITICAL: Ollama's OpenAI-compatible base ends in /v1.
     base_url = settings.ollama_base_url.rstrip("/") + "/v1"
-    return OpenAIChatModel(model_name, provider=OllamaProvider(base_url=base_url))
+    # The null-content sanitiser lives on the HTTP client (see
+    # _OllamaNullContentTransport). A generous read timeout is required because
+    # local generation on an 8B model routinely exceeds httpx's 5s default.
+    http_client = httpx.AsyncClient(
+        transport=_OllamaNullContentTransport(),
+        timeout=httpx.Timeout(600.0, connect=10.0),
+    )
+    return OpenAIChatModel(
+        model_name,
+        provider=OllamaProvider(base_url=base_url, http_client=http_client),
+    )
 
 
 def reset_agent_caches() -> None:
@@ -171,6 +248,40 @@ def build_agent_model_with_fallback() -> Model | str:
     return FallbackModel(primary, fallback)
 
 
+FINALIZER_SYSTEM_PROMPT = """You are a concise analyst for ForecastLabAI.
+Answer the user's question using ONLY the provided tool data. Be specific and brief
+(2-4 sentences, plain text — no JSON, no preamble).
+- If the user asked for a ranking (lowest/highest WAPE, MAE, RMSE, …), name the
+  specific run/item and its value, and ignore entries whose metric is missing.
+- If the data is empty, say so plainly.
+- Never invent values, run ids, or entities that are not present in the data.
+"""
+
+
+def build_finalizer_agent() -> Agent[None, str]:
+    """Build a tool-less, plain-text agent that salvages an answer from tool data.
+
+    Weak local models (e.g. ``ollama:llama3.1:8b``) reliably call tools and obtain
+    the data, but cannot wrap the result in the primary agent's structured
+    ``PromptedOutput`` schema — they echo the raw tool output and exhaust the
+    output-retry budget (issue #351). This finalizer takes the data already
+    obtained and answers in plain text, which weak models *can* do. It has NO
+    tools (cannot loop) and ``output_type=str`` (cannot fail schema validation),
+    so it degrades gracefully. Cloud models never need it — it only runs on the
+    primary agent's misbehavior path.
+
+    Returns:
+        A configured plain-text :class:`Agent`, primary+fallback model wrapped.
+    """
+    model = build_agent_model_with_fallback()
+    return Agent(
+        model=model,
+        output_type=str,
+        system_prompt=FINALIZER_SYSTEM_PROMPT,
+        **get_model_settings(),
+    )
+
+
 def get_agent_retries() -> int:
     """Get the configured retry budget for agent tool calls and output validation.
 
@@ -294,3 +405,59 @@ def requires_approval(action_name: str) -> bool:
 - Never bypass safety checks or approval requirements
 - Log all significant decisions and their reasoning
 """
+
+# Generalized read-only intent guard. Embedded in the experiment-agent prompt to
+# stop a read-only question (list/rank/summarize/compare/report) from derailing
+# into a scenario / write / experiment tool — especially on an output-format
+# validation retry, where a weak local model tends to start a brand-new action
+# instead of just reformatting the data it already fetched (issue #347). Every
+# `tool_*` name referenced here is registered on the experiment agent, so the
+# `test_prompts_only_reference_registered_tool_names` invariant still holds.
+READ_ONLY_INTENT_GUARD = """
+READ-ONLY INTENT GUARD (apply this before every turn):
+Many requests are READ-ONLY — the user wants you to look something up and report
+it, not to change anything. Treat a request as READ-ONLY when it asks you to list,
+show, rank, summarize, compare, or report. Examples that are ALWAYS read-only
+unless the user explicitly asks to change something:
+- listing or ranking stores or products (e.g. "top products")
+- sales, revenue, or units-sold summaries
+- forecast summaries, or which products have the highest forecasted demand
+- model runs and metric comparisons, including WAPE, MAE, or RMSE
+- registry aliases and deployment status
+- backtest metrics
+- RAG / document / knowledge questions
+
+For a READ-ONLY request you MUST:
+- Use ONLY read-only tools: tool_list_runs, tool_get_run, tool_compare_runs,
+  tool_compare_backtest_results.
+- NEVER call tool_propose_scenario, tool_save_scenario, tool_create_alias,
+  tool_archive_run, or tool_run_backtest. Those create, save, promote, archive,
+  run, or plan something — they are NOT allowed for a read-only question.
+- Call a mutating / planning / experiment tool ONLY when the user EXPLICITLY asks
+  to create, save, promote, archive, run a backtest, or run an experiment.
+- Answer directly in the ExperimentReport `summary` field, grounded in tool output.
+
+FINISH IN ONE PASS — do not loop:
+- Call each read-only tool AT MOST ONCE per question.
+- The MOMENT a read tool returns, STOP calling tools and write your
+  ExperimentReport `summary` from what it returned — you already have the answer.
+- NEVER call a tool again that has already returned. Re-running the same tool
+  (e.g. tool_list_runs twice) is the most common failure: it burns the retry
+  budget until the run is killed. Use the data you already received.
+- If a read tool returns an EMPTY result, say so in the `summary` (e.g. "No model
+  runs found.") — do NOT retry the tool hoping for different data.
+
+OUTPUT-FORMAT RETRIES:
+- If your previous reply failed schema validation (e.g. "summary: Field required"),
+  DO NOT call any new tool. Only reformat the data you already obtained into a
+  valid ExperimentReport with a concise `summary`. A validation retry is a
+  formatting fix, never a reason to start a new action.
+
+WHEN A TOOL IS MISSING OR THE REQUEST IS AMBIGUOUS:
+- If a ranking is ambiguous (e.g. "top products"), ask a clarifying question such
+  as: "Top by revenue, units sold, forecasted demand, or model error?" — do not guess.
+- If no read-only tool exists for the requested metric, say plainly that this agent
+  does not have a tool for that metric. Do NOT invent data.
+- NEVER invent or guess a store_id, product_id, or run_id. Use only IDs returned by
+  a tool or explicitly supplied by the user.
+"""
diff --git a/app/features/agents/agents/experiment.py b/app/features/agents/agents/experiment.py
index d9bad5bd..d58b53de 100644
--- a/app/features/agents/agents/experiment.py
+++ b/app/features/agents/agents/experiment.py
@@ -16,6 +16,7 @@
 from pydantic_ai import Agent, PromptedOutput, RunContext
 
 from app.features.agents.agents.base import (
+    READ_ONLY_INTENT_GUARD,
     SAFETY_INSTRUCTIONS,
     SYSTEM_PROMPT_HEADER,
     TOOL_USAGE_INSTRUCTIONS,
@@ -68,6 +69,8 @@
   would like to experiment on. Do NOT call any tools until you have a specific
   objective (a store and product plus a date range, or an explicit request).
 
+{READ_ONLY_INTENT_GUARD}
+
 {TOOL_USAGE_INSTRUCTIONS}
 
 {SAFETY_INSTRUCTIONS}
@@ -322,6 +325,13 @@ async def tool_create_alias(
 
         # Check if approval is required
         if requires_approval("create_alias"):
+            # Record a machine-readable approval request so the service layer
+            # can persist pending_action + emit approval_required (#336).
+            ctx.deps.set_pending_action(
+                "create_alias",
+                {"alias_name": alias_name, "run_id": run_id, "description": description},
+                f"Create alias '{alias_name}' pointing at run {run_id}",
+            )
             return {
                 "status": "approval_required",
                 "action": "create_alias",
@@ -366,6 +376,13 @@ async def tool_archive_run(
 
         # Check if approval is required
         if requires_approval("archive_run"):
+            # Record a machine-readable approval request so the service layer
+            # can persist pending_action + emit approval_required (#336).
+            ctx.deps.set_pending_action(
+                "archive_run",
+                {"run_id": run_id},
+                f"Archive run {run_id}",
+            )
             return {
                 "status": "approval_required",
                 "action": "archive_run",
@@ -466,6 +483,14 @@ async def tool_save_scenario(
 
         # Check if approval is required — mirrors tool_create_alias exactly.
         if requires_approval("save_scenario"):
+            # Record a machine-readable approval request so the service layer
+            # can persist pending_action + emit approval_required (#336). The
+            # arguments dict is exactly what _execute_pending_action replays.
+            ctx.deps.set_pending_action(
+                "save_scenario",
+                arguments,
+                f"Save scenario plan '{name}' for store {store_id} / product {product_id}",
+            )
             return {
                 "status": "approval_required",
                 "action": "save_scenario",
diff --git a/app/features/agents/deps.py b/app/features/agents/deps.py
index 23bcf1f8..3344ad67 100644
--- a/app/features/agents/deps.py
+++ b/app/features/agents/deps.py
@@ -7,6 +7,7 @@
 from __future__ import annotations
 
 from dataclasses import dataclass, field
+from typing import Any
 
 from sqlalchemy.ext.asyncio import AsyncSession
 
@@ -23,14 +24,46 @@ class AgentDeps:
         session_id: Current agent session ID.
         request_id: Optional request correlation ID for logging.
         tool_call_count: Counter for tool calls in this run.
+        pending_action: Machine-readable HITL approval request recorded by a
+            gated tool when it short-circuits without persisting (#336). The
+            service layer reads this after the agent run to flip the session to
+            ``awaiting_approval`` and emit the ``approval_required`` event,
+            instead of relying on the model echoing the request into its
+            structured output.
     """
 
     db: AsyncSession
     session_id: str
     request_id: str | None = None
     tool_call_count: int = field(default=0)
+    pending_action: dict[str, Any] | None = field(default=None)
 
     def increment_tool_calls(self) -> int:
         """Increment and return the tool call count."""
         self.tool_call_count += 1
         return self.tool_call_count
+
+    def set_pending_action(
+        self,
+        action_type: str,
+        arguments: dict[str, Any],
+        description: str,
+    ) -> None:
+        """Record that a gated tool call needs human approval (HITL).
+
+        Called by approval-gated tools (e.g. ``save_scenario``, ``create_alias``,
+        ``archive_run``) instead of persisting their effect. The ``arguments``
+        dict must carry everything ``AgentService._execute_pending_action`` needs
+        to run the action once a human approves it.
+
+        Args:
+            action_type: The gated action name (``create_alias`` / ``archive_run``
+                / ``save_scenario``).
+            arguments: Arguments to replay when the action is approved.
+            description: Human-readable summary shown on the approval card.
+        """
+        self.pending_action = {
+            "action_type": action_type,
+            "arguments": arguments,
+            "description": description,
+        }
diff --git a/app/features/agents/service.py b/app/features/agents/service.py
index 1b3c4644..6372fd9c 100644
--- a/app/features/agents/service.py
+++ b/app/features/agents/service.py
@@ -13,6 +13,7 @@
 from __future__ import annotations
 
 import asyncio
+import json
 import uuid
 from collections.abc import AsyncIterator
 from contextlib import AbstractContextManager
@@ -20,9 +21,9 @@
 from typing import Any, Literal, cast
 
 import structlog
-from pydantic_ai import Agent
+from pydantic_ai import Agent, capture_run_messages
 from pydantic_ai.exceptions import UnexpectedModelBehavior
-from pydantic_ai.messages import ModelMessage, ModelMessagesTypeAdapter
+from pydantic_ai.messages import ModelMessage, ModelMessagesTypeAdapter, ToolReturnPart
 from sqlalchemy import select
 from sqlalchemy.ext.asyncio import AsyncSession
 
@@ -40,6 +41,31 @@
 
 logger = structlog.get_logger()
 
+# Cap on the tool-data JSON fed to the plain-text finalizer (#351). With the
+# verbose keys below stripped, a full runs page fits comfortably; the cap is a
+# context-budget backstop for pathological payloads.
+_FINALIZER_MAX_CHARS = 8000
+
+# Verbose, decision-irrelevant keys stripped from tool results before they are
+# handed to the finalizer (#351). Dropping these keeps every run's identity +
+# metrics (e.g. WAPE) inside the budget, so a ranking question sees ALL runs
+# instead of just the first one or two — the bug where the finalizer reported
+# 99.0 as "lowest" while the true minimum (18.93) had been truncated away.
+_FINALIZER_DROP_KEYS = frozenset(
+    {
+        "model_config",
+        "model_config_data",
+        "feature_config",
+        "runtime_info",
+        "agent_context",
+        "config_hash",
+        "artifact_hash",
+        "artifact_uri",
+        "artifact_size_bytes",
+        "error_message",
+    }
+)
+
 
 class SessionNotFoundError(ValueError):
     """Session not found in the database."""
@@ -266,16 +292,20 @@ async def chat(
             history_length=len(message_history),
         )
 
+        # Always bound for the misbehavior handler, even if the run raises before
+        # capture_run_messages() populates it.
+        captured_messages: list[ModelMessage] = []
         try:
-            with _sequential_tool_execution():
-                result = await asyncio.wait_for(
-                    agent.run(
-                        message,
-                        deps=deps,
-                        message_history=message_history,
-                    ),
-                    timeout=self.settings.agent_timeout_seconds,
-                )
+            with capture_run_messages() as captured_messages:
+                with _sequential_tool_execution():
+                    result = await asyncio.wait_for(
+                        agent.run(
+                            message,
+                            deps=deps,
+                            message_history=message_history,
+                        ),
+                        timeout=self.settings.agent_timeout_seconds,
+                    )
         except TimeoutError as e:
             raise TimeoutError(
                 f"Agent response timed out after {self.settings.agent_timeout_seconds} seconds"
@@ -290,8 +320,30 @@ async def chat(
                 error=str(e),
                 error_type=type(e).__name__,
             )
-            session.last_activity = datetime.now(UTC)
+            misbehavior_now = datetime.now(UTC)
+            session.last_activity = misbehavior_now
+            # A gated tool may have fired (and recorded a valid approval request)
+            # before the model misbehaved — surface the Approve card rather than
+            # discarding it behind the generic error (#344).
+            salvaged = self._salvage_pending_action(session, deps, misbehavior_now)
             await db.flush()
+            if salvaged is not None:
+                return ChatResponse(
+                    session_id=session_id,
+                    message=(
+                        "I've prepared an action that needs your approval before "
+                        "I can proceed. Please review the pending request."
+                    ),
+                    pending_approval=True,
+                    pending_action=salvaged,
+                )
+            # A weak local model often calls tools and obtains the data, then
+            # fails to wrap it in the structured output schema (#351). Salvage a
+            # plain-text answer from the tool data already captured this run.
+            answer = await self._salvage_plaintext_answer(message, captured_messages)
+            if answer is not None:
+                logger.info("agents.chat_finalizer_salvage", session_id=session_id)
+                return ChatResponse(session_id=session_id, message=answer)
             return ChatResponse(
                 session_id=session_id,
                 message=(
@@ -314,9 +366,26 @@ async def chat(
         # NOTE: PydanticAI v1.48.0 uses result.output (not result.data)
         result_data: Any = result.output
 
-        # Check for pending_action in result data (primary trigger)
+        # Primary trigger (#336): a gated tool recorded a machine-readable
+        # approval request on deps. Deterministic — does not rely on the model
+        # echoing the request into its structured output (ExperimentReport has
+        # no pending_action field, so the legacy triggers below never fired).
+        if deps.pending_action:
+            pending_approval = True
+            pending_action = self._record_pending_action(
+                session,
+                action_type=str(deps.pending_action.get("action_type", "unknown")),
+                arguments=deps.pending_action.get("arguments") or {},
+                description=str(
+                    deps.pending_action.get("description")
+                    or f"Agent requested approval for "
+                    f"{deps.pending_action.get('action_type', 'unknown')}"
+                ),
+                now=now,
+            )
+        # Legacy trigger: structured output carried a pending_action field.
         # The agent tools should return a pending_action dict with action_type and arguments
-        if hasattr(result_data, "pending_action") and result_data.pending_action:
+        elif hasattr(result_data, "pending_action") and result_data.pending_action:
             pending_approval = True
             pending_action_data = result_data.pending_action
             # Extract action details - support both dict and object with attributes
@@ -335,33 +404,19 @@ async def chat(
                     f"Agent requested approval for {action_type}",
                 )
 
-            session.pending_action = {
-                "action_id": uuid.uuid4().hex[:16],
-                "action_type": action_type,
-                "description": description,
-                "arguments": arguments,
-                "created_at": now.isoformat(),
-                "expires_at": (
-                    now + timedelta(minutes=self.settings.agent_approval_timeout_minutes)
-                ).isoformat(),
-            }
-            session.status = SessionStatus.AWAITING_APPROVAL.value
-            pending_action = self._format_pending_action(session.pending_action)
+            pending_action = self._record_pending_action(
+                session, action_type, arguments, description, now
+            )
         # Fallback: check approval_required flag (legacy trigger)
         elif hasattr(result_data, "approval_required") and result_data.approval_required:
             pending_approval = True
-            session.pending_action = {
-                "action_id": uuid.uuid4().hex[:16],
-                "action_type": "unknown",
-                "description": "Agent requested approval for an action",
-                "arguments": {},
-                "created_at": now.isoformat(),
-                "expires_at": (
-                    now + timedelta(minutes=self.settings.agent_approval_timeout_minutes)
-                ).isoformat(),
-            }
-            session.status = SessionStatus.AWAITING_APPROVAL.value
-            pending_action = self._format_pending_action(session.pending_action)
+            pending_action = self._record_pending_action(
+                session,
+                "unknown",
+                {},
+                "Agent requested approval for an action",
+                now,
+            )
 
         # Update session
         usage = result.usage()
@@ -456,153 +511,185 @@ async def stream_chat(
             agent_type=session.agent_type,
         )
 
-        # Stream the response
+        # Stream the response. Ollama's OpenAI-compat endpoint rejects
+        # PydanticAI's streamed request with 400 "invalid message content type:
+        # <nil>" (#342), while the non-streaming run() path works — so fall back
+        # to run() for the ollama provider and emit the result as a single
+        # text_delta plus the usual approval/complete events. Cloud providers
+        # keep the true token-streaming path.
+        default_model = self.settings.agent_default_model
+        provider = default_model.split(":", 1)[0] if ":" in default_model else ""
+        stream_supported = provider != "ollama"
+        # Always bound for the misbehavior handler (see chat()).
+        captured_messages: list[ModelMessage] = []
         try:
-            with _sequential_tool_execution():
+            with capture_run_messages() as captured_messages, _sequential_tool_execution():
                 async with asyncio.timeout(self.settings.agent_timeout_seconds):
-                    async with agent.run_stream(
-                        message,
-                        deps=deps,
-                        message_history=message_history,
-                    ) as result:
-                        try:
-                            async for text in result.stream_text():
-                                yield StreamEvent(
-                                    event_type="text_delta",
-                                    data={"delta": text},
-                                    timestamp=datetime.now(UTC),
+                    final_result: Any
+                    usage: Any
+                    all_messages: list[ModelMessage]
+
+                    if stream_supported:
+                        async with agent.run_stream(
+                            message,
+                            deps=deps,
+                            message_history=message_history,
+                        ) as result:
+                            try:
+                                async for text in result.stream_text():
+                                    yield StreamEvent(
+                                        event_type="text_delta",
+                                        data={"delta": text},
+                                        timestamp=datetime.now(UTC),
+                                    )
+                            except Exception as e:
+                                # Structured output agents (output_type=...) cannot
+                                # stream raw text deltas. Skip delta streaming and
+                                # only emit the final complete event.
+                                logger.info(
+                                    "agents.stream_chat_text_delta_unavailable",
+                                    session_id=session_id,
+                                    error=str(e),
+                                    error_type=type(e).__name__,
                                 )
-                        except Exception as e:
-                            # Structured output agents (output_type=...) cannot stream raw text deltas.
-                            # In that case we skip delta streaming and only emit the final complete event.
-                            logger.info(
-                                "agents.stream_chat_text_delta_unavailable",
-                                session_id=session_id,
-                                error=str(e),
-                                error_type=type(e).__name__,
+                            # NOTE: PydanticAI exposes get_output() on StreamedRunResult.
+                            final_result = await result.get_output()
+                            usage = result.usage()
+                            all_messages = result.all_messages()
+                    else:
+                        # #342 — non-streaming fallback for the ollama provider.
+                        run_result = await agent.run(
+                            message,
+                            deps=deps,
+                            message_history=message_history,
+                        )
+                        final_result = run_result.output
+                        usage = run_result.usage()
+                        all_messages = run_result.all_messages()
+
+                    # Update session (shared by both paths)
+                    session.message_history = self._serialize_messages(all_messages)
+                    session.total_tokens_used += usage.total_tokens or 0
+                    session.tool_calls_count += deps.tool_call_count
+                    session.last_activity = datetime.now(UTC)
+                    session.expires_at = session.last_activity + timedelta(
+                        minutes=self.settings.agent_session_ttl_minutes
+                    )
+
+                    await db.flush()
+
+                    # Check for pending approval actions (mirror chat() logic)
+                    pending_action = None
+                    pending_approval = False
+                    stream_now = datetime.now(UTC)
+
+                    # Primary trigger (#336): a gated tool recorded a
+                    # machine-readable approval request on deps. Deterministic
+                    # — the experiment agent's ExperimentReport output has no
+                    # pending_action field, so the legacy triggers below never
+                    # fired and the approval_required event was never emitted.
+                    if deps.pending_action:
+                        pending_approval = True
+                        pending_action = self._record_pending_action(
+                            session,
+                            action_type=str(deps.pending_action.get("action_type", "unknown")),
+                            arguments=deps.pending_action.get("arguments") or {},
+                            description=str(
+                                deps.pending_action.get("description")
+                                or "Agent requested approval for "
+                                f"{deps.pending_action.get('action_type', 'unknown')}"
+                            ),
+                            now=stream_now,
+                        )
+                    # Legacy trigger: structured output carried pending_action.
+                    elif hasattr(final_result, "pending_action") and final_result.pending_action:
+                        pending_approval = True
+                        pending_action_data = final_result.pending_action
+                        # Extract action details - support both dict and object with attributes
+                        if isinstance(pending_action_data, dict):
+                            action_type = pending_action_data.get("action_type", "unknown")
+                            arguments = pending_action_data.get("arguments", {})
+                            description = pending_action_data.get(
+                                "description", f"Agent requested approval for {action_type}"
+                            )
+                        else:
+                            action_type = getattr(pending_action_data, "action_type", "unknown")
+                            arguments = getattr(pending_action_data, "arguments", {})
+                            description = getattr(
+                                pending_action_data,
+                                "description",
+                                f"Agent requested approval for {action_type}",
                             )
 
-                        # Get final result and update session
-                        # NOTE: PydanticAI v1.48 exposes get_output() on StreamedRunResult.
-                        final_result: Any = await result.get_output()
-                        usage = result.usage()
-
-                        session.message_history = self._serialize_messages(result.all_messages())
-                        session.total_tokens_used += usage.total_tokens or 0
-                        session.tool_calls_count += deps.tool_call_count
-                        session.last_activity = datetime.now(UTC)
-                        session.expires_at = session.last_activity + timedelta(
-                            minutes=self.settings.agent_session_ttl_minutes
+                        pending_action = self._record_pending_action(
+                            session, action_type, arguments, description, stream_now
+                        )
+                    # Fallback: check approval_required flag (legacy trigger)
+                    elif (
+                        hasattr(final_result, "approval_required")
+                        and final_result.approval_required
+                    ):
+                        pending_approval = True
+                        pending_action = self._record_pending_action(
+                            session,
+                            "unknown",
+                            {},
+                            "Agent requested approval for an action",
+                            stream_now,
                         )
 
-                        await db.flush()
-
-                        # Check for pending approval actions (mirror chat() logic)
-                        pending_action = None
-                        pending_approval = False
-                        stream_now = datetime.now(UTC)
-
-                        # Check for pending_action in result data (primary trigger)
-                        if hasattr(final_result, "pending_action") and final_result.pending_action:
-                            pending_approval = True
-                            pending_action_data = final_result.pending_action
-                            # Extract action details - support both dict and object with attributes
-                            if isinstance(pending_action_data, dict):
-                                action_type = pending_action_data.get("action_type", "unknown")
-                                arguments = pending_action_data.get("arguments", {})
-                                description = pending_action_data.get(
-                                    "description", f"Agent requested approval for {action_type}"
-                                )
-                            else:
-                                action_type = getattr(pending_action_data, "action_type", "unknown")
-                                arguments = getattr(pending_action_data, "arguments", {})
-                                description = getattr(
-                                    pending_action_data,
-                                    "description",
-                                    f"Agent requested approval for {action_type}",
-                                )
+                    await db.flush()
 
-                            session.pending_action = {
-                                "action_id": uuid.uuid4().hex[:16],
-                                "action_type": action_type,
-                                "description": description,
-                                "arguments": arguments,
-                                "created_at": stream_now.isoformat(),
-                                "expires_at": (
-                                    stream_now
-                                    + timedelta(
-                                        minutes=self.settings.agent_approval_timeout_minutes
-                                    )
-                                ).isoformat(),
-                            }
-                            session.status = SessionStatus.AWAITING_APPROVAL.value
-                            pending_action = self._format_pending_action(session.pending_action)
-                        # Fallback: check approval_required flag (legacy trigger)
+                    # Build the response text (shared by both paths).
+                    response_message: str = "No response generated."
+                    if final_result:
+                        if hasattr(final_result, "answer") and final_result.answer:
+                            response_message = str(final_result.answer)
+                        elif hasattr(final_result, "summary") and final_result.summary:
+                            response_message = str(final_result.summary)
                         elif (
-                            hasattr(final_result, "approval_required")
-                            and final_result.approval_required
+                            hasattr(final_result, "recommendations")
+                            and final_result.recommendations
                         ):
-                            pending_approval = True
-                            session.pending_action = {
-                                "action_id": uuid.uuid4().hex[:16],
-                                "action_type": "unknown",
-                                "description": "Agent requested approval for an action",
-                                "arguments": {},
-                                "created_at": stream_now.isoformat(),
-                                "expires_at": (
-                                    stream_now
-                                    + timedelta(
-                                        minutes=self.settings.agent_approval_timeout_minutes
-                                    )
-                                ).isoformat(),
-                            }
-                            session.status = SessionStatus.AWAITING_APPROVAL.value
-                            pending_action = self._format_pending_action(session.pending_action)
-
-                        await db.flush()
-
-                        # If approval is required, emit approval_required event
-                        if pending_approval and pending_action:
-                            yield StreamEvent(
-                                event_type="approval_required",
-                                data={
-                                    "action": pending_action,
-                                    "message": "Human approval required before proceeding.",
-                                },
-                                timestamp=stream_now,
-                            )
-
-                        # Yield completion event
-                        response_message: str = "No response generated."
-                        if final_result:
-                            if hasattr(final_result, "answer") and final_result.answer:
-                                response_message = str(final_result.answer)
-                            elif hasattr(final_result, "summary") and final_result.summary:
-                                response_message = str(final_result.summary)
-                            elif (
-                                hasattr(final_result, "recommendations")
-                                and final_result.recommendations
-                            ):
-                                recommendations = final_result.recommendations
-                                if isinstance(recommendations, list) and recommendations:
-                                    response_message = "\n".join(
-                                        str(item) for item in recommendations
-                                    )
-                                else:
-                                    response_message = str(final_result)
+                            recommendations = final_result.recommendations
+                            if isinstance(recommendations, list) and recommendations:
+                                response_message = "\n".join(str(item) for item in recommendations)
                             else:
                                 response_message = str(final_result)
+                        else:
+                            response_message = str(final_result)
 
+                    # #342 — the ollama (non-streaming) path produced no token
+                    # deltas; emit the full text once so the FE renders the reply.
+                    # Cloud streaming behavior is unchanged.
+                    if not stream_supported and response_message != "No response generated.":
                         yield StreamEvent(
-                            event_type="complete",
+                            event_type="text_delta",
+                            data={"delta": response_message},
+                            timestamp=datetime.now(UTC),
+                        )
+
+                    # If approval is required, emit approval_required event
+                    if pending_approval and pending_action:
+                        yield StreamEvent(
+                            event_type="approval_required",
                             data={
-                                "message": response_message,
-                                "tokens_used": usage.total_tokens or 0,
-                                "tool_calls_count": deps.tool_call_count,
-                                "pending_approval": pending_approval,
+                                "action": pending_action,
+                                "message": "Human approval required before proceeding.",
                             },
-                            timestamp=datetime.now(UTC),
+                            timestamp=stream_now,
                         )
+
+                    yield StreamEvent(
+                        event_type="complete",
+                        data={
+                            "message": response_message,
+                            "tokens_used": usage.total_tokens or 0,
+                            "tool_calls_count": deps.tool_call_count,
+                            "pending_approval": pending_approval,
+                        },
+                        timestamp=datetime.now(UTC),
+                    )
         except TimeoutError as e:
             raise TimeoutError(
                 f"Agent response timed out after {self.settings.agent_timeout_seconds} seconds"
@@ -617,6 +704,58 @@ async def stream_chat(
                 error=str(e),
                 error_type=type(e).__name__,
             )
+            misbehavior_now = datetime.now(UTC)
+            session.last_activity = misbehavior_now
+            # A gated tool may have fired (and recorded a valid approval request)
+            # before the model misbehaved — surface the Approve card rather than
+            # discarding it behind the generic error (#344).
+            salvaged = self._salvage_pending_action(session, deps, misbehavior_now)
+            await db.flush()
+            if salvaged is not None:
+                yield StreamEvent(
+                    event_type="approval_required",
+                    data={
+                        "action": salvaged,
+                        "message": "Human approval required before proceeding.",
+                    },
+                    timestamp=misbehavior_now,
+                )
+                yield StreamEvent(
+                    event_type="complete",
+                    data={
+                        "message": (
+                            "I've prepared an action that needs your approval before I can proceed."
+                        ),
+                        "tokens_used": 0,
+                        "tool_calls_count": deps.tool_call_count,
+                        "pending_approval": True,
+                    },
+                    timestamp=misbehavior_now,
+                )
+                return
+            # A weak local model often calls tools and obtains the data, then
+            # fails to wrap it in the structured output schema (#351). Salvage a
+            # plain-text answer from the tool data already captured this run and
+            # emit it as a normal reply rather than an error.
+            answer = await self._salvage_plaintext_answer(message, captured_messages)
+            if answer is not None:
+                logger.info("agents.stream_chat_finalizer_salvage", session_id=session_id)
+                yield StreamEvent(
+                    event_type="text_delta",
+                    data={"delta": answer},
+                    timestamp=misbehavior_now,
+                )
+                yield StreamEvent(
+                    event_type="complete",
+                    data={
+                        "message": answer,
+                        "tokens_used": 0,
+                        "tool_calls_count": deps.tool_call_count,
+                        "pending_approval": False,
+                    },
+                    timestamp=misbehavior_now,
+                )
+                return
             yield StreamEvent(
                 event_type="error",
                 data={
@@ -627,7 +766,7 @@ async def stream_chat(
                     "error_type": "model_behavior_error",
                     "recoverable": True,
                 },
-                timestamp=datetime.now(UTC),
+                timestamp=misbehavior_now,
             )
             return
 
@@ -825,6 +964,183 @@ def _deserialize_messages(
             )
             return []
 
+    def _salvage_pending_action(
+        self,
+        session: AgentSession,
+        deps: AgentDeps,
+        now: datetime,
+    ) -> PendingAction | None:
+        """Persist a gated tool's approval request captured before a misbehaving run.
+
+        A gated tool sets ``deps.pending_action`` the moment it fires (#336), but
+        it does not halt the run. A weak model can ramble past the gate and
+        exhaust its retry budget, so ``agent.run()`` raises
+        ``UnexpectedModelBehavior`` BEFORE returning and the normal post-run
+        approval-surfacing path never executes. The gate did fire and the
+        captured arguments are valid, so surface the approval card instead of
+        discarding it behind a generic error (issue #344).
+
+        Args:
+            session: The agent session to mutate.
+            deps: The agent deps that a gated tool may have written to.
+            now: Timestamp for created_at / expires_at.
+
+        Returns:
+            The formatted :class:`PendingAction` when a gated tool recorded a
+            request, else ``None`` (the genuine "invalid tool call" case).
+        """
+        if not deps.pending_action:
+            return None
+        action_type = str(deps.pending_action.get("action_type", "unknown"))
+        return self._record_pending_action(
+            session,
+            action_type=action_type,
+            arguments=deps.pending_action.get("arguments") or {},
+            description=str(
+                deps.pending_action.get("description")
+                or f"Agent requested approval for {action_type}"
+            ),
+            now=now,
+        )
+
+    @staticmethod
+    def _extract_tool_payloads(captured: list[ModelMessage]) -> list[dict[str, Any]]:
+        """Pull every tool return out of a captured run's message trace.
+
+        Used by :meth:`_salvage_plaintext_answer` to recover the data a weak
+        model fetched before it failed structured-output validation (#351).
+
+        Args:
+            captured: Messages captured via ``capture_run_messages`` (may be empty
+                when the run failed before any tool returned).
+
+        Returns:
+            One ``{"tool", "result"}`` dict per ``ToolReturnPart``, in order.
+        """
+        payloads: list[dict[str, Any]] = []
+        for message in captured:
+            for part in getattr(message, "parts", []):
+                if isinstance(part, ToolReturnPart):
+                    payloads.append({"tool": part.tool_name, "result": part.content})
+        return payloads
+
+    @classmethod
+    def _compact_for_finalizer(cls, obj: object) -> object:
+        """Recursively strip verbose, decision-irrelevant keys from tool data (#351).
+
+        Keeps each entry's identity + metrics while dropping bulky nested config
+        / runtime blobs, so a full result set fits in the finalizer's budget and
+        a ranking sees every entry. Pure/serialisation-only — no I/O.
+
+        Args:
+            obj: Any JSON-ish value extracted from a tool return.
+
+        Returns:
+            The same structure with :data:`_FINALIZER_DROP_KEYS` removed at every
+            dict level.
+        """
+        if isinstance(obj, dict):
+            return {
+                k: cls._compact_for_finalizer(v)
+                for k, v in obj.items()
+                if k not in _FINALIZER_DROP_KEYS
+            }
+        if isinstance(obj, list):
+            return [cls._compact_for_finalizer(v) for v in obj]
+        return obj
+
+    async def _salvage_plaintext_answer(
+        self,
+        message: str,
+        captured: list[ModelMessage],
+    ) -> str | None:
+        """Answer in plain text from tool data when structured output failed (#351).
+
+        A weak local model (e.g. ``ollama:llama3.1:8b``) reliably calls the read
+        tool and gets the data, but echoes the raw tool result instead of the
+        primary agent's ``PromptedOutput`` schema, exhausting the output-retry
+        budget. The data was obtained, though — so hand it to a tool-less,
+        ``str``-output finalizer that answers the user's question directly. The
+        finalizer cannot loop (no tools) or fail schema validation (plain text).
+
+        Args:
+            message: The original user message.
+            captured: Messages captured from the failed run.
+
+        Returns:
+            The finalizer's plain-text answer, or ``None`` when no tool data was
+            obtained or the finalizer itself errors (caller falls back to the
+            generic recoverable error).
+        """
+        payloads = self._extract_tool_payloads(captured)
+        if not payloads:
+            return None
+        try:
+            from app.features.agents.agents.base import build_finalizer_agent
+
+            compact = self._compact_for_finalizer(payloads)
+            data = json.dumps(compact, default=str)[:_FINALIZER_MAX_CHARS]
+            prompt = (
+                f"User question:\n{message}\n\n"
+                f"Data retrieved from tools (JSON):\n{data}\n\n"
+                "Answer the user's question concisely from this data. If the "
+                "question asks for the lowest/highest of a metric (e.g. WAPE), "
+                "compare that metric across ALL entries that have it, ignore "
+                "entries where it is missing/null, and report the true "
+                "minimum/maximum with its value."
+            )
+            finalizer = build_finalizer_agent()
+            result = await asyncio.wait_for(
+                finalizer.run(prompt),
+                timeout=self.settings.agent_timeout_seconds,
+            )
+            text = str(result.output).strip()
+            return text or None
+        except Exception:
+            # Best-effort: a finalizer failure must never replace the original
+            # recoverable error with a crash.
+            logger.warning("agents.finalizer_fallback_failed", exc_info=True)
+            return None
+
+    def _record_pending_action(
+        self,
+        session: AgentSession,
+        action_type: str,
+        arguments: dict[str, Any],
+        description: str,
+        now: datetime,
+    ) -> PendingAction | None:
+        """Persist a HITL approval request on the session and format it.
+
+        Builds the canonical ``session.pending_action`` dict (fresh action_id +
+        expiry), flips the session to ``awaiting_approval``, and returns the
+        ``PendingAction`` schema for the response / stream event. Shared by the
+        deterministic deps-based trigger (#336) and the legacy structured-output
+        triggers so all three paths persist an identical shape.
+
+        Args:
+            session: The agent session to mutate.
+            action_type: Gated action name.
+            arguments: Arguments to replay on approval.
+            description: Human-readable approval-card summary.
+            now: Timestamp used for created_at / expires_at.
+
+        Returns:
+            The formatted PendingAction, or None if formatting fails.
+        """
+        session.pending_action = {
+            "action_id": uuid.uuid4().hex[:16],
+            "action_type": action_type,
+            "description": description,
+            "arguments": arguments,
+            "created_at": now.isoformat(),
+            "expires_at": (
+                now + timedelta(minutes=self.settings.agent_approval_timeout_minutes)
+            ).isoformat(),
+        }
+        session.status = SessionStatus.AWAITING_APPROVAL.value
+        return self._format_pending_action(session.pending_action)
+
     def _format_pending_action(
         self,
         pending: dict[str, Any] | None,
diff --git a/app/features/agents/tests/test_base.py b/app/features/agents/tests/test_base.py
index ddfcd02b..c7d8d29a 100644
--- a/app/features/agents/tests/test_base.py
+++ b/app/features/agents/tests/test_base.py
@@ -1,10 +1,12 @@
 """Unit tests for agent base helpers (Ollama-aware model factory)."""
 
+import json
 import re
 from collections.abc import Iterator
 from typing import Any, cast
 from unittest.mock import AsyncMock
 
+import httpx
 import pytest
 from pydantic_ai import ModelRetry
 from pydantic_ai.messages import ModelMessage, ModelResponse, TextPart
@@ -15,6 +17,8 @@
 from app.core.config import get_settings
 from app.features.agents.agents.base import (
     TOOL_USAGE_INSTRUCTIONS,
+    _coerce_null_message_content,
+    _OllamaNullContentTransport,
     build_agent_model,
     build_agent_model_with_fallback,
     get_agent_retries,
@@ -322,3 +326,134 @@ def respond(messages: list[ModelMessage], info: AgentInfo) -> ModelResponse:
     assert captured["output_tools"] == []
     assert isinstance(result.output, RAGAnswer)
     assert result.output.confidence == "high"
+
+
+class TestOllamaNullContentSanitizer:
+    """The Ollama HTTP client must convert ``content: null`` -> ``""`` (#344).
+
+    Ollama's OpenAI-compatible ``/v1/chat/completions`` rejects any message
+    whose ``content`` is JSON ``null`` and carries no ``tool_calls`` with
+    ``400 invalid message content type: <nil>``. PydanticAI emits that shape for
+    a degenerate empty assistant turn and then replays it on retry, so without
+    this coercion every retry 400s and the run dies with ``FallbackExceptionGroup``.
+    """
+
+    def test_coerce_rewrites_null_content_to_empty_string(self) -> None:
+        body = json.dumps(
+            {
+                "model": "qwen3:8b",
+                "messages": [
+                    {"role": "user", "content": "hi"},
+                    {"role": "assistant", "content": None},
+                ],
+            }
+        ).encode("utf-8")
+
+        out = _coerce_null_message_content(body)
+
+        assert out is not None
+        payload = json.loads(out)
+        assert payload["messages"][1]["content"] == ""
+        # Untouched fields survive the round-trip.
+        assert payload["messages"][0]["content"] == "hi"
+        assert payload["model"] == "qwen3:8b"
+
+    def test_coerce_rewrites_null_content_even_with_tool_calls(self) -> None:
+        body = json.dumps(
+            {
+                "messages": [
+                    {
+                        "role": "assistant",
+                        "content": None,
+                        "tool_calls": [
+                            {
+                                "id": "c1",
+                                "type": "function",
+                                "function": {"name": "x", "arguments": "{}"},
+                            }
+                        ],
+                    }
+                ]
+            }
+        ).encode("utf-8")
+
+        out = _coerce_null_message_content(body)
+
+        assert out is not None
+        payload = json.loads(out)
+        assert payload["messages"][0]["content"] == ""
+        assert payload["messages"][0]["tool_calls"][0]["id"] == "c1"
+
+    def test_coerce_is_noop_when_no_null_content(self) -> None:
+        body = json.dumps({"messages": [{"role": "user", "content": "hi"}]}).encode("utf-8")
+
+        assert _coerce_null_message_content(body) is None
+
+    def test_coerce_ignores_missing_content_key(self) -> None:
+        # A message with no ``content`` key at all must not be rewritten — only
+        # an explicit JSON null is the Ollama-rejected shape.
+        body = json.dumps({"messages": [{"role": "assistant", "tool_calls": []}]}).encode("utf-8")
+
+        assert _coerce_null_message_content(body) is None
+
+    def test_coerce_handles_non_json_body(self) -> None:
+        assert _coerce_null_message_content(b"not json at all") is None
+
+    def test_coerce_handles_non_dict_payload(self) -> None:
+        assert _coerce_null_message_content(b"[1, 2, 3]") is None
+
+    @pytest.mark.asyncio
+    async def test_transport_sanitizes_outgoing_request(
+        self, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        """The transport rewrites the body and fixes Content-Length before send."""
+        captured: dict[str, bytes] = {}
+
+        async def fake_send(
+            _self: httpx.AsyncHTTPTransport, request: httpx.Request
+        ) -> httpx.Response:
+            captured["body"] = request.content
+            captured["content_length"] = request.headers["content-length"].encode()
+            return httpx.Response(200, json={"ok": True})
+
+        monkeypatch.setattr(httpx.AsyncHTTPTransport, "handle_async_request", fake_send)
+
+        transport = _OllamaNullContentTransport()
+        body = json.dumps({"messages": [{"role": "assistant", "content": None}]}).encode("utf-8")
+        request = httpx.Request("POST", "http://ollama/v1/chat/completions", content=body)
+
+        await transport.handle_async_request(request)
+
+        sent = json.loads(captured["body"])
+        assert sent["messages"][0]["content"] == ""
+        # Content-Length must match the rewritten body, not the original.
+        assert int(captured["content_length"]) == len(captured["body"])
+
+    @pytest.mark.asyncio
+    async def test_transport_passthrough_when_nothing_to_sanitize(
+        self, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        captured: dict[str, bytes] = {}
+
+        async def fake_send(
+            _self: httpx.AsyncHTTPTransport, request: httpx.Request
+        ) -> httpx.Response:
+            captured["body"] = request.content
+            return httpx.Response(200, json={"ok": True})
+
+        monkeypatch.setattr(httpx.AsyncHTTPTransport, "handle_async_request", fake_send)
+
+        transport = _OllamaNullContentTransport()
+        body = json.dumps({"messages": [{"role": "user", "content": "hi"}]}).encode("utf-8")
+        request = httpx.Request("POST", "http://ollama/v1/chat/completions", content=body)
+
+        await transport.handle_async_request(request)
+
+        # Forwarded unchanged.
+        assert json.loads(captured["body"])["messages"][0]["content"] == "hi"
+
+    def test_build_agent_model_returns_openai_chat_model_for_ollama(self) -> None:
+        # The Ollama branch must hand back a configured OpenAIChatModel (whose
+        # HTTP client carries the sanitizing transport), not the bare identifier.
+        model = build_agent_model("ollama:qwen3:8b")
+        assert isinstance(model, OpenAIChatModel)
diff --git a/app/features/agents/tests/test_read_only_guard.py b/app/features/agents/tests/test_read_only_guard.py
new file mode 100644
index 00000000..6c1a3f4c
--- /dev/null
+++ b/app/features/agents/tests/test_read_only_guard.py
@@ -0,0 +1,195 @@
+"""Deterministic tests for the experiment-agent read-only intent guard (#347).
+
+The guard stops a read-only question ("list the runs and tell me the lowest
+WAPE", "top products", "current deployment alias") from derailing into a
+scenario / write / experiment tool — especially on an output-format validation
+retry, where a weak local model tends to start a brand-new action instead of
+reformatting the data it already fetched.
+
+These tests are deterministic and require **no live model call**: they assert
+that the guard text exists, names the right tools, and governs each named
+read-only intent, and that the guard is actually delivered to the model in the
+system prompt.
+"""
+
+from __future__ import annotations
+
+from collections.abc import Iterator
+from unittest.mock import AsyncMock
+
+import pytest
+from pydantic_ai.messages import ModelMessage, ModelResponse, TextPart
+from pydantic_ai.models.function import AgentInfo, FunctionModel
+
+from app.core.config import get_settings
+from app.features.agents.agents.base import READ_ONLY_INTENT_GUARD
+from app.features.agents.agents.experiment import (
+    EXPERIMENT_SYSTEM_PROMPT,
+    create_experiment_agent,
+)
+from app.features.agents.deps import AgentDeps
+
+# Tools that must NEVER be called for a read-only intent.
+PROHIBITED_TOOLS = (
+    "tool_propose_scenario",
+    "tool_save_scenario",
+    "tool_create_alias",
+    "tool_archive_run",
+    "tool_run_backtest",
+)
+
+# Read-only tools the guard steers the model toward.
+ALLOWED_READ_TOOLS = (
+    "tool_list_runs",
+    "tool_get_run",
+    "tool_compare_runs",
+)
+
+
+@pytest.fixture(autouse=True)
+def _reset_settings() -> Iterator[None]:
+    """Reset the settings cache so model mutations do not leak across tests."""
+    get_settings.cache_clear()
+    yield
+    get_settings.cache_clear()
+
+
+def test_guard_is_embedded_in_experiment_prompt() -> None:
+    """The experiment system prompt embeds the read-only intent guard."""
+    assert READ_ONLY_INTENT_GUARD.strip() in EXPERIMENT_SYSTEM_PROMPT
+    assert "READ-ONLY INTENT GUARD" in EXPERIMENT_SYSTEM_PROMPT
+
+
+@pytest.mark.parametrize("tool_name", PROHIBITED_TOOLS)
+def test_guard_names_prohibited_tools(tool_name: str) -> None:
+    """The guard explicitly forbids each scenario/write/experiment tool."""
+    assert tool_name in READ_ONLY_INTENT_GUARD
+    # And the prohibition is unambiguous.
+    assert "NEVER call" in READ_ONLY_INTENT_GUARD
+
+
+@pytest.mark.parametrize("tool_name", ALLOWED_READ_TOOLS)
+def test_guard_names_allowed_read_tools(tool_name: str) -> None:
+    """The guard points the model at the read-only tools to use instead."""
+    assert tool_name in READ_ONLY_INTENT_GUARD
+    assert "Use ONLY read-only tools" in READ_ONLY_INTENT_GUARD
+
+
+def test_guard_forbids_new_tools_on_validation_retry() -> None:
+    """On an output-format retry the model must reformat, not call new tools."""
+    guard = READ_ONLY_INTENT_GUARD
+    assert "OUTPUT-FORMAT RETRIES" in guard
+    assert "DO NOT call any new tool" in guard
+    assert "reformat" in guard
+    # The exact validation-error string that triggered the original derail.
+    assert "summary: Field required" in guard
+
+
+def test_guard_forbids_tool_call_loops() -> None:
+    """The guard tells the model to finish in one pass and never re-call a tool (#349).
+
+    Regression for the observed failure where a weak 8B model called
+    ``tool_list_runs`` four times in a row — even though it already had the data —
+    and blew the output-retry budget (``Exceeded maximum output retries (3)``).
+    """
+    guard = READ_ONLY_INTENT_GUARD
+    assert "FINISH IN ONE PASS" in guard
+    assert "AT MOST ONCE" in guard
+    assert "NEVER call a tool again that has already returned" in guard
+    assert "STOP calling tools" in guard
+
+
+def test_guard_handles_empty_tool_result() -> None:
+    """An empty read result is reported in the summary, not retried (#349)."""
+    guard = READ_ONLY_INTENT_GUARD
+    assert "EMPTY result" in guard
+    assert "do NOT retry the tool" in guard
+    # The wrapped example phrase, newlines/indent collapsed.
+    assert "No model runs found." in " ".join(guard.split())
+
+
+def test_guard_requires_clarification_for_ambiguous_top_products() -> None:
+    """An ambiguous "top products" ranking gets a clarifying question, not a guess."""
+    guard = READ_ONLY_INTENT_GUARD
+    assert "top products" in guard
+    assert "Top by revenue, units sold, forecasted demand, or model error?" in guard
+
+
+def test_guard_prohibits_invented_ids() -> None:
+    """The guard forbids inventing store_id / product_id / run_id values."""
+    guard = READ_ONLY_INTENT_GUARD
+    assert "NEVER invent" in guard
+    for token in ("store_id", "product_id", "run_id"):
+        assert token in guard
+
+
+def test_guard_states_limitation_when_no_tool_exists() -> None:
+    """The guard tells the model to state a missing-tool limitation, not fabricate."""
+    guard = READ_ONLY_INTENT_GUARD
+    assert "does not have a tool for that metric" in guard
+    assert "Do NOT invent data" in guard
+
+
+# Each example read-only prompt and the guard substring that proves the guard
+# governs that intent (so the named query class can never silently lose
+# coverage). Deterministic — no model is invoked.
+@pytest.mark.parametrize(
+    ("prompt", "covered_intent"),
+    [
+        (
+            "List the most recent model runs and tell me which has the lowest WAPE.",
+            "WAPE",
+        ),
+        ("List the top products.", "top products"),
+        (
+            "Which products have the highest forecasted demand?",
+            "highest forecasted demand",
+        ),
+        ("Show the current deployment alias.", "registry aliases and deployment status"),
+        ("Summarize total revenue and units sold.", "units-sold summaries"),
+        ("Show the backtest metrics for this grain.", "backtest metrics"),
+    ],
+)
+def test_read_only_intents_are_covered_by_guard(prompt: str, covered_intent: str) -> None:
+    """Every named read-only intent is enumerated in the guard's read-only list.
+
+    This is the routing contract: each of these prompts is a read-only request,
+    and the guard's read-only example list names its intent — so the model is
+    told to answer it with read tools only and never with a scenario/write tool.
+    """
+    assert covered_intent in READ_ONLY_INTENT_GUARD
+
+
+def test_guard_is_delivered_in_system_prompt_to_model() -> None:
+    """The guard actually reaches the model in the delivered system prompt.
+
+    Builds the real experiment agent against a stub FunctionModel (no live
+    call), captures the system prompt the framework sends, and asserts the guard
+    is present. Regression for #347 — a guard that never reaches the model is
+    worthless.
+    """
+    settings = get_settings()
+    settings.agent_default_model = "ollama:llama3.1"
+    agent = create_experiment_agent()
+
+    captured: dict[str, str] = {}
+
+    def respond(messages: list[ModelMessage], info: AgentInfo) -> ModelResponse:
+        for message in messages:
+            for part in getattr(message, "parts", []):
+                if getattr(part, "part_kind", None) == "system-prompt":
+                    captured["system_prompt"] = part.content
+        # End the run with a PromptedOutput-parseable text reply.
+        return ModelResponse(parts=[TextPart(content='{"summary": "noop"}')])
+
+    agent.run_sync(
+        "List the most recent model runs and tell me which has the lowest WAPE.",
+        model=FunctionModel(respond),
+        deps=AgentDeps(db=AsyncMock(), session_id="test-read-only-guard"),
+    )
+
+    system_prompt = captured.get("system_prompt", "")
+    assert "READ-ONLY INTENT GUARD" in system_prompt
+    assert "DO NOT call any new tool" in system_prompt
+    for tool_name in PROHIBITED_TOOLS:
+        assert tool_name in system_prompt
diff --git a/app/features/agents/tests/test_service.py b/app/features/agents/tests/test_service.py
index 08064495..759e0284 100644
--- a/app/features/agents/tests/test_service.py
+++ b/app/features/agents/tests/test_service.py
@@ -3,7 +3,7 @@
 import json
 from collections.abc import AsyncIterator
 from datetime import UTC, datetime, timedelta
-from typing import Any
+from typing import Any, cast
 from unittest.mock import AsyncMock, MagicMock, patch
 
 import pytest
@@ -14,6 +14,7 @@
     ModelRequest,
     ModelResponse,
     TextPart,
+    ToolReturnPart,
     UserPromptPart,
 )
 
@@ -335,6 +336,49 @@ async def test_chat_model_misbehavior_returns_friendly_message(
         assert "invalid tool call" in response.message
         assert "exceeded max retries" not in response.message
 
+    @pytest.mark.asyncio
+    async def test_chat_finalizer_salvages_answer_on_misbehavior(
+        self,
+        sample_active_session: AgentSession,
+    ) -> None:
+        """When tools fetched data but structured output failed, salvage a reply (#351).
+
+        A weak local model calls the read tool and gets the data, then can't wrap
+        it in the ExperimentReport schema and exhausts the output-retry budget.
+        The service then asks a tool-less finalizer to answer in plain text — the
+        user gets the answer instead of the generic "invalid tool call" error.
+        """
+        service = AgentService()
+        mock_db = AsyncMock()
+
+        mock_result = MagicMock()
+        mock_result.scalar_one_or_none.return_value = sample_active_session
+        mock_db.execute.return_value = mock_result
+
+        mock_agent = MagicMock()
+        mock_agent.run = AsyncMock(
+            side_effect=UnexpectedModelBehavior("Exceeded maximum output retries (3)")
+        )
+
+        salvaged_answer = "The lowest WAPE is the naive run 2fad611b (18.93)."
+        with (
+            patch.object(service, "_get_agent", return_value=mock_agent),
+            patch.object(
+                service,
+                "_salvage_plaintext_answer",
+                AsyncMock(return_value=salvaged_answer),
+            ),
+        ):
+            response = await service.chat(
+                db=mock_db,
+                session_id=sample_active_session.session_id,
+                message="List the most recent model runs and tell me which has the lowest WAPE.",
+            )
+
+        assert response.message == salvaged_answer
+        assert response.pending_approval is False
+        assert "invalid tool call" not in response.message
+
     @pytest.mark.asyncio
     async def test_chat_runs_tools_sequentially(
         self,
@@ -386,6 +430,7 @@ class TestAgentServiceStreamChat:
     async def test_stream_chat_model_misbehavior_yields_error_event(
         self,
         sample_active_session: AgentSession,
+        monkeypatch: pytest.MonkeyPatch,
     ) -> None:
         """A misbehaving model should yield a recoverable `error` event, not crash.
 
@@ -394,6 +439,9 @@ async def test_stream_chat_model_misbehavior_yields_error_event(
         raw exception string to the client.
         """
         service = AgentService()
+        # Pin a streaming-capable (cloud) provider so this exercises the
+        # run_stream path regardless of the local .env (#342).
+        monkeypatch.setattr(service.settings, "agent_default_model", "anthropic:claude-test")
         mock_db = AsyncMock()
 
         mock_result = MagicMock()
@@ -430,10 +478,104 @@ async def __aexit__(self, *exc: object) -> bool:
         assert events[0].data["error_type"] == "model_behavior_error"
         assert "exceeded max retries" not in events[0].data["error"]
 
+    @pytest.mark.asyncio
+    async def test_chat_surfaces_pending_action_on_model_misbehavior(
+        self,
+        sample_active_session: AgentSession,
+    ) -> None:
+        """A gated tool that fired before the model misbehaved must surface the
+        Approve card, not the generic error (#344).
+
+        A gated tool records ``deps.pending_action`` the moment it fires, but a
+        weak model can ramble past the gate and exhaust its retry budget, so
+        ``agent.run`` raises ``UnexpectedModelBehavior`` before returning. The
+        captured approval is valid and must not be discarded.
+        """
+        service = AgentService()
+        mock_db = AsyncMock()
+        mock_result = MagicMock()
+        mock_result.scalar_one_or_none.return_value = sample_active_session
+        mock_db.execute.return_value = mock_result
+
+        def _fire_gate_then_misbehave(*_args: Any, **kwargs: Any) -> None:
+            deps: AgentDeps = kwargs["deps"]
+            deps.set_pending_action(
+                "create_alias",
+                {"alias_name": "champion", "run_id": "1" * 32},
+                "Create alias champion",
+            )
+            raise UnexpectedModelBehavior("Exceeded maximum output retries (3)")
+
+        mock_agent = MagicMock()
+        mock_agent.run = AsyncMock(side_effect=_fire_gate_then_misbehave)
+
+        with patch.object(service, "_get_agent", return_value=mock_agent):
+            response = await service.chat(
+                db=mock_db,
+                session_id=sample_active_session.session_id,
+                message="Create alias champion. Call tool_create_alias now.",
+            )
+
+        assert response.pending_approval is True
+        assert response.pending_action is not None
+        assert response.pending_action.action_type == "create_alias"
+        assert response.pending_action.arguments["alias_name"] == "champion"
+        assert "invalid tool call" not in response.message
+        # Session flipped so POST /approve can find the action.
+        assert sample_active_session.status == SessionStatus.AWAITING_APPROVAL.value
+        assert sample_active_session.pending_action is not None
+
+    @pytest.mark.asyncio
+    async def test_stream_chat_surfaces_approval_on_model_misbehavior(
+        self,
+        sample_active_session: AgentSession,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        """The streaming path must emit ``approval_required`` (not ``error``)
+        when a gated tool fired before the model misbehaved (#344)."""
+        service = AgentService()
+        # Pin ollama so stream_chat uses the non-streaming run() path (#342) —
+        # the real-world scenario where this surfaced.
+        monkeypatch.setattr(service.settings, "agent_default_model", "ollama:qwen3:8b")
+        mock_db = AsyncMock()
+        mock_result = MagicMock()
+        mock_result.scalar_one_or_none.return_value = sample_active_session
+        mock_db.execute.return_value = mock_result
+
+        def _fire_gate_then_misbehave(*_args: Any, **kwargs: Any) -> None:
+            deps: AgentDeps = kwargs["deps"]
+            deps.set_pending_action(
+                "create_alias",
+                {"alias_name": "champion", "run_id": "1" * 32},
+                "Create alias champion",
+            )
+            raise UnexpectedModelBehavior("Exceeded maximum output retries (3)")
+
+        mock_agent = MagicMock()
+        mock_agent.run = AsyncMock(side_effect=_fire_gate_then_misbehave)
+
+        with patch.object(service, "_get_agent", return_value=mock_agent):
+            events = [
+                event
+                async for event in service.stream_chat(
+                    db=mock_db,
+                    session_id=sample_active_session.session_id,
+                    message="Create alias champion. Call tool_create_alias now.",
+                )
+            ]
+
+        event_types = [event.event_type for event in events]
+        assert "approval_required" in event_types
+        assert "error" not in event_types
+        approval = next(e for e in events if e.event_type == "approval_required")
+        assert approval.data["action"].action_type == "create_alias"
+        assert sample_active_session.status == SessionStatus.AWAITING_APPROVAL.value
+
     @pytest.mark.asyncio
     async def test_stream_chat_runs_tools_sequentially(
         self,
         sample_active_session: AgentSession,
+        monkeypatch: pytest.MonkeyPatch,
     ) -> None:
         """stream_chat() must also run the agent under sequential tool execution.
 
@@ -442,6 +584,9 @@ async def test_stream_chat_runs_tools_sequentially(
         concurrent-session bug from issue #172.
         """
         service = AgentService()
+        # Pin a streaming-capable (cloud) provider so this exercises the
+        # run_stream path regardless of the local .env (#342).
+        monkeypatch.setattr(service.settings, "agent_default_model", "anthropic:claude-test")
         mock_db = AsyncMock()
 
         mock_result = MagicMock()
@@ -484,6 +629,120 @@ async def __aexit__(self, *exc: object) -> bool:
 
         mock_mode.assert_called_once_with("sequential")
 
+    @pytest.mark.asyncio
+    async def test_stream_chat_ollama_uses_nonstreaming_path(
+        self,
+        sample_active_session: AgentSession,
+        sample_experiment_report: ExperimentReport,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        """#342 — an ollama agent uses agent.run() (not run_stream).
+
+        Ollama's OpenAI-compat endpoint rejects PydanticAI's streamed request
+        with 400 "invalid message content type: <nil>". The service must fall
+        back to the non-streaming run() path and still emit text_delta +
+        approval_required (from deps.pending_action, #336) + complete.
+        """
+        service = AgentService()
+        monkeypatch.setattr(service.settings, "agent_default_model", "ollama:qwen3:8b")
+        mock_db = AsyncMock()
+        mock_result = MagicMock()
+        mock_result.scalar_one_or_none.return_value = sample_active_session
+        mock_db.execute.return_value = mock_result
+
+        def _run(message: str, *, deps: AgentDeps, message_history: Any) -> MagicMock:
+            # A gated tool fired during the run and recorded an approval request.
+            deps.set_pending_action(
+                "save_scenario",
+                {"name": "p", "run_id": "r", "store_id": 1, "product_id": 2},
+                "Save scenario plan 'p'",
+            )
+            res = MagicMock()
+            res.output = sample_experiment_report  # has a non-empty summary
+            usage = MagicMock()
+            usage.total_tokens = 11
+            res.usage.return_value = usage
+            res.all_messages.return_value = []
+            return res
+
+        mock_agent = MagicMock()
+        mock_agent.run = AsyncMock(side_effect=_run)
+        mock_agent.run_stream = MagicMock(
+            side_effect=AssertionError("run_stream must not be called for the ollama provider")
+        )
+
+        with patch.object(service, "_get_agent", return_value=mock_agent):
+            events = [
+                event
+                async for event in service.stream_chat(
+                    db=mock_db,
+                    session_id=sample_active_session.session_id,
+                    message="Save a what-if scenario plan",
+                )
+            ]
+
+        types = [e.event_type for e in events]
+        assert "text_delta" in types  # full reply emitted as one delta
+        assert "approval_required" in types
+        assert types[-1] == "complete"
+        approval = next(e for e in events if e.event_type == "approval_required")
+        assert approval.data["action"].action_type == "save_scenario"
+        mock_agent.run.assert_awaited_once()
+        mock_agent.run_stream.assert_not_called()
+        assert sample_active_session.status == SessionStatus.AWAITING_APPROVAL.value
+
+    @pytest.mark.asyncio
+    async def test_stream_chat_cloud_keeps_streaming_path(
+        self,
+        sample_active_session: AgentSession,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        """Regression guard for #342 — a cloud provider keeps the run_stream path."""
+        service = AgentService()
+        monkeypatch.setattr(service.settings, "agent_default_model", "anthropic:claude-test")
+        mock_db = AsyncMock()
+        mock_result = MagicMock()
+        mock_result.scalar_one_or_none.return_value = sample_active_session
+        mock_db.execute.return_value = mock_result
+
+        class _StubStream:
+            async def __aenter__(self) -> MagicMock:
+                stream = MagicMock()
+
+                async def _stream_text() -> AsyncIterator[str]:
+                    yield "hello"
+
+                stream.stream_text = _stream_text
+                stream.get_output = AsyncMock(return_value=None)
+                usage = MagicMock()
+                usage.total_tokens = 1
+                stream.usage.return_value = usage
+                stream.all_messages.return_value = []
+                return stream
+
+            async def __aexit__(self, *exc: object) -> bool:
+                return False
+
+        mock_agent = MagicMock()
+        mock_agent.run_stream = MagicMock(return_value=_StubStream())
+        mock_agent.run = AsyncMock(
+            side_effect=AssertionError("run must not be called for a cloud provider")
+        )
+
+        with patch.object(service, "_get_agent", return_value=mock_agent):
+            events = [
+                event
+                async for event in service.stream_chat(
+                    db=mock_db,
+                    session_id=sample_active_session.session_id,
+                    message="hello",
+                )
+            ]
+
+        mock_agent.run_stream.assert_called_once()
+        mock_agent.run.assert_not_called()
+        assert any(e.event_type == "complete" for e in events)
+
 
 class TestAgentServiceApproval:
     """Tests for approval workflow."""
@@ -777,3 +1036,240 @@ def test_increment_tool_calls(self, mock_db_session: AsyncMock) -> None:
         assert deps.tool_call_count == 1
         deps.increment_tool_calls()
         assert deps.tool_call_count == 2
+
+    def test_set_pending_action_records_request(self, mock_db_session: AsyncMock) -> None:
+        """set_pending_action should record a machine-readable HITL request (#336)."""
+        deps = AgentDeps(db=mock_db_session, session_id="test-123")
+        assert deps.pending_action is None
+
+        deps.set_pending_action(
+            "save_scenario",
+            {"name": "p", "run_id": "r", "store_id": 1, "product_id": 2},
+            "Save scenario plan 'p'",
+        )
+
+        assert deps.pending_action is not None
+        assert deps.pending_action["action_type"] == "save_scenario"
+        assert deps.pending_action["arguments"]["run_id"] == "r"
+        assert deps.pending_action["description"] == "Save scenario plan 'p'"
+
+
+class TestAgentServiceDepsApproval:
+    """Regression tests for #336 — gated tools propagate approval via deps.
+
+    The experiment agent's structured output (ExperimentReport) carries no
+    pending_action/approval_required field, so a gated tool call (e.g.
+    save_scenario) used to leave the session ``active`` with no pending action
+    and no ``approval_required`` event. These assert the deterministic
+    deps-based path: tool -> deps.pending_action -> awaiting_approval ->
+    approval_required.
+    """
+
+    @staticmethod
+    def _save_scenario_pending(deps: AgentDeps) -> None:
+        """Simulate the gated save_scenario tool short-circuiting for approval."""
+        deps.set_pending_action(
+            "save_scenario",
+            {
+                "name": "plan-a",
+                "run_id": "702c7ce74e9848d3b11f124a71bf7b50",
+                "store_id": 111,
+                "product_id": 339,
+                "horizon": 14,
+                "assumptions": {},
+                "source": "agent",
+                "agent_session_id": deps.session_id,
+            },
+            "Save scenario plan 'plan-a' for store 111 / product 339",
+        )
+
+    @pytest.mark.asyncio
+    async def test_chat_persists_pending_action_from_deps(
+        self,
+        sample_active_session: AgentSession,
+        sample_experiment_report: ExperimentReport,
+    ) -> None:
+        """chat() must persist deps.pending_action even when the output lacks one."""
+        service = AgentService()
+        mock_db = AsyncMock()
+        mock_result = MagicMock()
+        mock_result.scalar_one_or_none.return_value = sample_active_session
+        mock_db.execute.return_value = mock_result
+
+        def _run(message: str, *, deps: AgentDeps, message_history: Any) -> MagicMock:
+            # A gated tool fired during the run and recorded the approval request.
+            self._save_scenario_pending(deps)
+            res = MagicMock()
+            res.output = sample_experiment_report  # no pending_action field
+            usage = MagicMock()
+            usage.total_tokens = 7
+            res.usage.return_value = usage
+            res.all_messages.return_value = []
+            return res
+
+        mock_agent = MagicMock()
+        mock_agent.run = AsyncMock(side_effect=_run)
+
+        with patch.object(service, "_get_agent", return_value=mock_agent):
+            response = await service.chat(
+                db=mock_db,
+                session_id=sample_active_session.session_id,
+                message="Save a what-if scenario plan for run 702c...",
+            )
+
+        assert response.pending_approval is True
+        assert response.pending_action is not None
+        assert response.pending_action.action_type == "save_scenario"
+        assert response.pending_action.arguments["run_id"] == "702c7ce74e9848d3b11f124a71bf7b50"
+        assert sample_active_session.status == SessionStatus.AWAITING_APPROVAL.value
+        assert sample_active_session.pending_action is not None
+        assert sample_active_session.pending_action["action_type"] == "save_scenario"
+
+    @pytest.mark.asyncio
+    async def test_stream_chat_emits_approval_required_from_deps(
+        self,
+        sample_active_session: AgentSession,
+        sample_experiment_report: ExperimentReport,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        """stream_chat() must emit approval_required from deps.pending_action."""
+        service = AgentService()
+        # Pin a streaming-capable (cloud) provider so this exercises the
+        # run_stream path regardless of the local .env (#342).
+        monkeypatch.setattr(service.settings, "agent_default_model", "anthropic:claude-test")
+        mock_db = AsyncMock()
+        mock_result = MagicMock()
+        mock_result.scalar_one_or_none.return_value = sample_active_session
+        mock_db.execute.return_value = mock_result
+
+        report = sample_experiment_report
+
+        class _StubStream:
+            async def __aenter__(self) -> MagicMock:
+                stream = MagicMock()
+
+                async def _stream_text() -> AsyncIterator[str]:
+                    # Structured-output agents cannot stream text deltas; mirror
+                    # that by yielding nothing.
+                    return
+                    yield  # pragma: no cover
+
+                stream.stream_text = _stream_text
+                stream.get_output = AsyncMock(return_value=report)
+                usage = MagicMock()
+                usage.total_tokens = 9
+                stream.usage.return_value = usage
+                stream.all_messages.return_value = []
+                return stream
+
+            async def __aexit__(self, *exc: object) -> bool:
+                return False
+
+        def _run_stream(message: str, *, deps: AgentDeps, message_history: Any) -> _StubStream:
+            self._save_scenario_pending(deps)
+            return _StubStream()
+
+        mock_agent = MagicMock()
+        mock_agent.run_stream = MagicMock(side_effect=_run_stream)
+
+        with patch.object(service, "_get_agent", return_value=mock_agent):
+            events = [
+                event
+                async for event in service.stream_chat(
+                    db=mock_db,
+                    session_id=sample_active_session.session_id,
+                    message="Save a what-if scenario plan for run 702c...",
+                )
+            ]
+
+        approval_events = [e for e in events if e.event_type == "approval_required"]
+        assert len(approval_events) == 1
+        assert approval_events[0].data["action"].action_type == "save_scenario"
+        assert sample_active_session.status == SessionStatus.AWAITING_APPROVAL.value
+        assert sample_active_session.pending_action is not None
+
+
+class TestFinalizerSalvage:
+    """The plain-text finalizer fallback used on structured-output failure (#351)."""
+
+    def test_extract_tool_payloads_pulls_tool_returns(self) -> None:
+        """Tool returns are extracted from a captured run trace, in order."""
+        captured: list[ModelMessage] = [
+            ModelRequest(parts=[UserPromptPart(content="List runs")]),
+            ModelResponse(parts=[TextPart(content="{}")]),
+            ModelRequest(
+                parts=[
+                    ToolReturnPart(
+                        tool_name="tool_list_runs",
+                        content={"runs": [{"run_id": "abc", "wape": 18.93}]},
+                        tool_call_id="call-1",
+                    )
+                ]
+            ),
+        ]
+
+        payloads = AgentService._extract_tool_payloads(captured)
+
+        assert payloads == [
+            {"tool": "tool_list_runs", "result": {"runs": [{"run_id": "abc", "wape": 18.93}]}}
+        ]
+
+    def test_extract_tool_payloads_empty_when_no_tool_returns(self) -> None:
+        """No tool returns (model failed before any tool ran) yields an empty list."""
+        captured: list[ModelMessage] = [
+            ModelRequest(parts=[UserPromptPart(content="List runs")]),
+            ModelResponse(parts=[TextPart(content='{"runs": []}')]),
+        ]
+
+        assert AgentService._extract_tool_payloads(captured) == []
+
+    @pytest.mark.asyncio
+    async def test_salvage_returns_none_without_tool_data(self) -> None:
+        """With no captured tool data, salvage returns None (caller emits the error)."""
+        service = AgentService()
+        result = await service._salvage_plaintext_answer("any question", [])
+        assert result is None
+
+    def test_compact_for_finalizer_strips_verbose_keys_keeps_metrics(self) -> None:
+        """Compaction drops bulky config/runtime blobs but keeps identity + metrics (#351).
+
+        Regression for the finalizer reporting 99.0 as "lowest WAPE" when the
+        true minimum (18.93) had been truncated out of the oversized payload.
+        """
+        raw = [
+            {
+                "tool": "tool_list_runs",
+                "result": {
+                    "runs": [
+                        {
+                            "run_id": "a",
+                            "model_type": "seasonal_naive",
+                            "metrics": {"wape": 99.0},
+                            "model_config_data": {"x": "y" * 500},
+                            "runtime_info": {"python": "3.12"},
+                            "artifact_uri": "demo/seasonal-model_a.joblib",
+                        },
+                        {
+                            "run_id": "b",
+                            "model_type": "naive",
+                            "metrics": {"wape": 18.93},
+                            "feature_config": {"lots": "of stuff"},
+                        },
+                    ]
+                },
+            }
+        ]
+
+        compact = cast(list[dict[str, Any]], AgentService._compact_for_finalizer(raw))
+        runs = compact[0]["result"]["runs"]
+
+        # Identity + metrics survive for BOTH runs (so a ranking sees 18.93).
+        assert runs[0]["run_id"] == "a"
+        assert runs[0]["metrics"] == {"wape": 99.0}
+        assert runs[1]["run_id"] == "b"
+        assert runs[1]["metrics"] == {"wape": 18.93}
+        # Verbose blobs are gone.
+        assert "model_config_data" not in runs[0]
+        assert "runtime_info" not in runs[0]
+        assert "artifact_uri" not in runs[0]
+        assert "feature_config" not in runs[1]
diff --git a/app/features/demo/pipeline.py b/app/features/demo/pipeline.py
index c56ae925..041d5361 100644
--- a/app/features/demo/pipeline.py
+++ b/app/features/demo/pipeline.py
@@ -39,6 +39,7 @@
 
 from app.core.config import get_settings
 from app.core.logging import get_logger
+from app.core.problem_details import EMBEDDING_AUTH_CODE, ERROR_TYPES
 from app.features.demo.schemas import DemoRunRequest, StepEvent, StepStatus
 from app.shared.seeder.config import ScenarioPreset
 
@@ -279,15 +280,21 @@ def _model_config_payload(model_type: str) -> dict[str, Any]:
 
 
 def _llm_key_present() -> bool:
-    """Return True when the configured agent model's provider API key is set.
+    """Return True when the configured agent model's provider can be used.
 
     Matches the provider prefix of ``agent_default_model`` so the agent step
     skips gracefully when its provider is unreachable. Logs key PRESENCE only,
     never the value (port of run_demo.py:317-335; see security-patterns.md).
+
+    The local ``ollama`` provider needs no API key (#340), so it always returns
+    True — the agent step still degrades gracefully if Ollama is unreachable
+    (the chat round-trip fails and the step skips via its error path).
     """
     settings = get_settings()
     model = settings.agent_default_model
     provider = model.split(":", 1)[0] if ":" in model else ""
+    if provider == "ollama":
+        return True
     if provider == "anthropic":
         return bool(settings.anthropic_api_key)
     if provider == "openai":
@@ -389,6 +396,31 @@ async def _embedding_provider_reachable(client: _Client) -> tuple[bool, str]:
     return (False, provider)
 
 
+# PRP-42 (#329) — the RAG routes stamp an embedding-provider auth failure
+# (401/403) with the machine-readable EMBEDDING_AUTH code/type. The probe only
+# checks key *presence*, so a placeholder/invalid key passes the probe but the
+# indexing call then 502s with this marker; the knowledge steps classify it and
+# SKIP gracefully instead of hard-failing. Both the code and the type slug come
+# from the single source of truth in app/core/problem_details.py (mirrors
+# EmbeddingProviderAuthError; memory anchor: [[rag-runtime-config-and-corpus-state]]).
+_EMBEDDING_AUTH_TYPE_SLUG = ERROR_TYPES[EMBEDDING_AUTH_CODE].rsplit("/", 1)[-1]
+
+
+def _is_embedding_auth_error(exc: _StepError) -> bool:
+    """True when a _StepError is the embedding-provider auth 502 (#329).
+
+    Classifies on the machine-readable RFC 7807 ``code`` / ``type`` from the
+    problem+json body — never on brittle ``detail`` text matching. The ``type``
+    match is lenient (final path segment) so a fully-qualified problem URI
+    classifies the same as the canonical relative one.
+    """
+    problem = exc.problem
+    if problem.get("code") == EMBEDDING_AUTH_CODE:
+        return True
+    type_uri = problem.get("type")
+    return isinstance(type_uri, str) and type_uri.rsplit("/", 1)[-1] == _EMBEDDING_AUTH_TYPE_SLUG
+
+
 def _select_winner(
     backtest_results: dict[str, dict[str, float]],
 ) -> tuple[str, float] | None:
@@ -1382,17 +1414,27 @@ async def step_rag_index_subset(ctx: DemoContext, client: _Client) -> StepResult
     if ctx.embedding_unreachable:
         return ("skip", "embedding provider unreachable", {})
 
-    body = await client.request(
-        "rag_index_subset",
-        "POST",
-        "/rag/index/project-docs",
-        json_body={
-            "include_docs": True,
-            "include_prps": False,
-            "include_root": False,
-            "path_prefix": "docs/user-guide",
-        },
-    )
+    try:
+        body = await client.request(
+            "rag_index_subset",
+            "POST",
+            "/rag/index/project-docs",
+            json_body={
+                "include_docs": True,
+                "include_prps": False,
+                "include_root": False,
+                "path_prefix": "docs/user-guide",
+            },
+        )
+    except _StepError as exc:
+        # PRP-42 (#329) — the probe only checks key *presence*; a placeholder /
+        # invalid key passes it but the index call 502s with EMBEDDING_AUTH.
+        # Treat it like an unreachable provider: SKIP (not FAIL) and mark the
+        # context so the retrieve probe skips too, without a second 401 round-trip.
+        if _is_embedding_auth_error(exc):
+            ctx.embedding_unreachable = True
+            return ("skip", "embedding provider rejected credentials", {})
+        raise
     results = body.get("results") or []
     total_chunks = int(body.get("total_chunks", 0))
     failed = int(body.get("failed", 0))
@@ -1428,12 +1470,20 @@ async def step_rag_retrieve_probe(ctx: DemoContext, client: _Client) -> StepResu
     if ctx.embedding_unreachable:
         return ("skip", "embedding provider unreachable", {})
 
-    body = await client.request(
-        "rag_retrieve_probe",
-        "POST",
-        "/rag/retrieve",
-        json_body={"query": "How do I run the demo pipeline?", "top_k": 3},
-    )
+    try:
+        body = await client.request(
+            "rag_retrieve_probe",
+            "POST",
+            "/rag/retrieve",
+            json_body={"query": "How do I run the demo pipeline?", "top_k": 3},
+        )
+    except _StepError as exc:
+        # PRP-42 (#329) — same auth-classified graceful skip as the index step,
+        # in case retrieve is reached with a freshly-rejecting key.
+        if _is_embedding_auth_error(exc):
+            ctx.embedding_unreachable = True
+            return ("skip", "embedding provider rejected credentials", {})
+        raise
     results = body.get("results") or []
     if not results:
         return (
diff --git a/app/features/demo/tests/test_pipeline.py b/app/features/demo/tests/test_pipeline.py
index 6e9fd7ea..5f73a8c8 100644
--- a/app/features/demo/tests/test_pipeline.py
+++ b/app/features/demo/tests/test_pipeline.py
@@ -1468,6 +1468,93 @@ async def test_rag_index_subset_skips_when_provider_unreachable():
     assert client.calls == []
 
 
+async def test_rag_index_subset_skips_on_embedding_auth_502():
+    """#329 — an EMBEDDING_AUTH 502 (invalid/placeholder key) SKIPs, not FAILs.
+
+    The probe only checks key presence, so a bad key reaches the index call and
+    502s with the machine-readable EMBEDDING_AUTH marker. The step classifies it
+    and skips, and marks the context so the retrieve probe skips too.
+    """
+    ctx = _make_showcase_ctx()
+    assert ctx.embedding_unreachable is False
+    client = _RecordingClient(
+        None,
+        errors={
+            ("POST", "/rag/index/project-docs"): pipeline._StepError(
+                "rag_index_subset",
+                502,
+                {
+                    "type": "/errors/embedding-auth",
+                    "title": "Embedding Auth",
+                    "status": 502,
+                    "code": "EMBEDDING_AUTH",
+                    "detail": "Embedding provider rejected the credentials",
+                },
+            ),
+        },
+    )
+    status, detail, _ = await pipeline.step_rag_index_subset(ctx, _as_client(client))
+    assert status == "skip"
+    assert "rejected credentials" in detail
+    # The call WAS attempted (unlike the unreachable case)...
+    assert len(client.calls) == 1
+    # ...and the context is now marked so the retrieve probe skips too.
+    assert ctx.embedding_unreachable is True
+
+
+async def test_rag_index_subset_skips_on_embedding_auth_type_only():
+    """#329 — classification by `type` alone (no `code`) still SKIPs gracefully.
+
+    The classifier accepts a problem whose `type` URI's final path segment is
+    `embedding-auth` even when there is no `code` field — and even when the
+    `type` is a fully-qualified absolute URI rather than the canonical relative
+    one. The step must still skip and flag the context.
+    """
+    ctx = _make_showcase_ctx()
+    assert ctx.embedding_unreachable is False
+    client = _RecordingClient(
+        None,
+        errors={
+            ("POST", "/rag/index/project-docs"): pipeline._StepError(
+                "rag_index_subset",
+                502,
+                {
+                    # No "code" key — only an absolute "type" ending in the slug.
+                    "type": "https://errors.example.com/rag/embedding-auth",
+                    "title": "Embedding Auth",
+                    "status": 502,
+                    "detail": "Embedding provider rejected the credentials",
+                },
+            ),
+        },
+    )
+    status, detail, _ = await pipeline.step_rag_index_subset(ctx, _as_client(client))
+    assert status == "skip"
+    assert "rejected credentials" in detail
+    assert len(client.calls) == 1
+    assert ctx.embedding_unreachable is True
+
+
+async def test_rag_index_subset_reraises_non_auth_502():
+    """#329 — a non-auth 502 (e.g. connection failure) still propagates as FAIL."""
+    import pytest
+
+    ctx = _make_showcase_ctx()
+    client = _RecordingClient(
+        None,
+        errors={
+            ("POST", "/rag/index/project-docs"): pipeline._StepError(
+                "rag_index_subset",
+                502,
+                {"title": "Bad Gateway", "detail": "Embedding generation failed: timeout"},
+            ),
+        },
+    )
+    with pytest.raises(pipeline._StepError):
+        await pipeline.step_rag_index_subset(ctx, _as_client(client))
+    assert ctx.embedding_unreachable is False
+
+
 async def test_rag_retrieve_probe_happy_path():
     """PRP-40 — top hit + similarity score surface on PASS."""
     ctx = _make_showcase_ctx()
@@ -1521,6 +1608,31 @@ async def test_rag_retrieve_probe_skips_when_provider_unreachable():
     assert client.calls == []
 
 
+async def test_rag_retrieve_probe_skips_on_embedding_auth_502():
+    """#329 — retrieve also classifies an EMBEDDING_AUTH 502 as SKIP, not FAIL."""
+    ctx = _make_showcase_ctx()
+    client = _RecordingClient(
+        None,
+        errors={
+            ("POST", "/rag/retrieve"): pipeline._StepError(
+                "rag_retrieve_probe",
+                502,
+                {
+                    "type": "/errors/embedding-auth",
+                    "title": "Embedding Auth",
+                    "status": 502,
+                    "code": "EMBEDDING_AUTH",
+                    "detail": "Embedding provider rejected the credentials",
+                },
+            ),
+        },
+    )
+    status, detail, _ = await pipeline.step_rag_retrieve_probe(ctx, _as_client(client))
+    assert status == "skip"
+    assert "rejected credentials" in detail
+    assert ctx.embedding_unreachable is True
+
+
 async def test_run_pipeline_showcase_rich_runs_planning_and_knowledge(monkeypatch, tmp_path):
     """PRP-40 — end-to-end SHOWCASE_RICH reaches the 5 new steps + greens."""
     artifact = tmp_path / "artifacts" / "models" / "model_abc123def456.joblib"
@@ -1689,6 +1801,41 @@ async def request(
     return _HitlClient(event_sink=intermediate), intermediate
 
 
+def test_llm_key_present_ollama_needs_no_key(monkeypatch):
+    """#340 — the local ollama provider needs no API key, so the gate is True.
+
+    Without this, a local-Ollama stack (agent_default_model=ollama:*) makes the
+    showcase agent_hitl_flow / agent steps skip with "no API key matching
+    agent_default_model provider" even though Ollama is reachable.
+    """
+    monkeypatch.setattr(
+        pipeline,
+        "get_settings",
+        lambda: SimpleNamespace(
+            agent_default_model="ollama:qwen3:8b",
+            anthropic_api_key="",
+            openai_api_key="",
+            google_api_key="",
+        ),
+    )
+    assert pipeline._llm_key_present() is True
+
+
+def test_llm_key_present_cloud_still_requires_key(monkeypatch):
+    """Regression guard for #340 — a cloud provider still requires its key."""
+    monkeypatch.setattr(
+        pipeline,
+        "get_settings",
+        lambda: SimpleNamespace(
+            agent_default_model="openai:gpt-4.1-mini",
+            anthropic_api_key="",
+            openai_api_key="",
+            google_api_key="",
+        ),
+    )
+    assert pipeline._llm_key_present() is False
+
+
 async def test_agent_hitl_flow_happy_path(monkeypatch, tmp_path):
     """PRP-41 — full HITL round-trip: chat -> intermediate -> approve -> pass."""
     monkeypatch.setattr(
diff --git a/app/features/model_selection/__init__.py b/app/features/model_selection/__init__.py
new file mode 100644
index 00000000..01931b63
--- /dev/null
+++ b/app/features/model_selection/__init__.py
@@ -0,0 +1,9 @@
+"""Forecast Champion Selector — backend vertical slice (issue #353).
+
+Validates a (store, product) pair's data availability, runs comparable
+backtests for a set of candidate forecasting models, deterministically ranks
+them, selects a champion with a recommendation confidence, persists an
+auditable selection run, and optionally trains/predicts with the winner.
+
+Backend-only by design — the UI is a deliberate follow-up PRP.
+"""
diff --git a/app/features/model_selection/capabilities.py b/app/features/model_selection/capabilities.py
new file mode 100644
index 00000000..5c513496
--- /dev/null
+++ b/app/features/model_selection/capabilities.py
@@ -0,0 +1,157 @@
+"""Pure model-capability catalog for the champion selector (issue #356, Slice A).
+
+No DB, no I/O — :func:`build_model_catalog` is deterministic and unit-tested
+directly (mirrors ``ranking.py`` / ``explanations.py``). It surfaces the
+forecasting model union as a frontend-consumable catalog so the React
+``MODEL_FAMILY_MAP`` / labels never drift from the Python authority.
+
+Capability provenance (BACKEND-OWNED, verified 2026-06-01):
+- ``family``         — ``forecasting.feature_metadata.model_family_for`` (lazy
+  cross-slice import inside the builder, per the slice's import discipline).
+- ``feature_aware``  — the set whose forecasters set ``requires_features=True``
+  (RandomForest/Regression/LightGBM/XGBoost/ProphetLike), i.e. exactly the set
+  ``ForecastingService.predict()`` rejects (``forecasting/service.py``).
+- ``requires_extra`` — ``lightgbm``/``xgboost`` (opt-in extras that may
+  ``ImportError`` when the extra is not installed).
+- ``supports_auto_predict`` — ``not feature_aware`` (feature-aware winners
+  forecast through ``POST /scenarios/simulate``, not the plain predict path).
+- ``default_params``  — the FLAT model-tuning defaults pinned from the live
+  ``forecasting.schemas.ModelConfig`` members (the internal ``schema_version``
+  and ``feature_config_hash`` meta fields are intentionally omitted).
+"""
+
+from __future__ import annotations
+
+from dataclasses import dataclass, field
+
+from app.features.model_selection.schemas import (
+    CandidateModelInfo,
+    ModelCatalogResponse,
+)
+
+# Models gated behind the matching opt-in extra (may be absent at runtime).
+_REQUIRES_EXTRA: frozenset[str] = frozenset({"lightgbm", "xgboost"})
+
+# Feature-aware models — their forecasters set ``requires_features=True`` and
+# ``ForecastingService.predict()`` rejects them (they need an exogenous feature
+# frame). Verified against ``forecasting/models.py`` requires_features flags.
+_FEATURE_AWARE: frozenset[str] = frozenset(
+    {"regression", "prophet_like", "lightgbm", "xgboost", "random_forest"}
+)
+
+# The default candidate set the backend ``POST /run`` contract documents — the
+# UI pre-selects exactly these.
+DEFAULT_CANDIDATE_MODEL_TYPES: list[str] = [
+    "naive",
+    "seasonal_naive",
+    "moving_average",
+    "regression",
+    "prophet_like",
+]
+
+
+@dataclass(frozen=True)
+class _CatalogEntry:
+    """Slice-local presentation metadata for one model_type."""
+
+    label: str
+    description: str
+    default_params: dict[str, object] = field(default_factory=lambda: {})
+
+
+# Ordered map: model_type → presentation metadata. The KEYS must equal the
+# ``ModelType`` Literal in ``schemas.py`` exactly (asserted in
+# ``test_capabilities.py``). ``default_params`` are the flat model-tuning
+# defaults from the forecasting ``ModelConfig`` members (schema_version /
+# feature_config_hash meta fields omitted), pinned 2026-06-01.
+_CATALOG: dict[str, _CatalogEntry] = {
+    "naive": _CatalogEntry(
+        label="Naive",
+        description="Repeats the last observed value.",
+    ),
+    "seasonal_naive": _CatalogEntry(
+        label="Seasonal Naive",
+        description="Repeats the value from one season ago.",
+        default_params={"season_length": 7},
+    ),
+    "moving_average": _CatalogEntry(
+        label="Moving Average",
+        description="Averages the last N observed values.",
+        default_params={"window_size": 7},
+    ),
+    "weighted_moving_average": _CatalogEntry(
+        label="Weighted Moving Average",
+        description="Recency-weighted average of the last N values.",
+        default_params={"window_size": 7, "weight_strategy": "linear", "decay": 0.7},
+    ),
+    "seasonal_average": _CatalogEntry(
+        label="Seasonal Average",
+        description="Averages the same season-position across recent cycles.",
+        default_params={"season_length": 7, "lookback_cycles": 4, "trim_outliers": False},
+    ),
+    "trend_regression_baseline": _CatalogEntry(
+        label="Trend Regression Baseline",
+        description="Ridge trend with optional day-of-week / month terms.",
+        default_params={"alpha": 1.0, "include_dow": True, "include_month": True},
+    ),
+    "random_forest": _CatalogEntry(
+        label="Random Forest",
+        description="Feature-aware random-forest regressor over lag/calendar features.",
+        default_params={"n_estimators": 100, "max_depth": 10, "min_samples_leaf": 2},
+    ),
+    "lightgbm": _CatalogEntry(
+        label="LightGBM",
+        description="Gradient-boosted trees (opt-in extra) over engineered features.",
+        default_params={"n_estimators": 100, "max_depth": 6, "learning_rate": 0.1},
+    ),
+    "xgboost": _CatalogEntry(
+        label="XGBoost",
+        description="Extreme gradient boosting (opt-in extra) over engineered features.",
+        default_params={"n_estimators": 100, "max_depth": 6, "learning_rate": 0.1},
+    ),
+    "regression": _CatalogEntry(
+        label="Gradient Boosting Regression",
+        description="Histogram gradient-boosting over lag, calendar, and exogenous features.",
+        default_params={"max_iter": 200, "learning_rate": 0.05, "max_depth": 6},
+    ),
+    "prophet_like": _CatalogEntry(
+        label="Prophet-like Additive",
+        description="Additive trend/seasonality Ridge over engineered features.",
+        default_params={"alpha": 1.0},
+    ),
+}
+
+
+def build_model_catalog() -> ModelCatalogResponse:
+    """Build the backend-owned candidate-model catalog (pure, no I/O).
+
+    Iterates the slice-local ``_CATALOG`` in declaration order, deriving each
+    entry's ``family`` from the forecasting authority and its capability flags
+    from the module-level sets. Returns the full catalog plus the documented
+    default candidate set.
+    """
+    # Lazy cross-slice import (mirror service.py) — avoids closing an alembic
+    # cold-boot import cycle through the forecasting slice.
+    from app.features.forecasting.feature_metadata import model_family_for
+
+    models: list[CandidateModelInfo] = []
+    for model_type, meta in _CATALOG.items():
+        feature_aware = model_type in _FEATURE_AWARE
+        models.append(
+            CandidateModelInfo(
+                model_type=model_type,
+                label=meta.label,
+                # ``ModelFamily`` is a ``str, Enum`` whose ``.value`` is already
+                # typed as the ``baseline|tree|additive`` literal the schema wants.
+                family=model_family_for(model_type).value,
+                feature_aware=feature_aware,
+                requires_extra=model_type in _REQUIRES_EXTRA,
+                default_params=dict(meta.default_params),
+                supports_auto_predict=not feature_aware,
+                description=meta.description,
+            )
+        )
+    return ModelCatalogResponse(
+        models=models,
+        default_candidate_model_types=list(DEFAULT_CANDIDATE_MODEL_TYPES),
+    )
diff --git a/app/features/model_selection/decision.py b/app/features/model_selection/decision.py
new file mode 100644
index 00000000..335a3ee8
--- /dev/null
+++ b/app/features/model_selection/decision.py
@@ -0,0 +1,137 @@
+"""Deterministic forecast-decision layer for the champion selector (Slice C).
+
+Pure functions — NO LLM, NO DB, NO I/O (mirror ``explanations.py``). Translate a
+horizon forecast into an inventory-decision heuristic a planner can act on:
+peak/low demand day, a CLEARLY-LABELED safety-stock heuristic, and bias-risk
+wording.
+
+The safety-stock formula is the demand-variability-only form (King 2011,
+constant lead time):
+
+    safety_stock = z(service_level) * sigma_daily * sqrt(lead_time_days)
+    expected_demand_over_lead_time = average_demand * lead_time_days
+    reorder_point = expected_demand_over_lead_time + safety_stock
+
+``z`` comes from a fixed one-sided service-level lookup (NO scipy); an
+in-between service level falls back to the nearest table key. Every field is
+labeled ``method="heuristic"`` and carries a caveat — this output NEVER feeds
+ranking (LOCKED #3).
+"""
+
+from __future__ import annotations
+
+import statistics
+from datetime import date
+from typing import Any
+
+from app.features.model_selection.schemas import ForecastDecision
+
+# LOCKED #4 — the canonical bias sentence, kept byte-identical to the frontend
+# ``BIAS_EXPLANATION`` constant (``components/champion-selector/copy.ts``) so the
+# wording never drifts between the two surfaces.
+BIAS_EXPLANATION = (
+    "Positive bias means the model under-forecasts (risk of stockouts); "
+    "negative bias means it over-forecasts (risk of overstock)."
+)
+
+# One-sided service-level z values (NO scipy dependency). Source: King 2011
+# safety-stock z-from-service-level table.
+_Z_TABLE: dict[float, float] = {0.90: 1.2816, 0.95: 1.6449, 0.975: 1.9600, 0.99: 2.3263}
+
+_CAVEATS = [
+    "Safety stock is a deterministic heuristic (demand variability only; constant lead time).",
+    "Not a substitute for a full inventory-optimisation model.",
+]
+
+
+def z_for_service_level(service_level: float) -> float:
+    """Return the one-sided z for a service level (exact key, else nearest).
+
+    An exact table key returns its z directly; any other level snaps to the
+    nearest table key (documented heuristic — the table is coarse on purpose).
+    """
+    if service_level in _Z_TABLE:
+        return _Z_TABLE[service_level]
+    nearest = min(_Z_TABLE, key=lambda key: abs(key - service_level))
+    return _Z_TABLE[nearest]
+
+
+def _coerce_date(value: object) -> date | None:
+    """Coerce a point's ``date`` (ISO string in JSON-mode dumps, or a date)."""
+    if isinstance(value, date):
+        return value
+    if isinstance(value, str):
+        try:
+            return date.fromisoformat(value)
+        except ValueError:
+            return None
+    return None
+
+
+def forecast_peak_low(
+    points: list[dict[str, Any]],
+) -> tuple[date | None, float | None, date | None, float | None]:
+    """Return ``(peak_date, peak_demand, low_date, low_demand)`` over points.
+
+    Picks the max/min ``forecast`` value; ``(None, None, None, None)`` on an
+    empty forecast. Ties resolve to the first occurrence (deterministic).
+    """
+    if not points:
+        return (None, None, None, None)
+    peak = max(points, key=lambda p: float(p["forecast"]))
+    low = min(points, key=lambda p: float(p["forecast"]))
+    return (
+        _coerce_date(peak.get("date")),
+        float(peak["forecast"]),
+        _coerce_date(low.get("date")),
+        float(low["forecast"]),
+    )
+
+
+def _bias_direction(winner_bias: float | None) -> str:
+    """Plain-English direction phrase for a winner's bias sign."""
+    if winner_bias is None:
+        return "has no recorded bias measurement"
+    if winner_bias > 0:
+        return "under-forecasts (risk of stockouts)"
+    if winner_bias < 0:
+        return "over-forecasts (risk of overstock)"
+    return "is roughly unbiased"
+
+
+def compute_forecast_decision(
+    points: list[dict[str, Any]],
+    average_demand: float,
+    lead_time_days: int,
+    service_level: float,
+    winner_bias: float | None,
+) -> ForecastDecision:
+    """Build the deterministic, labeled inventory-decision heuristic.
+
+    ``sigma_daily`` is the POPULATION stdev of the forecast values; a flat or
+    single-point forecast yields ``sigma=0`` → ``safety_stock=0`` (honest, not
+    an error).
+    """
+    values = [float(p["forecast"]) for p in points]
+    sigma_daily = statistics.pstdev(values) if len(values) > 1 else 0.0
+    z = z_for_service_level(service_level)
+    safety_stock = z * sigma_daily * (lead_time_days**0.5)
+    expected_lt = average_demand * lead_time_days
+    bias_dir = _bias_direction(winner_bias)
+    if winner_bias is None:
+        bias_text = f"{BIAS_EXPLANATION} For this winner, bias {bias_dir}."
+    else:
+        bias_text = (
+            f"{BIAS_EXPLANATION} For this winner, bias {winner_bias:.2f} indicates it {bias_dir}."
+        )
+    return ForecastDecision(
+        lead_time_days=lead_time_days,
+        service_level=service_level,
+        z_value=z,
+        sigma_daily_demand=sigma_daily,
+        expected_demand_over_lead_time=expected_lt,
+        safety_stock=safety_stock,
+        reorder_point=expected_lt + safety_stock,
+        bias_risk_text=bias_text,
+        caveats=list(_CAVEATS),
+    )
diff --git a/app/features/model_selection/explanations.py b/app/features/model_selection/explanations.py
new file mode 100644
index 00000000..907b974a
--- /dev/null
+++ b/app/features/model_selection/explanations.py
@@ -0,0 +1,97 @@
+"""Deterministic business-explanation layer for the champion selector (#353).
+
+Pure functions — NO LLM, NO external call. Translates the numeric ranking +
+availability into short, deterministic English a business user can read. The
+output dict is persisted into ``model_selection_run.business_summary`` and
+echoed on the response.
+"""
+
+from __future__ import annotations
+
+from typing import Any
+
+from app.features.model_selection.schemas import PairAvailabilityResponse, RankingResult
+
+
+def _metric_phrase(metrics: dict[str, float] | None) -> str:
+    """One-line plain-English metric summary for a ranked model."""
+    if not metrics:
+        return "no metrics available"
+    return (
+        f"WAPE {metrics['wape']:.1f}%, sMAPE {metrics['smape']:.1f}, "
+        f"MAE {metrics['mae']:.2f}, bias {metrics['bias']:.2f}"
+    )
+
+
+def explain_winner(
+    ranking: RankingResult,
+    availability: PairAvailabilityResponse | None,
+) -> dict[str, Any]:
+    """Build the deterministic ``business_summary`` payload.
+
+    Always returns a dict; when there is no winner the summary explains why no
+    model could be recommended.
+    """
+    caveats = [
+        "Backtest accuracy reflects historical fit, not a guarantee of future performance.",
+        "Metrics measure correlation with past demand, not causation.",
+    ]
+
+    if availability is not None:
+        data_notes = [
+            f"Observed {availability.observed_days} of "
+            f"{availability.expected_calendar_days} calendar days "
+            f"({availability.coverage_ratio:.0%} coverage).",
+            f"Average daily demand {availability.average_daily_demand:.2f}.",
+        ]
+        data_notes.extend(availability.warnings)
+    else:
+        data_notes = ["No availability snapshot was computed."]
+
+    if ranking.winner is None:
+        return {
+            "headline": "No model could be recommended for this pair.",
+            "winner": None,
+            "recommendation_confidence": ranking.confidence,
+            "confidence_reasons": ranking.reasons,
+            "comparison": None,
+            "data_notes": data_notes,
+            "caveats": caveats,
+        }
+
+    winner = ranking.winner
+    headline = f"Recommended model: {winner.model_type} ({ranking.confidence} confidence)."
+
+    included = [e for e in ranking.entries if e.included]
+    runner_up = included[1] if len(included) > 1 else None
+    if runner_up is not None and runner_up.metrics and winner.metrics:
+        runner_wape = runner_up.metrics["wape"]
+        if runner_wape > 0:
+            lead = (runner_wape - winner.metrics["wape"]) / runner_wape
+            lead_text = f"{lead:.1%} lower WAPE than the runner-up ({runner_up.model_type})"
+        else:
+            lead_text = f"a comparable WAPE to the runner-up ({runner_up.model_type})"
+        comparison: dict[str, Any] = {
+            "runner_up_model_type": runner_up.model_type,
+            "runner_up_summary": _metric_phrase(runner_up.metrics),
+            "lead_text": lead_text,
+        }
+    else:
+        comparison = {
+            "runner_up_model_type": None,
+            "runner_up_summary": None,
+            "lead_text": "no runner-up was available for comparison",
+        }
+
+    return {
+        "headline": headline,
+        "winner": {
+            "model_type": winner.model_type,
+            "summary": _metric_phrase(winner.metrics),
+        },
+        "recommendation_confidence": ranking.confidence,
+        "confidence_reasons": ranking.reasons,
+        "comparison": comparison,
+        "data_notes": data_notes,
+        "caveats": caveats,
+    }
diff --git a/app/features/model_selection/models.py b/app/features/model_selection/models.py
new file mode 100644
index 00000000..8d987a58
--- /dev/null
+++ b/app/features/model_selection/models.py
@@ -0,0 +1,199 @@
+"""ORM models for the Forecast Champion Selector slice (issue #353).
+
+One table — ``model_selection_run`` — records one ``POST /model-selection/run``
+invocation as an auditable artifact. Mirrors ``app/features/batch/models.py``
+for shape: ``TimestampMixin`` + ``Base``, a string status column with an
+allow-list ``CheckConstraint`` in ``__table_args__``, and JSONB columns for the
+flexible audit snapshots (candidate configs, policy, availability, ranking,
+per-candidate results, chart data, winner metrics, forecast summary, business
+summary).
+"""
+
+from __future__ import annotations
+
+import datetime as _dt
+from enum import Enum
+from typing import Any
+
+from sqlalchemy import (
+    Boolean,
+    CheckConstraint,
+    Date,
+    DateTime,
+    ForeignKey,
+    Index,
+    Integer,
+    String,
+)
+from sqlalchemy.dialects.postgresql import JSONB
+from sqlalchemy.orm import Mapped, mapped_column
+
+from app.core.database import Base
+from app.shared.models import TimestampMixin
+
+
+class ModelSelectionStatus(str, Enum):
+    """Lifecycle states of a selection run.
+
+    Transitions:
+    - PENDING -> RUNNING -> {COMPLETED, PARTIAL, FAILED, CANCELLED}
+    - PARTIAL fires when >=1 candidate succeeded AND >=1 candidate failed/cancelled.
+    - FAILED fires when availability is unusable (fail-fast) OR every
+      candidate's backtest errored (no valid winner).
+    - CANCELLED (Slice B) fires when a cancel drained before any candidate
+      reached a non-cancelled terminal state.
+    """
+
+    PENDING = "pending"
+    RUNNING = "running"
+    COMPLETED = "completed"
+    PARTIAL = "partial"
+    FAILED = "failed"
+    CANCELLED = "cancelled"
+
+
+# Statuses a selection run cannot transition out of — the DELETE-route 409 set
+# (Slice B). Mirrors ``batch.models.TERMINAL_BATCH_STATES``.
+TERMINAL_SELECTION_STATES: frozenset[str] = frozenset(
+    {
+        ModelSelectionStatus.COMPLETED.value,
+        ModelSelectionStatus.PARTIAL.value,
+        ModelSelectionStatus.FAILED.value,
+        ModelSelectionStatus.CANCELLED.value,
+    }
+)
+
+
+class CandidateStatus(str, Enum):
+    """Per-candidate execution states inside an async selection run (Slice B)."""
+
+    PENDING = "pending"
+    RUNNING = "running"
+    COMPLETED = "completed"
+    FAILED = "failed"
+    CANCELLED = "cancelled"
+
+
+class ModelSelectionRun(TimestampMixin, Base):
+    """A single champion-selection run over one (store, product) pair.
+
+    ``candidate_results`` carries the full per-candidate detail (incl. fold
+    actuals/predictions) so a ``GET`` rebuilds the same ``chart_data`` payload
+    the originating ``/run`` returned. ``chart_data`` caches the computed
+    chart-ready payload so the read path needs no recomputation.
+    """
+
+    __tablename__ = "model_selection_run"
+
+    id: Mapped[int] = mapped_column(Integer, primary_key=True)
+    selection_id: Mapped[str] = mapped_column(String(32), unique=True, index=True)
+    store_id: Mapped[int] = mapped_column(Integer, index=True)
+    product_id: Mapped[int] = mapped_column(Integer, index=True)
+    start_date: Mapped[_dt.date] = mapped_column(Date)
+    end_date: Mapped[_dt.date] = mapped_column(Date)
+    forecast_horizon: Mapped[int] = mapped_column(Integer)
+    ranking_metric: Mapped[str] = mapped_column(String(20))
+    status: Mapped[str] = mapped_column(
+        String(20), default=ModelSelectionStatus.PENDING.value, index=True
+    )
+    candidate_models: Mapped[list[dict[str, Any]]] = mapped_column(JSONB, nullable=False)
+    policy_snapshot: Mapped[dict[str, Any]] = mapped_column(JSONB, nullable=False)
+    availability_snapshot: Mapped[dict[str, Any] | None] = mapped_column(JSONB, nullable=True)
+    ranking_result: Mapped[dict[str, Any] | None] = mapped_column(JSONB, nullable=True)
+    candidate_results: Mapped[list[dict[str, Any]] | None] = mapped_column(JSONB, nullable=True)
+    chart_data: Mapped[dict[str, Any] | None] = mapped_column(JSONB, nullable=True)
+    winner_model_type: Mapped[str | None] = mapped_column(String(40), nullable=True)
+    winner_metrics: Mapped[dict[str, Any] | None] = mapped_column(JSONB, nullable=True)
+    final_model_path: Mapped[str | None] = mapped_column(String(512), nullable=True)
+    forecast_result: Mapped[dict[str, Any] | None] = mapped_column(JSONB, nullable=True)
+    business_summary: Mapped[dict[str, Any] | None] = mapped_column(JSONB, nullable=True)
+    error_message: Mapped[str | None] = mapped_column(String(2000), nullable=True)
+    # Slice B (async) — set when the run starts executing; the four count
+    # columns cache the FINAL per-status candidate tally written once at settle
+    # (live progress is derived from a GROUP BY over the child rows).
+    started_at: Mapped[_dt.datetime | None] = mapped_column(DateTime(timezone=True), nullable=True)
+    total_candidates: Mapped[int] = mapped_column(Integer, default=0, server_default="0")
+    completed_candidates: Mapped[int] = mapped_column(Integer, default=0, server_default="0")
+    failed_candidates: Mapped[int] = mapped_column(Integer, default=0, server_default="0")
+    cancelled_candidates: Mapped[int] = mapped_column(Integer, default=0, server_default="0")
+    completed_at: Mapped[_dt.datetime | None] = mapped_column(
+        DateTime(timezone=True), nullable=True
+    )
+    # Slice C (forecast decision + operationalization) — all additive.
+    # ``trained_model_type`` records which model the final bundle holds (the
+    # ranked winner, or a user override); ``is_override`` flags a non-recommended
+    # choice; the promotion columns capture the approval-gated registry handoff.
+    trained_model_type: Mapped[str | None] = mapped_column(String(40), nullable=True)
+    is_override: Mapped[bool] = mapped_column(
+        Boolean, default=False, server_default="false", nullable=False
+    )
+    override_reason: Mapped[str | None] = mapped_column(String(2000), nullable=True)
+    champion_run_id: Mapped[str | None] = mapped_column(String(32), nullable=True)
+    promoted_alias: Mapped[str | None] = mapped_column(String(100), nullable=True)
+    promotion_decision: Mapped[dict[str, Any] | None] = mapped_column(JSONB, nullable=True)
+    # M1 — V2 promotion support: the request's feature_frame_version persisted at
+    # run-creation so train/promote carry the REAL version end-to-end. The
+    # server_default '1' backfills legacy rows ONLY (it is not a code hardcode).
+    feature_frame_version: Mapped[int] = mapped_column(
+        Integer, default=1, server_default="1", nullable=False
+    )
+
+    __table_args__ = (
+        CheckConstraint(
+            "status IN ('pending', 'running', 'completed', 'partial', 'failed', 'cancelled')",
+            name="ck_model_selection_run_valid_status",
+        ),
+        Index(
+            "ix_model_selection_run_store_product_created",
+            "store_id",
+            "product_id",
+            "created_at",
+        ),
+        Index("ix_model_selection_run_status_created", "status", "created_at"),
+    )
+
+
+class ModelSelectionCandidate(TimestampMixin, Base):
+    """One candidate's async execution record inside a selection run (Slice B).
+
+    Concurrent candidate tasks each write their OWN row in their OWN session —
+    no shared-row write race. ``result`` carries the full ``CandidateResult``
+    JSONB (incl. folds) on success; failed/cancelled candidates keep their row
+    so they stay visible in the results UI. Mirrors ``batch.BatchJobItem``.
+    """
+
+    __tablename__ = "model_selection_candidate"
+
+    id: Mapped[int] = mapped_column(Integer, primary_key=True)
+    candidate_id: Mapped[str] = mapped_column(String(32), unique=True, index=True)
+    selection_id: Mapped[str] = mapped_column(
+        String(32),
+        ForeignKey("model_selection_run.selection_id", ondelete="CASCADE"),
+        index=True,
+    )
+    ordinal: Mapped[int] = mapped_column(Integer)  # submit order — stable display
+    model_type: Mapped[str] = mapped_column(String(40))
+    params: Mapped[dict[str, Any]] = mapped_column(JSONB, nullable=False)
+    status: Mapped[str] = mapped_column(
+        String(20), default=CandidateStatus.PENDING.value, index=True
+    )
+    result: Mapped[dict[str, Any] | None] = mapped_column(JSONB, nullable=True)
+    error_message: Mapped[str | None] = mapped_column(String(2000), nullable=True)
+    error_type: Mapped[str | None] = mapped_column(String(100), nullable=True)
+    started_at: Mapped[_dt.datetime | None] = mapped_column(DateTime(timezone=True), nullable=True)
+    completed_at: Mapped[_dt.datetime | None] = mapped_column(
+        DateTime(timezone=True), nullable=True
+    )
+    duration_ms: Mapped[int | None] = mapped_column(Integer, nullable=True)
+
+    __table_args__ = (
+        CheckConstraint(
+            "status IN ('pending', 'running', 'completed', 'failed', 'cancelled')",
+            name="ck_model_selection_candidate_valid_status",
+        ),
+        Index(
+            "ix_model_selection_candidate_selection_status",
+            "selection_id",
+            "status",
+        ),
+    )
diff --git a/app/features/model_selection/ranking.py b/app/features/model_selection/ranking.py
new file mode 100644
index 00000000..ecca7587
--- /dev/null
+++ b/app/features/model_selection/ranking.py
@@ -0,0 +1,283 @@
+"""Pure ranking + confidence logic for the champion selector (issue #353).
+
+No DB, no I/O — every function here is deterministic and unit-tested directly.
+The ranking key and confidence policy implement the PRP's LOCKED decision #6
+(deterministic tie-break chain) and the relative-improvement confidence model.
+"""
+
+from __future__ import annotations
+
+import math
+from dataclasses import dataclass
+
+from app.features.model_selection.schemas import (
+    CandidateResult,
+    ChartData,
+    ConfidenceLevel,
+    FoldChart,
+    ModelRankEntry,
+    RankingPolicy,
+    RankingResult,
+)
+
+# Below this relative WAPE lead over second place, the winner is a near-tie and
+# confidence is capped at LOW (the lead is not meaningful).
+NEAR_TIE_EPSILON = 0.02
+
+# The metric keys that MUST be finite for a candidate to be rankable. rmse is
+# carried for the contract but not required (it never enters the sort key).
+_REQUIRED_FINITE = ("wape", "smape", "mae", "bias")
+
+
+@dataclass(frozen=True)
+class NormalizedMetrics:
+    """The five backtest metrics plus the derived sample size, all floats."""
+
+    wape: float
+    smape: float
+    mae: float
+    rmse: float
+    bias: float
+    sample_size: int
+
+    def as_dict(self) -> dict[str, float]:
+        """Stable 6-key dict embedded in ``ModelRankEntry.metrics``."""
+        return {
+            "wape": self.wape,
+            "smape": self.smape,
+            "mae": self.mae,
+            "rmse": self.rmse,
+            "bias": self.bias,
+            "sample_size": float(self.sample_size),
+        }
+
+
+def _is_finite(value: float) -> bool:
+    return not (math.isnan(value) or math.isinf(value))
+
+
+def normalize_metrics(
+    aggregated_metrics: dict[str, float] | None,
+    sample_size: int,
+) -> NormalizedMetrics | None:
+    """Coerce a raw 5-key backtest metric dict into ``NormalizedMetrics``.
+
+    Returns ``None`` (candidate is unrankable) when the dict is missing/empty or
+    when any of the sort-key metrics (wape, smape, mae, bias) is NaN/inf — e.g.
+    a WAPE of ``inf`` from an all-zero actual window.
+    """
+    if not aggregated_metrics:
+        return None
+
+    def _g(key: str) -> float:
+        raw = aggregated_metrics.get(key)
+        return float(raw) if raw is not None else math.nan
+
+    metrics = NormalizedMetrics(
+        wape=_g("wape"),
+        smape=_g("smape"),
+        mae=_g("mae"),
+        rmse=_g("rmse"),
+        bias=_g("bias"),
+        sample_size=sample_size,
+    )
+    if not all(_is_finite(getattr(metrics, name)) for name in _REQUIRED_FINITE):
+        return None
+    return metrics
+
+
+def _primary_value(metrics: NormalizedMetrics, ranking_metric: str) -> float:
+    """Value of the primary ranking metric (``bias`` ranks by magnitude)."""
+    if ranking_metric == "bias":
+        return abs(metrics.bias)
+    return float(getattr(metrics, ranking_metric))
+
+
+def _sort_key(
+    metrics: NormalizedMetrics, model_type: str, ranking_metric: str
+) -> tuple[float, float, float, float, str]:
+    """Deterministic sort key (LOCKED #6).
+
+    Primary = the chosen ranking metric, then the fixed tie-break chain
+    ``wape -> smape -> abs(bias) -> mae -> model_type`` with the primary metric
+    removed from the chain so it is never duplicated.
+    """
+    chain: list[tuple[str, float]] = [
+        ("wape", metrics.wape),
+        ("smape", metrics.smape),
+        ("bias", abs(metrics.bias)),
+        ("mae", metrics.mae),
+    ]
+    key: list[float] = [_primary_value(metrics, ranking_metric)]
+    key.extend(value for name, value in chain if name != ranking_metric)
+    return (key[0], key[1], key[2], key[3], model_type)
+
+
+def rank_candidates(
+    results: list[CandidateResult],
+    policy: RankingPolicy,
+    ranking_metric: str = "wape",
+    availability_status: str | None = None,
+) -> RankingResult:
+    """Rank completed candidates and pick a deterministic winner.
+
+    Failed/filtered candidates are never hidden — they appear as excluded
+    ``ModelRankEntry`` rows (``rank=None``) after the ranked winners.
+    """
+    valid: list[tuple[CandidateResult, NormalizedMetrics]] = []
+    excluded: list[ModelRankEntry] = []
+
+    for result in results:
+        if result.failed:
+            excluded.append(_excluded_entry(result, result.error or "candidate backtest failed"))
+            continue
+        metrics = normalize_metrics(result.aggregated_metrics, result.sample_size)
+        if metrics is None:
+            excluded.append(_excluded_entry(result, "missing or non-finite primary metric"))
+            continue
+        if metrics.sample_size < policy.minimum_sample_size:
+            excluded.append(
+                _excluded_entry(
+                    result,
+                    f"sample_size {metrics.sample_size} below minimum {policy.minimum_sample_size}",
+                )
+            )
+            continue
+        valid.append((result, metrics))
+
+    if not valid:
+        return RankingResult(
+            winner=None,
+            entries=excluded,
+            confidence="low",
+            reasons=["No candidate produced a valid backtest."],
+        )
+
+    ordered = sorted(valid, key=lambda pair: _sort_key(pair[1], pair[0].model_type, ranking_metric))
+    ranked_entries = [
+        ModelRankEntry(
+            rank=index + 1,
+            model_type=result.model_type,
+            params=result.params,
+            included=True,
+            metrics=metrics.as_dict(),
+        )
+        for index, (result, metrics) in enumerate(ordered)
+    ]
+
+    confidence, reasons = _confidence(ordered, policy, availability_status)
+
+    return RankingResult(
+        winner=ranked_entries[0],
+        entries=ranked_entries + excluded,
+        confidence=confidence,
+        reasons=reasons,
+    )
+
+
+def _excluded_entry(result: CandidateResult, reason: str) -> ModelRankEntry:
+    return ModelRankEntry(
+        rank=None,
+        model_type=result.model_type,
+        params=result.params,
+        included=False,
+        exclusion_reason=reason,
+        metrics=None,
+    )
+
+
+def _confidence(
+    ordered: list[tuple[CandidateResult, NormalizedMetrics]],
+    policy: RankingPolicy,
+    availability_status: str | None,
+) -> tuple[ConfidenceLevel, list[str]]:
+    """Derive the recommendation confidence from the ranked candidates.
+
+    Order of checks: a single valid candidate, limited availability, or an
+    over-threshold winner bias all cap confidence at LOW; a clear WAPE lead with
+    acceptable bias is HIGH; everything in between is MEDIUM.
+    """
+    reasons: list[str] = []
+    winner_metrics = ordered[0][1]
+
+    if len(ordered) == 1:
+        reasons.append("Only one candidate produced a valid backtest.")
+        return "low", reasons
+
+    second_metrics = ordered[1][1]
+    if second_metrics.wape > 0:
+        rel_improvement = (second_metrics.wape - winner_metrics.wape) / second_metrics.wape
+    else:
+        rel_improvement = 0.0
+
+    bias_ok = abs(winner_metrics.bias) <= policy.max_acceptable_abs_bias
+
+    if availability_status == "limited":
+        reasons.append("Data availability is limited; treat the recommendation cautiously.")
+        return "low", reasons
+    if not bias_ok:
+        reasons.append(
+            f"Winner bias {winner_metrics.bias:.3f} exceeds the acceptable bound "
+            f"{policy.max_acceptable_abs_bias:.3f}."
+        )
+        return "low", reasons
+    if rel_improvement < NEAR_TIE_EPSILON:
+        reasons.append(f"Winner WAPE lead over second place is {rel_improvement:.1%} — a near tie.")
+        return "low", reasons
+    if rel_improvement >= policy.high_confidence_rel_improvement:
+        reasons.append(
+            f"Winner WAPE beats second place by {rel_improvement:.1%} "
+            f"(>= {policy.high_confidence_rel_improvement:.0%})."
+        )
+        return "high", reasons
+
+    reasons.append(
+        f"Winner leads second place by {rel_improvement:.1%}, below the "
+        f"{policy.high_confidence_rel_improvement:.0%} high-confidence threshold."
+    )
+    return "medium", reasons
+
+
+def _fold_wape(actuals: list[float], predictions: list[float]) -> float:
+    """WAPE (%) for one fold; 0.0 when the actual window sums to zero."""
+    denominator = sum(abs(a) for a in actuals)
+    if denominator == 0:
+        return 0.0
+    numerator = sum(abs(a - p) for a, p in zip(actuals, predictions, strict=False))
+    return numerator / denominator * 100.0
+
+
+def build_chart_data(results: list[CandidateResult], ranking: RankingResult) -> ChartData:
+    """Assemble the chart-ready comparison payload from candidate results.
+
+    Keyed by ``model_type``; when a candidate list repeats a model_type the last
+    occurrence wins (acceptable for v1 — duplicate model_types are uncommon).
+    """
+    by_type: dict[str, CandidateResult] = {r.model_type: r for r in results}
+    wape_by_model: dict[str, float] = {}
+    bias_by_model: dict[str, float] = {}
+    fold_stability: dict[str, list[float]] = {}
+
+    for entry in ranking.entries:
+        if not entry.included or entry.metrics is None:
+            continue
+        wape_by_model[entry.model_type] = entry.metrics["wape"]
+        bias_by_model[entry.model_type] = entry.metrics["bias"]
+        result = by_type.get(entry.model_type)
+        if result is not None:
+            fold_stability[entry.model_type] = [
+                _fold_wape(fold.actuals, fold.predictions) for fold in result.folds
+            ]
+
+    winner_folds: list[FoldChart] = []
+    if ranking.winner is not None:
+        winner_result = by_type.get(ranking.winner.model_type)
+        if winner_result is not None:
+            winner_folds = winner_result.folds
+
+    return ChartData(
+        wape_by_model=wape_by_model,
+        bias_by_model=bias_by_model,
+        fold_stability=fold_stability,
+        winner_actual_vs_predicted=winner_folds,
+    )
diff --git a/app/features/model_selection/routes.py b/app/features/model_selection/routes.py
new file mode 100644
index 00000000..61a0cb8e
--- /dev/null
+++ b/app/features/model_selection/routes.py
@@ -0,0 +1,338 @@
+"""FastAPI routes for the Forecast Champion Selector slice (issue #353).
+
+Endpoints (all under ``/model-selection``):
+- GET  /availability            — pair data-availability assessment
+- POST /run                     — run candidate comparison + ranking (200)
+- GET  /{selection_id}          — fetch a persisted selection run
+- GET  /{selection_id}/ranking  — fetch just the ranking block
+- POST /{selection_id}/train-winner — train the winning model
+- POST /{selection_id}/train-selected — train a user-chosen candidate (override)
+- POST /{selection_id}/predict  — forecast with the trained winner + decision
+- POST /{selection_id}/promote  — promote the trained champion to a registry alias
+
+Error mapping mirrors ``app/features/backtesting/routes.py``: ``ValueError`` →
+``BadRequestError`` (RFC 7807 400), ``SQLAlchemyError`` → ``DatabaseError`` (500).
+``NotFoundError`` / ``BadRequestError`` raised inside the service are
+``ForecastLabError`` subclasses and bubble straight to the global handler.
+"""
+
+from __future__ import annotations
+
+from fastapi import APIRouter, Body, Depends, Query, Response, status
+from sqlalchemy.exc import SQLAlchemyError
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from app.core.database import get_db
+from app.core.exceptions import BadRequestError, DatabaseError
+from app.core.logging import get_logger
+from app.features.model_selection.schemas import (
+    ForecastDecisionParams,
+    ModelCatalogResponse,
+    ModelSelectionRunRequest,
+    ModelSelectionRunResponse,
+    PairAvailabilityResponse,
+    PredictWinnerResponse,
+    PromoteRequest,
+    PromoteResponse,
+    RankingResult,
+    SubmitRunResponse,
+    TrainSelectedRequest,
+    TrainWinnerResponse,
+)
+from app.features.model_selection.service import ModelSelectionService
+
+logger = get_logger(__name__)
+
+router = APIRouter(prefix="/model-selection", tags=["model-selection"])
+
+
+@router.get(
+    "/availability",
+    response_model=PairAvailabilityResponse,
+    status_code=status.HTTP_200_OK,
+    summary="Assess data availability for a (store, product) pair",
+)
+async def get_availability(
+    store_id: int = Query(..., ge=1, description="Store ID"),
+    product_id: int = Query(..., ge=1, description="Product ID"),
+    forecast_horizon: int = Query(14, ge=1, le=90, description="Forecast horizon in days"),
+    db: AsyncSession = Depends(get_db),
+) -> PairAvailabilityResponse:
+    """Return coverage, demand, promotion, and a recommended split config."""
+    service = ModelSelectionService()
+    try:
+        return await service.get_availability(db, store_id, product_id, forecast_horizon)
+    except ValueError as exc:
+        raise BadRequestError(message=str(exc)) from exc
+    except SQLAlchemyError as exc:
+        raise DatabaseError(
+            message="Failed to assess availability", details={"error": str(exc)}
+        ) from exc
+
+
+@router.get(
+    "/models",
+    response_model=ModelCatalogResponse,
+    status_code=status.HTTP_200_OK,
+    summary="List the backend-owned candidate-model capability catalog",
+)
+async def get_model_catalog() -> ModelCatalogResponse:
+    """Return the static candidate-model catalog (no DB, no query params).
+
+    Declared BEFORE ``GET /{selection_id}`` so Starlette matches the literal
+    ``/models`` path and does not capture it as ``selection_id="models"``.
+    """
+    service = ModelSelectionService()
+    return service.get_model_catalog()
+
+
+@router.post(
+    "/runs",
+    response_model=SubmitRunResponse,
+    status_code=status.HTTP_202_ACCEPTED,
+    summary="Submit an async candidate comparison (fire-and-forget LRO)",
+)
+async def submit_run(
+    request: ModelSelectionRunRequest,
+    response: Response,
+    db: AsyncSession = Depends(get_db),
+) -> SubmitRunResponse:
+    """Submit an async selection run — returns 202 with monitor/cancel pointers.
+
+    The candidate backtests run in a detached task; poll
+    ``GET /model-selection/{selection_id}`` for live progress, terminal ranking,
+    and the winner.
+    """
+    logger.info(
+        "model_selection.runs_request_received",
+        store_id=request.store_id,
+        product_id=request.product_id,
+        n_candidates=len(request.candidate_models),
+    )
+    service = ModelSelectionService()
+    try:
+        result = await service.submit_run(db, request)
+        response.headers["Location"] = result.monitor_url
+        response.headers["Retry-After"] = "2"
+        return result
+    except ValueError as exc:
+        raise BadRequestError(message=str(exc)) from exc
+    except SQLAlchemyError as exc:
+        raise DatabaseError(
+            message="Failed to submit selection run", details={"error": str(exc)}
+        ) from exc
+
+
+@router.post(
+    "/run",
+    response_model=ModelSelectionRunResponse,
+    status_code=status.HTTP_200_OK,
+    summary="Run candidate model comparison and select a champion",
+)
+async def run_selection(
+    request: ModelSelectionRunRequest,
+    db: AsyncSession = Depends(get_db),
+) -> ModelSelectionRunResponse:
+    """Validate availability, backtest candidates, rank, and persist the run."""
+    logger.info(
+        "model_selection.request_received",
+        store_id=request.store_id,
+        product_id=request.product_id,
+        n_candidates=len(request.candidate_models),
+        ranking_metric=request.ranking_metric,
+    )
+    service = ModelSelectionService()
+    try:
+        return await service.run_selection(db, request)
+    except ValueError as exc:
+        raise BadRequestError(message=str(exc)) from exc
+    except SQLAlchemyError as exc:
+        raise DatabaseError(
+            message="Failed to run model selection", details={"error": str(exc)}
+        ) from exc
+
+
+@router.get(
+    "/{selection_id}",
+    response_model=ModelSelectionRunResponse,
+    status_code=status.HTTP_200_OK,
+    summary="Fetch a persisted selection run",
+)
+async def get_selection(
+    selection_id: str,
+    db: AsyncSession = Depends(get_db),
+) -> ModelSelectionRunResponse:
+    """Return the full persisted selection run by id (404 when missing)."""
+    service = ModelSelectionService()
+    try:
+        return await service.get_selection(db, selection_id)
+    except SQLAlchemyError as exc:
+        raise DatabaseError(
+            message="Failed to fetch selection run", details={"error": str(exc)}
+        ) from exc
+
+
+@router.delete(
+    "/{selection_id}",
+    response_model=ModelSelectionRunResponse,
+    status_code=status.HTTP_200_OK,
+    summary="Cancel an in-flight selection run (cooperative drain)",
+    description=(
+        "Cooperatively cancel an async selection run (Slice B). Pending "
+        "candidates skip; running candidates observe ``asyncio.CancelledError`` "
+        "at the next safe yield — sklearn / LightGBM fits are uncancellable "
+        "mid-call, so an in-flight fit may finish first. Returns:\n\n"
+        "- ``200`` settled run on a clean drain\n"
+        "- ``404`` RFC 7807 if the run does not exist\n"
+        "- ``409`` RFC 7807 if the run is already terminal\n"
+        "- ``504`` RFC 7807 if the drain exceeds "
+        "``Settings.model_selection_cancel_drain_timeout_seconds``"
+    ),
+)
+async def cancel_run(
+    selection_id: str,
+    db: AsyncSession = Depends(get_db),
+) -> ModelSelectionRunResponse:
+    """Cancel an in-flight selection run and return its settled record.
+
+    ``NotFoundError`` (404) / ``ConflictError`` (409) / ``GatewayTimeoutError``
+    (504) raised in-service bubble to the global RFC 7807 handler.
+    """
+    service = ModelSelectionService()
+    try:
+        return await service.cancel_run(db, selection_id)
+    except SQLAlchemyError as exc:
+        raise DatabaseError(
+            message="Failed to cancel selection run", details={"error": str(exc)}
+        ) from exc
+
+
+@router.get(
+    "/{selection_id}/ranking",
+    response_model=RankingResult,
+    status_code=status.HTTP_200_OK,
+    summary="Fetch the ranking block for a selection run",
+)
+async def get_ranking(
+    selection_id: str,
+    db: AsyncSession = Depends(get_db),
+) -> RankingResult:
+    """Return just the ranking (winner, entries, confidence, reasons)."""
+    service = ModelSelectionService()
+    try:
+        return await service.get_ranking(db, selection_id)
+    except SQLAlchemyError as exc:
+        raise DatabaseError(message="Failed to fetch ranking", details={"error": str(exc)}) from exc
+
+
+@router.post(
+    "/{selection_id}/train-winner",
+    response_model=TrainWinnerResponse,
+    status_code=status.HTTP_200_OK,
+    summary="Train the winning model for a selection run",
+)
+async def train_winner(
+    selection_id: str,
+    db: AsyncSession = Depends(get_db),
+) -> TrainWinnerResponse:
+    """Train the champion and store its model bundle path."""
+    service = ModelSelectionService()
+    try:
+        return await service.train_winner(db, selection_id)
+    except ValueError as exc:
+        raise BadRequestError(message=str(exc)) from exc
+    except SQLAlchemyError as exc:
+        raise DatabaseError(
+            message="Failed to train winning model", details={"error": str(exc)}
+        ) from exc
+
+
+@router.post(
+    "/{selection_id}/train-selected",
+    response_model=TrainWinnerResponse,
+    status_code=status.HTTP_200_OK,
+    summary="Train a user-chosen candidate (override)",
+)
+async def train_selected(
+    selection_id: str,
+    request: TrainSelectedRequest,
+    db: AsyncSession = Depends(get_db),
+) -> TrainWinnerResponse:
+    """Train a chosen candidate (override). A non-candidate ``model_type`` → 400.
+
+    Overriding the recommended winner returns ``is_override=true`` plus an
+    ``override_warning`` and records the override reason on the run.
+    """
+    service = ModelSelectionService()
+    try:
+        return await service.train_selected(
+            db, selection_id, request.model_type, request.override_reason
+        )
+    except ValueError as exc:
+        raise BadRequestError(message=str(exc)) from exc
+    except SQLAlchemyError as exc:
+        raise DatabaseError(
+            message="Failed to train selected model", details={"error": str(exc)}
+        ) from exc
+
+
+@router.post(
+    "/{selection_id}/predict",
+    response_model=PredictWinnerResponse,
+    status_code=status.HTTP_200_OK,
+    summary="Forecast with the trained model + inventory decision",
+)
+async def predict_winner(
+    selection_id: str,
+    request: ForecastDecisionParams | None = Body(default=None),
+    db: AsyncSession = Depends(get_db),
+) -> PredictWinnerResponse:
+    """Generate a horizon forecast + a labeled safety-stock decision heuristic.
+
+    The body is OPTIONAL — an empty body uses ``ForecastDecisionParams``
+    defaults (lead_time_days=7, service_level=0.95). A feature-aware model 400s
+    (use the What-If Planner instead).
+    """
+    params = request or ForecastDecisionParams()
+    service = ModelSelectionService()
+    try:
+        forecast, decision = await service.predict_winner(
+            db, selection_id, params.lead_time_days, params.service_level
+        )
+        return PredictWinnerResponse(
+            selection_id=selection_id, forecast=forecast, decision=decision
+        )
+    except ValueError as exc:
+        raise BadRequestError(message=str(exc)) from exc
+    except SQLAlchemyError as exc:
+        raise DatabaseError(
+            message="Failed to forecast with winning model", details={"error": str(exc)}
+        ) from exc
+
+
+@router.post(
+    "/{selection_id}/promote",
+    response_model=PromoteResponse,
+    status_code=status.HTTP_200_OK,
+    summary="Promote the trained champion to a registry alias (approval-gated)",
+)
+async def promote(
+    selection_id: str,
+    request: PromoteRequest,
+    db: AsyncSession = Depends(get_db),
+) -> PromoteResponse:
+    """Register a SUCCESS model run + alias for the trained champion.
+
+    Approval-gated + audited: requires ``approved_by``; a non-recommended model
+    requires ``acknowledge_non_recommended=true`` (else 422); promoting before
+    training → 422; a bad ``alias_name`` → 422 at the schema boundary.
+    """
+    service = ModelSelectionService()
+    try:
+        return await service.promote(db, selection_id, request)
+    except ValueError as exc:
+        raise BadRequestError(message=str(exc)) from exc
+    except SQLAlchemyError as exc:
+        raise DatabaseError(
+            message="Failed to promote champion", details={"error": str(exc)}
+        ) from exc
diff --git a/app/features/model_selection/runner.py b/app/features/model_selection/runner.py
new file mode 100644
index 00000000..7320ea03
--- /dev/null
+++ b/app/features/model_selection/runner.py
@@ -0,0 +1,312 @@
+"""Bounded-concurrency candidate runner for the champion selector (Slice B).
+
+A slice-local mirror of ``app/features/batch/runner.py``: one
+:class:`asyncio.Semaphore` inside an :class:`asyncio.TaskGroup` fans out one
+task per ``model_selection_candidate``; each child opens its own
+``AsyncSession`` and observes a cooperative :class:`asyncio.Event` so
+``DELETE /model-selection/{selection_id}`` cancels what hasn't started and
+gracefully drains what has.
+
+The asyncio mechanics (the three cancel mechanisms, the
+``except* asyncio.CancelledError`` PEP-654 catch shape, the per-task cancel +
+cooperative event) are documented in
+``PRPs/ai_docs/asyncio-taskgroup-cancellation.md``.
+
+Cross-slice rule: this module imports from ``app.features.model_selection.models``
+(same slice) and ``app.core.*`` only — it does NOT import the batch runner
+(vertical-slice rule). The per-child ``execute_candidate`` callable supplied by
+``ModelSelectionService`` is the seam that keeps the heavy backtest work out of
+this module.
+"""
+
+from __future__ import annotations
+
+import asyncio
+from collections.abc import Awaitable, Callable
+from dataclasses import dataclass, field
+from datetime import UTC, datetime
+from typing import TYPE_CHECKING
+
+from sqlalchemy import select, update
+
+from app.core.logging import get_logger
+from app.features.model_selection.models import (
+    CandidateStatus,
+    ModelSelectionCandidate,
+)
+
+if TYPE_CHECKING:
+    from sqlalchemy.ext.asyncio import AsyncSession, async_sessionmaker
+
+
+logger = get_logger(__name__)
+
+
+@dataclass
+class CancelHandle:
+    """Cancel signal + Task refs + completion event for an in-flight selection.
+
+    Created by :func:`run_selection_candidates`, looked up by
+    :func:`cancel_selection`, removed from :data:`_ACTIVE_SELECTIONS` and
+    signalled by the runner's caller via :func:`mark_completed` *after* the
+    parent's settle has committed — so ``DELETE`` never observes the parent
+    mid-settle.
+    """
+
+    cancel_event: asyncio.Event = field(default_factory=asyncio.Event)
+    completed_event: asyncio.Event = field(default_factory=asyncio.Event)
+    tasks: list[asyncio.Task[None]] = field(default_factory=list)
+
+
+# Module-level registry — single-process scope (matches the single-host vision).
+_ACTIVE_SELECTIONS: dict[str, CancelHandle] = {}
+
+
+def register_selection(selection_id: str) -> CancelHandle:
+    """Eagerly create (or reuse) the cancel handle for a selection.
+
+    Called by the service the moment ``POST /runs`` commits — BEFORE the
+    detached worker starts — so a ``DELETE`` arriving in the gap between the 202
+    response and the worker's first ``run_selection_candidates`` call still
+    finds a handle (and is not misreported as "already settled"). The worker's
+    ``setdefault`` reuses this same handle.
+    """
+    return _ACTIVE_SELECTIONS.setdefault(selection_id, CancelHandle())
+
+
+async def run_selection_candidates(
+    *,
+    selection_id: str,
+    candidate_ids: list[str],
+    max_parallel: int,
+    global_max_parallel: int,
+    session_maker: async_sessionmaker[AsyncSession],
+    execute_candidate: Callable[[str], Awaitable[None]],
+) -> int:
+    """Execute one selection's candidates through a bounded TaskGroup.
+
+    Args:
+        selection_id: ``model_selection_run.selection_id`` — registry key + log
+            correlator.
+        candidate_ids: ``model_selection_candidate.candidate_id`` values, in
+            submit order.
+        max_parallel: per-run cap (Slice B passes the global setting — there is
+            no per-run field).
+        global_max_parallel: host-wide cap from
+            :attr:`Settings.model_selection_global_max_parallel`.
+        session_maker: shared ``async_sessionmaker``; each child opens one
+            ``AsyncSession`` from it for the state-transition writes the runner
+            emits. The caller-supplied ``execute_candidate`` opens its OWN
+            session from the same maker.
+        execute_candidate: one-arg coroutine; runs one candidate's backtest +
+            persists its result/failure in its own session.
+
+    Returns:
+        ``effective = min(max_parallel, global_max_parallel)``.
+
+    Notes:
+        - Caller MUST call :func:`mark_completed` after the parent settle
+          commits (even on the exception path).
+        - Cancellation does NOT propagate out: ``except* asyncio.CancelledError``
+          absorbs the ``ExceptionGroup`` so the caller can settle the parent.
+    """
+    effective = min(max_parallel, global_max_parallel)
+    sem = asyncio.Semaphore(effective)
+    handle = _ACTIVE_SELECTIONS.setdefault(selection_id, CancelHandle())
+
+    logger.info(
+        "model_selection.runner_start",
+        selection_id=selection_id,
+        total_candidates=len(candidate_ids),
+        max_parallel=max_parallel,
+        effective_max_parallel=effective,
+    )
+
+    async def _child(candidate_id: str) -> None:
+        # One ``AsyncSession`` per child for the runner's own state writes.
+        async with session_maker() as session:
+            # FAST-CANCEL before the semaphore acquire — skips not-yet-started
+            # work cleanly (sync check; no await window).
+            if handle.cancel_event.is_set():
+                await _mark_cancelled_skipped(session, candidate_id)
+                return
+
+            acquired = False
+            try:
+                async with sem:
+                    acquired = True
+                    # Re-check after acquire — a sibling may have signalled
+                    # cancel while we waited on the semaphore.
+                    if handle.cancel_event.is_set():
+                        await _mark_cancelled_skipped(session, candidate_id)
+                        return
+                    try:
+                        await execute_candidate(candidate_id)
+                    except asyncio.CancelledError:
+                        # Persist the cancelled terminal state before re-raising
+                        # so the TaskGroup absorbs the cancel.
+                        await _mark_cancelled_running(session, candidate_id)
+                        raise
+                    except Exception:
+                        # Defensive: ``execute_candidate`` should persist its own
+                        # failure; if it didn't, mark FAILED so settle aggregates
+                        # correctly. Do NOT re-raise — that would tear down siblings.
+                        logger.exception(
+                            "model_selection.runner_unexpected_child_error",
+                            selection_id=selection_id,
+                            candidate_id=candidate_id,
+                        )
+                        await _mark_failed_unexpected(session, candidate_id)
+            except asyncio.CancelledError:
+                if not acquired:
+                    await _mark_cancelled_skipped(session, candidate_id)
+                raise
+
+    try:
+        async with asyncio.TaskGroup() as tg:
+            for cid in candidate_ids:
+                task = tg.create_task(_child(cid), name=f"model_selection:{selection_id}:{cid}")
+                handle.tasks.append(task)
+    except* asyncio.CancelledError:
+        # Clean ``task.cancel()`` calls are absorbed here; the per-child blocks
+        # already wrote the terminal state. The caller settles the parent.
+        logger.info(
+            "model_selection.runner_cancelled_exception_group",
+            selection_id=selection_id,
+        )
+
+    logger.info(
+        "model_selection.runner_complete",
+        selection_id=selection_id,
+        cancel_requested=handle.cancel_event.is_set(),
+    )
+    return effective
+
+
+def cancel_selection(selection_id: str) -> bool:
+    """Signal cooperative cancel for an in-flight selection.
+
+    Sets ``cancel_event`` (skips pending children) and ``task.cancel()`` on
+    every tracked child (interrupts running children at the next yield).
+
+    Returns:
+        ``True`` if the selection was registered; ``False`` if no handle exists
+        (race: the selection settled before cancel).
+    """
+    handle = _ACTIVE_SELECTIONS.get(selection_id)
+    if handle is None:
+        return False
+    handle.cancel_event.set()
+    cancelled_count = 0
+    for task in handle.tasks:
+        if not task.done():
+            task.cancel()
+            cancelled_count += 1
+    logger.info(
+        "model_selection.cancel_requested",
+        selection_id=selection_id,
+        n_tasks_tracked=len(handle.tasks),
+        n_tasks_cancelled=cancelled_count,
+    )
+    return True
+
+
+async def await_drain(selection_id: str, timeout_seconds: float) -> bool:
+    """Block until the selection's parent settle commits, or timeout elapses.
+
+    Returns:
+        ``True`` on clean drain (or if never registered); ``False`` on timeout.
+    """
+    handle = _ACTIVE_SELECTIONS.get(selection_id)
+    if handle is None:
+        return True
+    try:
+        await asyncio.wait_for(handle.completed_event.wait(), timeout=timeout_seconds)
+        return True
+    except TimeoutError:
+        # asyncio.wait_for raises the built-in TimeoutError since Python 3.11.
+        logger.warning(
+            "model_selection.cancel_drain_timeout",
+            selection_id=selection_id,
+            timeout_seconds=timeout_seconds,
+        )
+        return False
+
+
+def mark_completed(selection_id: str) -> None:
+    """Signal that the selection's parent settle has committed.
+
+    Must be called after ``_settle`` commits (including the failure path) so any
+    concurrent ``DELETE`` drain unblocks. Idempotent: a missing handle is a no-op.
+    """
+    handle = _ACTIVE_SELECTIONS.pop(selection_id, None)
+    if handle is None:
+        return
+    handle.completed_event.set()
+
+
+# --------------------------------------------------------------------- helpers
+# Each helper accepts an already-open ``AsyncSession`` (one per child) and
+# commits its single UPDATE. They never raise on a missing row (a deleted-parent
+# race is survivable — log + move on).
+
+
+async def _mark_cancelled_skipped(session: AsyncSession, candidate_id: str) -> None:
+    """Mark a not-yet-started candidate as cancelled (pending → cancelled)."""
+    now = datetime.now(UTC)
+    await session.execute(
+        update(ModelSelectionCandidate)
+        .where(ModelSelectionCandidate.candidate_id == candidate_id)
+        .values(status=CandidateStatus.CANCELLED.value, completed_at=now)
+    )
+    await session.commit()
+
+
+async def _mark_cancelled_running(session: AsyncSession, candidate_id: str) -> None:
+    """Mark a running candidate as cancelled (running → cancelled)."""
+    now = datetime.now(UTC)
+    row = (
+        await session.execute(
+            select(ModelSelectionCandidate.started_at).where(
+                ModelSelectionCandidate.candidate_id == candidate_id
+            )
+        )
+    ).first()
+    started_at = row[0] if row is not None else None
+    duration_ms = int((now - started_at).total_seconds() * 1000) if started_at is not None else None
+    await session.execute(
+        update(ModelSelectionCandidate)
+        .where(ModelSelectionCandidate.candidate_id == candidate_id)
+        .values(
+            status=CandidateStatus.CANCELLED.value,
+            completed_at=now,
+            duration_ms=duration_ms,
+        )
+    )
+    await session.commit()
+
+
+async def _mark_failed_unexpected(session: AsyncSession, candidate_id: str) -> None:
+    """Defensive: mark a candidate ``failed`` when ``execute_candidate`` raised."""
+    now = datetime.now(UTC)
+    await session.execute(
+        update(ModelSelectionCandidate)
+        .where(ModelSelectionCandidate.candidate_id == candidate_id)
+        .values(
+            status=CandidateStatus.FAILED.value,
+            completed_at=now,
+            error_message="Runner caught unexpected exception (see structlog)",
+            error_type="UnexpectedRunnerError",
+        )
+    )
+    await session.commit()
+
+
+__all__ = [
+    "_ACTIVE_SELECTIONS",
+    "CancelHandle",
+    "await_drain",
+    "cancel_selection",
+    "mark_completed",
+    "run_selection_candidates",
+]
diff --git a/app/features/model_selection/schemas.py b/app/features/model_selection/schemas.py
new file mode 100644
index 00000000..f494882d
--- /dev/null
+++ b/app/features/model_selection/schemas.py
@@ -0,0 +1,475 @@
+"""Pydantic v2 schemas for the Forecast Champion Selector slice (issue #353).
+
+Request bodies use ``ConfigDict(strict=True)`` per
+``docs/_base/SECURITY.md`` § "Pydantic v2 strict mode on FastAPI request
+bodies"; the only JSON-non-native fields (``SelectionWindow.start_date`` /
+``end_date``) carry ``Field(strict=False, ...)`` so the strict-mode policy
+linter (``app/core/tests/test_strict_mode_policy.py``) stays green and ISO-date
+JSON strings are accepted on the ``validate_python`` path.
+
+Enum-like string fields use ``Literal[...]`` (NOT a ``str``-``Enum``) because
+strict mode refuses to coerce a JSON string into a str-enum instance — the same
+reason ``app/features/batch/schemas.py`` uses literals.
+
+Response/intermediate models are plain ``BaseModel`` (outputs need no strict
+coercion). They form the stable backend contract the eventual UI consumes.
+
+``SplitConfig`` is reused directly from the backtesting slice (a schema type
+with no import cycle back to this slice) to avoid configuration drift.
+"""
+
+from __future__ import annotations
+
+from datetime import date, datetime
+from typing import Any, Literal
+
+from pydantic import BaseModel, ConfigDict, Field, model_validator
+
+from app.features.backtesting.schemas import SplitConfig
+
+# Valid forecasting model_type values — the full ``ModelConfig`` union
+# (``app/features/forecasting/schemas.py``). ``lightgbm``/``xgboost`` are opt-in
+# extras and may degrade to a failed candidate at runtime when the extra is
+# absent (handled in the service, not rejected here).
+ModelType = Literal[
+    "naive",
+    "seasonal_naive",
+    "moving_average",
+    "weighted_moving_average",
+    "seasonal_average",
+    "trend_regression_baseline",
+    "random_forest",
+    "lightgbm",
+    "xgboost",
+    "regression",
+    "prophet_like",
+]
+
+RankingMetric = Literal["wape", "smape", "mae", "bias"]
+SelectionStatusLiteral = Literal[
+    "pending", "running", "completed", "partial", "failed", "cancelled"
+]
+CandidateStatusLiteral = Literal["pending", "running", "completed", "failed", "cancelled"]
+ConfidenceLevel = Literal["high", "medium", "low"]
+AvailabilityStatus = Literal["ready", "limited", "unusable"]
+
+
+# =============================================================================
+# Request models (strict mode)
+# =============================================================================
+
+
+class SelectionWindow(BaseModel):
+    """Inclusive date window the candidate backtests run over."""
+
+    model_config = ConfigDict(strict=True)
+
+    start_date: date = Field(strict=False, description="Window start (inclusive), YYYY-MM-DD")
+    end_date: date = Field(strict=False, description="Window end (inclusive), YYYY-MM-DD")
+
+    @model_validator(mode="after")
+    def _check_order(self) -> SelectionWindow:
+        """Reject an inverted/zero-length window (surfaced as RFC 7807 422)."""
+        if self.end_date <= self.start_date:
+            raise ValueError("end_date must be after start_date")
+        return self
+
+
+class CandidateModelConfig(BaseModel):
+    """One candidate forecasting model to evaluate.
+
+    ``params`` are the FLAT model-specific parameters (e.g.
+    ``{"season_length": 7}``). They are flattened into the forecasting
+    ``ModelConfig`` union at the service boundary; unknown params surface as a
+    failed candidate with a reason rather than a request rejection.
+    """
+
+    model_config = ConfigDict(strict=True)
+
+    model_type: ModelType
+    params: dict[str, Any] = Field(default_factory=dict)
+
+
+class RankingPolicy(BaseModel):
+    """Tunable thresholds for ranking filters + confidence.
+
+    ``max_acceptable_abs_bias`` is an ABSOLUTE bias bound in demand units and is
+    therefore series-scale dependent; it defaults high enough to be effectively
+    disabled so confidence is driven primarily by the relative WAPE lead, the
+    valid-candidate count, and the sample size. Set a series-appropriate value
+    to enable the bias guard.
+    """
+
+    model_config = ConfigDict(strict=True)
+
+    minimum_sample_size: int = Field(
+        default=0, ge=0, description="Drop candidates whose backtest sample is below this"
+    )
+    high_confidence_rel_improvement: float = Field(
+        default=0.10,
+        ge=0.0,
+        le=1.0,
+        description="Relative WAPE lead over 2nd place required for HIGH confidence",
+    )
+    max_acceptable_abs_bias: float = Field(
+        default=1_000_000_000.0,
+        ge=0.0,
+        description="Absolute winner-bias bound (demand units); high default = guard disabled",
+    )
+
+
+class ModelSelectionRunRequest(BaseModel):
+    """``POST /model-selection/run`` request body."""
+
+    model_config = ConfigDict(strict=True)
+
+    store_id: int = Field(..., ge=1, description="Store ID")
+    product_id: int = Field(..., ge=1, description="Product ID")
+    selection_window: SelectionWindow
+    forecast_horizon: int = Field(..., ge=1, le=90, description="Forecast horizon in days")
+    ranking_metric: RankingMetric = "wape"
+    split_config: SplitConfig = Field(default_factory=SplitConfig)
+    candidate_models: list[CandidateModelConfig] = Field(min_length=1, max_length=10)
+    feature_frame_version: int = Field(default=1, ge=1, le=2)
+    feature_groups: list[str] | None = Field(default=None)
+    ranking_policy: RankingPolicy = Field(default_factory=RankingPolicy)
+    auto_train_winner: bool = Field(default=False)
+    auto_predict: bool = Field(default=False)
+
+    @model_validator(mode="after")
+    def _check_consistency(self) -> ModelSelectionRunRequest:
+        """Enforce LOCKED decisions #5 and #7 plus V1/feature-group consistency."""
+        if self.split_config.horizon != self.forecast_horizon:
+            raise ValueError(
+                f"split_config.horizon ({self.split_config.horizon}) must equal "
+                f"forecast_horizon ({self.forecast_horizon})"
+            )
+        if self.auto_predict and not self.auto_train_winner:
+            raise ValueError("auto_predict requires auto_train_winner=True")
+        if self.feature_frame_version == 1 and self.feature_groups is not None:
+            raise ValueError(
+                "feature_groups is only valid when feature_frame_version=2; "
+                "omit it for V1 selection."
+            )
+        return self
+
+
+class AvailabilityQuery(BaseModel):
+    """Validated query params for ``GET /model-selection/availability``."""
+
+    model_config = ConfigDict(strict=True)
+
+    store_id: int = Field(..., ge=1)
+    product_id: int = Field(..., ge=1)
+    forecast_horizon: int = Field(default=14, ge=1, le=90)
+
+
+class TrainSelectedRequest(BaseModel):
+    """``POST /model-selection/{id}/train-selected`` body (Slice C).
+
+    Trains a USER-CHOSEN candidate (override). Only ``str``/``None`` fields so
+    ``ConfigDict(strict=True)`` needs no ``Field(strict=False)`` override (no
+    date/uuid/decimal field) — keeps ``test_strict_mode_policy`` green.
+    """
+
+    model_config = ConfigDict(strict=True)
+
+    model_type: ModelType
+    override_reason: str | None = Field(default=None, max_length=2000)
+
+
+class ForecastDecisionParams(BaseModel):
+    """Optional ``POST /model-selection/{id}/predict`` body (Slice C).
+
+    Drives the deterministic safety-stock heuristic in ``decision.py``. All
+    fields are JSON-native (``int``/``float``) → no ``Field(strict=False)``.
+    """
+
+    model_config = ConfigDict(strict=True)
+
+    lead_time_days: int = Field(default=7, ge=1, le=365)
+    service_level: float = Field(default=0.95, ge=0.5, lt=1.0)
+
+
+class PromoteRequest(BaseModel):
+    """``POST /model-selection/{id}/promote`` body (Slice C).
+
+    Approval-gated promotion of a trained champion to a registry alias.
+    ``alias_name`` mirrors the registry regex so a bad name 422s at the schema
+    boundary. ``approved_by`` is required — promotion is never automatic.
+    """
+
+    model_config = ConfigDict(strict=True)
+
+    alias_name: str = Field(..., min_length=1, max_length=100, pattern=r"^[a-z0-9][a-z0-9\-_]*$")
+    approved_by: str = Field(..., min_length=1, max_length=100)
+    acknowledge_non_recommended: bool = False
+    description: str | None = Field(default=None, max_length=500)
+
+
+# =============================================================================
+# Intermediate models (service-internal; embedded in JSONB snapshots)
+# =============================================================================
+
+
+class FoldChart(BaseModel):
+    """Per-fold chart points for one candidate."""
+
+    fold_index: int
+    dates: list[date]
+    actuals: list[float]
+    predictions: list[float]
+
+
+class CandidateResult(BaseModel):
+    """One candidate's full backtest outcome (success or failure).
+
+    ``params`` are carried through unchanged so the winning model can be rebuilt
+    from the persisted record without re-deriving them.
+    """
+
+    model_type: str
+    params: dict[str, Any]
+    failed: bool
+    error: str | None = None
+    aggregated_metrics: dict[str, float] | None = None
+    sample_size: int = 0
+    config_hash: str | None = None
+    folds: list[FoldChart] = Field(default_factory=list)
+
+
+class ModelRankEntry(BaseModel):
+    """One row in the ranking table — a ranked winner/runner-up or an excluded
+    (failed/filtered) candidate. Excluded entries keep ``rank=None``."""
+
+    rank: int | None
+    model_type: str
+    params: dict[str, Any]
+    included: bool
+    exclusion_reason: str | None = None
+    metrics: dict[str, float] | None = None
+
+
+class RankingResult(BaseModel):
+    """Deterministic ranking outcome — persisted into ``ranking_result``."""
+
+    winner: ModelRankEntry | None
+    entries: list[ModelRankEntry]
+    confidence: ConfidenceLevel
+    reasons: list[str]
+
+
+class WinnerSummary(BaseModel):
+    """The champion — flattened for the response top level."""
+
+    model_type: str
+    params: dict[str, Any]
+    metrics: dict[str, float]
+    rank: int
+
+
+class ChartData(BaseModel):
+    """Chart-ready comparison payload (a Success-Criteria deliverable)."""
+
+    wape_by_model: dict[str, float]
+    bias_by_model: dict[str, float]
+    fold_stability: dict[str, list[float]]
+    winner_actual_vs_predicted: list[FoldChart]
+
+
+# =============================================================================
+# Response models
+# =============================================================================
+
+
+class PairAvailabilityResponse(BaseModel):
+    """``GET /model-selection/availability`` response."""
+
+    store_id: int
+    product_id: int
+    first_sales_date: date | None
+    last_sales_date: date | None
+    observed_days: int
+    expected_calendar_days: int
+    coverage_ratio: float
+    missing_days: int
+    zero_sale_days: int
+    promotion_days: int | None
+    average_daily_demand: float
+    status: AvailabilityStatus
+    recommended_split_config: SplitConfig
+    warnings: list[str] = Field(default_factory=list)
+
+
+class ForecastSummary(BaseModel):
+    """Forecast output rolled up for the response.
+
+    Slice C adds ``peak_*`` / ``low_*`` as ADDITIVE Optional fields (default
+    ``None``) so legacy JSONB snapshots written by the Slice A/B auto-predict
+    path still validate on reload.
+    """
+
+    points: list[dict[str, Any]]
+    total_demand: float
+    average_demand: float
+    horizon: int
+    peak_date: date | None = None
+    peak_demand: float | None = None
+    low_date: date | None = None
+    low_demand: float | None = None
+
+
+class ForecastDecision(BaseModel):
+    """Deterministic, CLEARLY-LABELED inventory-decision heuristic (Slice C).
+
+    Computed by ``decision.compute_forecast_decision`` from the forecast points
+    + lead time + service level. ``method`` is fixed ``"heuristic"`` and every
+    use carries a caveat — this NEVER feeds ranking (LOCKED #3).
+    """
+
+    method: Literal["heuristic"] = "heuristic"
+    lead_time_days: int
+    service_level: float
+    z_value: float
+    sigma_daily_demand: float
+    expected_demand_over_lead_time: float
+    safety_stock: float
+    reorder_point: float
+    bias_risk_text: str
+    caveats: list[str]
+
+
+class CandidateProgress(BaseModel):
+    """One candidate's live execution state (Slice B async run).
+
+    Output-only. Empty list on a legacy synchronous ``/run`` row (no children).
+    """
+
+    candidate_id: str
+    ordinal: int
+    model_type: str
+    status: CandidateStatusLiteral
+    error: str | None = None
+    started_at: datetime | None = None
+    completed_at: datetime | None = None
+    duration_ms: int | None = None
+
+
+class SelectionProgress(BaseModel):
+    """Per-status candidate counts for an async selection run (Slice B)."""
+
+    total: int
+    pending: int
+    running: int
+    completed: int
+    failed: int
+    cancelled: int
+
+
+class ModelSelectionRunResponse(BaseModel):
+    """``POST /model-selection/run`` and ``GET /model-selection/{id}`` contract.
+
+    Slice B adds ``started_at`` / ``progress`` / ``candidate_progress`` as
+    ADDITIVE fields with safe defaults — a legacy synchronous ``/run`` row has
+    ``progress=None`` and ``candidate_progress=[]``.
+    """
+
+    selection_id: str
+    store_id: int
+    product_id: int
+    status: SelectionStatusLiteral
+    selection_window: SelectionWindow
+    forecast_horizon: int
+    ranking_metric: str
+    availability: PairAvailabilityResponse | None
+    ranking: list[ModelRankEntry]
+    winner: WinnerSummary | None
+    recommendation_confidence: ConfidenceLevel | None
+    confidence_reasons: list[str]
+    chart_data: ChartData | None
+    final_model: dict[str, Any] | None
+    forecast: ForecastSummary | None
+    business_summary: dict[str, Any] | None
+    error_message: str | None
+    created_at: datetime
+    started_at: datetime | None = None
+    completed_at: datetime | None
+    progress: SelectionProgress | None = None
+    candidate_progress: list[CandidateProgress] = Field(default_factory=list)
+
+
+class SubmitRunResponse(ModelSelectionRunResponse):
+    """``POST /model-selection/runs`` 202 response — an additive superset.
+
+    Carries the LRO status-monitor pointers (the frontend drives the UI from
+    these body fields, not the ``Location``/``Retry-After`` headers).
+    """
+
+    monitor_url: str
+    cancel_url: str
+
+
+class CandidateModelInfo(BaseModel):
+    """One selectable forecasting model in the capability catalog.
+
+    Output-only (plain ``BaseModel`` — no strict coercion needed). The
+    capability flags are BACKEND-OWNED: they derive from the forecasting
+    authority (``model_family_for`` + each forecaster's ``requires_features``)
+    so the frontend never re-derives families/feature-awareness in TypeScript.
+    """
+
+    model_type: str
+    label: str
+    family: Literal["baseline", "tree", "additive"]
+    feature_aware: bool
+    requires_extra: bool  # lightgbm/xgboost — opt-in extra may be absent at runtime
+    default_params: dict[str, Any]
+    supports_auto_predict: bool  # False for feature-aware models (predict() rejects them)
+    description: str
+
+
+class ModelCatalogResponse(BaseModel):
+    """``GET /model-selection/models`` — backend-owned candidate catalog."""
+
+    models: list[CandidateModelInfo]
+    default_candidate_model_types: list[str]
+
+
+class TrainWinnerResponse(BaseModel):
+    """``POST /model-selection/{id}/train-winner`` and ``/train-selected``.
+
+    Slice C adds ``is_override`` / ``override_warning`` as ADDITIVE fields with
+    back-compatible defaults — ``train-winner`` still returns
+    ``is_override=False`` + ``override_warning=None`` (its shape is unchanged for
+    existing callers/tests).
+    """
+
+    selection_id: str
+    model_type: str
+    model_path: str
+    is_override: bool = False
+    override_warning: str | None = None
+
+
+class PredictWinnerResponse(BaseModel):
+    """``POST /model-selection/{id}/predict`` response.
+
+    Slice C adds ``decision`` (the labeled safety-stock heuristic) as an
+    ADDITIVE Optional field; ``forecast`` now also carries peak/low.
+    """
+
+    selection_id: str
+    forecast: ForecastSummary
+    decision: ForecastDecision | None = None
+
+
+class PromoteResponse(BaseModel):
+    """``POST /model-selection/{id}/promote`` response (Slice C)."""
+
+    selection_id: str
+    alias_name: str
+    run_id: str
+    run_status: str
+    model_type: str
+    is_override: bool
+    promoted_at: datetime
diff --git a/app/features/model_selection/service.py b/app/features/model_selection/service.py
new file mode 100644
index 00000000..baef2875
--- /dev/null
+++ b/app/features/model_selection/service.py
@@ -0,0 +1,1346 @@
+"""Service layer for the Forecast Champion Selector slice (issue #353).
+
+Orchestrates pair-availability → candidate backtests → deterministic ranking →
+optional winner train/predict, persisting an auditable ``model_selection_run``.
+
+Cross-slice coupling rules (mirror ``OpsService`` + the forecasting/Batch
+precedent):
+- Read the data-platform ORM **models** at module scope (the sanctioned
+  read-only ORM surface).
+- Import sibling feature **services** (``BacktestingService`` /
+  ``ForecastingService``) and the ``ModelConfig`` ``TypeAdapter`` LAZILY inside
+  the methods that use them — avoids closing an alembic cold-boot import cycle.
+- Reuse the backtesting ``SplitConfig`` schema directly (no cycle).
+"""
+
+from __future__ import annotations
+
+import asyncio
+import uuid
+from collections.abc import Sequence
+from datetime import UTC, datetime
+from pathlib import Path
+from typing import TYPE_CHECKING, Any
+
+from sqlalchemy import and_, func, or_, select
+from sqlalchemy.ext.asyncio import AsyncSession, async_sessionmaker
+
+from app.core.config import get_settings
+from app.core.database import get_session_maker
+from app.core.exceptions import (
+    BadRequestError,
+    ConflictError,
+    GatewayTimeoutError,
+    NotFoundError,
+    UnprocessableEntityError,
+)
+from app.core.logging import get_logger
+from app.features.backtesting.schemas import SplitConfig
+from app.features.data_platform.models import Product, Promotion, SalesDaily, Store
+from app.features.model_selection import runner
+from app.features.model_selection.capabilities import build_model_catalog
+from app.features.model_selection.decision import (
+    compute_forecast_decision,
+    forecast_peak_low,
+)
+from app.features.model_selection.explanations import explain_winner
+from app.features.model_selection.models import (
+    TERMINAL_SELECTION_STATES,
+    CandidateStatus,
+    ModelSelectionCandidate,
+    ModelSelectionRun,
+    ModelSelectionStatus,
+)
+from app.features.model_selection.ranking import build_chart_data, rank_candidates
+from app.features.model_selection.schemas import (
+    AvailabilityStatus,
+    CandidateModelConfig,
+    CandidateProgress,
+    CandidateResult,
+    ChartData,
+    FoldChart,
+    ForecastDecision,
+    ForecastSummary,
+    ModelCatalogResponse,
+    ModelSelectionRunRequest,
+    ModelSelectionRunResponse,
+    PairAvailabilityResponse,
+    PromoteRequest,
+    PromoteResponse,
+    RankingResult,
+    SelectionProgress,
+    SelectionWindow,
+    SubmitRunResponse,
+    TrainWinnerResponse,
+    WinnerSummary,
+)
+
+if TYPE_CHECKING:
+    from app.features.backtesting.schemas import BacktestResponse
+    from app.features.forecasting.schemas import PredictResponse
+
+logger = get_logger(__name__)
+
+# Strong refs to detached background workers — asyncio holds only a WEAK ref to
+# a bare ``create_task`` result, so without this set a worker can be GC'd
+# mid-run (https://docs.python.org/3.12/library/asyncio-task.html#asyncio.create_task).
+_BACKGROUND_TASKS: set[asyncio.Task[None]] = set()
+
+# Availability policy constants (module-level; not operator-configurable in v1).
+MIN_COVERAGE_RATIO = 0.8
+DEFAULT_MIN_TRAIN_SIZE = 30
+MAX_RECOMMENDED_SPLITS = 5
+
+_TERMINAL_WITH_WINNER = frozenset(
+    {ModelSelectionStatus.COMPLETED.value, ModelSelectionStatus.PARTIAL.value}
+)
+
+
+class ModelSelectionService:
+    """Stateless orchestrator — a fresh ``db`` session per method."""
+
+    # -------------------------------------------------------------------------
+    # Capability catalog
+    # -------------------------------------------------------------------------
+
+    def get_model_catalog(self) -> ModelCatalogResponse:
+        """Return the backend-owned candidate-model catalog (static, no I/O).
+
+        Thin pass-through to the pure :func:`capabilities.build_model_catalog`;
+        kept on the service for symmetry with ``get_availability`` / ``run``.
+        """
+        return build_model_catalog()
+
+    # -------------------------------------------------------------------------
+    # Availability
+    # -------------------------------------------------------------------------
+
+    async def get_availability(
+        self,
+        db: AsyncSession,
+        store_id: int,
+        product_id: int,
+        forecast_horizon: int,
+        split_config: SplitConfig | None = None,
+    ) -> PairAvailabilityResponse:
+        """Assess whether a (store, product) pair has enough history to model."""
+        store = await db.get(Store, store_id)
+        if store is None:
+            raise NotFoundError(message=f"Store {store_id} not found")
+        product = await db.get(Product, product_id)
+        if product is None:
+            raise NotFoundError(message=f"Product {product_id} not found")
+
+        n_splits = split_config.n_splits if split_config else MAX_RECOMMENDED_SPLITS
+        min_train = split_config.min_train_size if split_config else DEFAULT_MIN_TRAIN_SIZE
+
+        agg = (
+            await db.execute(
+                select(
+                    func.min(SalesDaily.date),
+                    func.max(SalesDaily.date),
+                    func.count(func.distinct(SalesDaily.date)),
+                    func.avg(SalesDaily.quantity),
+                    func.count().filter(SalesDaily.quantity == 0),
+                ).where(
+                    SalesDaily.store_id == store_id,
+                    SalesDaily.product_id == product_id,
+                )
+            )
+        ).one()
+        first_date, last_date, observed_raw, avg_qty, zero_raw = agg
+        observed_days = int(observed_raw or 0)
+        zero_sale_days = int(zero_raw or 0)
+        average_daily_demand = float(avg_qty) if avg_qty is not None else 0.0
+
+        warnings: list[str] = []
+
+        if first_date is None or last_date is None or observed_days == 0:
+            expected_calendar_days = 0
+            coverage_ratio = 0.0
+            missing_days = 0
+            promotion_days: int | None = 0
+        else:
+            expected_calendar_days = (last_date - first_date).days + 1
+            coverage_ratio = (
+                observed_days / expected_calendar_days if expected_calendar_days > 0 else 0.0
+            )
+            missing_days = max(0, expected_calendar_days - observed_days)
+            promotion_days = await self._count_promotion_days(db, store_id, product_id, warnings)
+
+        ready_threshold = min_train + forecast_horizon * n_splits
+        limited_threshold = min_train + forecast_horizon
+        status: AvailabilityStatus
+        if observed_days >= ready_threshold and coverage_ratio >= MIN_COVERAGE_RATIO:
+            status = "ready"
+        elif observed_days >= limited_threshold:
+            status = "limited"
+        else:
+            status = "unusable"
+
+        if coverage_ratio and coverage_ratio < MIN_COVERAGE_RATIO and status != "unusable":
+            warnings.append(
+                f"Coverage {coverage_ratio:.0%} is below the {MIN_COVERAGE_RATIO:.0%} "
+                "ready threshold."
+            )
+
+        feasible_splits = (observed_days - min_train) // max(forecast_horizon, 1)
+        recommended_splits = min(20, max(2, min(MAX_RECOMMENDED_SPLITS, feasible_splits)))
+        recommended_split_config = SplitConfig(
+            strategy="expanding",
+            n_splits=recommended_splits,
+            min_train_size=min_train,
+            gap=0,
+            horizon=forecast_horizon,
+        )
+
+        return PairAvailabilityResponse(
+            store_id=store_id,
+            product_id=product_id,
+            first_sales_date=first_date,
+            last_sales_date=last_date,
+            observed_days=observed_days,
+            expected_calendar_days=expected_calendar_days,
+            coverage_ratio=coverage_ratio,
+            missing_days=missing_days,
+            zero_sale_days=zero_sale_days,
+            promotion_days=promotion_days,
+            average_daily_demand=average_daily_demand,
+            status=status,
+            recommended_split_config=recommended_split_config,
+            warnings=warnings,
+        )
+
+    async def _count_promotion_days(
+        self,
+        db: AsyncSession,
+        store_id: int,
+        product_id: int,
+        warnings: list[str],
+    ) -> int | None:
+        """Count distinct sales dates inside any promotion for the pair.
+
+        Includes chain-wide promos (``promotion.store_id IS NULL``). Returns
+        ``None`` + a warning on any error (an acceptable fallback per the
+        Success Criteria) — never sums ``(end-start)`` which would double-count
+        overlapping ranges.
+        """
+        try:
+            count = await db.scalar(
+                select(func.count(func.distinct(SalesDaily.date)))
+                .select_from(SalesDaily)
+                .join(
+                    Promotion,
+                    and_(
+                        Promotion.product_id == SalesDaily.product_id,
+                        or_(
+                            Promotion.store_id == SalesDaily.store_id,
+                            Promotion.store_id.is_(None),
+                        ),
+                        SalesDaily.date >= Promotion.start_date,
+                        SalesDaily.date <= Promotion.end_date,
+                    ),
+                )
+                .where(
+                    SalesDaily.store_id == store_id,
+                    SalesDaily.product_id == product_id,
+                )
+            )
+            return int(count or 0)
+        except Exception as exc:  # promotion_days is best-effort; degrade gracefully
+            warnings.append(f"promotion_days could not be derived: {exc}")
+            return None
+
+    # -------------------------------------------------------------------------
+    # Orchestration
+    # -------------------------------------------------------------------------
+
+    async def run_selection(
+        self, db: AsyncSession, request: ModelSelectionRunRequest
+    ) -> ModelSelectionRunResponse:
+        """Run the full champion-selection workflow and persist the audit row."""
+        from pydantic import TypeAdapter  # lazy
+
+        from app.features.backtesting.schemas import BacktestConfig  # lazy
+        from app.features.backtesting.service import BacktestingService  # lazy
+        from app.features.forecasting.schemas import ModelConfig  # lazy
+
+        adapter: TypeAdapter[object] = TypeAdapter(ModelConfig)
+
+        row = ModelSelectionRun(
+            selection_id=uuid.uuid4().hex,
+            status=ModelSelectionStatus.RUNNING.value,
+            store_id=request.store_id,
+            product_id=request.product_id,
+            start_date=request.selection_window.start_date,
+            end_date=request.selection_window.end_date,
+            forecast_horizon=request.forecast_horizon,
+            ranking_metric=request.ranking_metric,
+            candidate_models=[c.model_dump() for c in request.candidate_models],
+            policy_snapshot=request.ranking_policy.model_dump(mode="json"),
+            feature_frame_version=request.feature_frame_version,
+        )
+        db.add(row)
+        await db.flush()
+        logger.info(
+            "model_selection.run_received",
+            selection_id=row.selection_id,
+            store_id=request.store_id,
+            product_id=request.product_id,
+            n_candidates=len(request.candidate_models),
+        )
+
+        availability = await self.get_availability(
+            db,
+            request.store_id,
+            request.product_id,
+            request.forecast_horizon,
+            request.split_config,
+        )
+        row.availability_snapshot = availability.model_dump(mode="json")
+        logger.info(
+            "model_selection.availability_checked",
+            selection_id=row.selection_id,
+            status=availability.status,
+            observed_days=availability.observed_days,
+        )
+
+        if availability.status == "unusable":  # LOCKED #2 — fail fast (400)
+            message = "Insufficient data for model selection (availability unusable)."
+            row.status = ModelSelectionStatus.FAILED.value
+            row.error_message = message
+            await db.flush()
+            logger.warning(
+                "model_selection.run_failed",
+                selection_id=row.selection_id,
+                reason="unusable_availability",
+            )
+            raise BadRequestError(message=message)
+
+        results: list[CandidateResult] = []
+        backtesting_service = BacktestingService()
+        for candidate in request.candidate_models:
+            try:
+                cfg = adapter.validate_python(
+                    {"model_type": candidate.model_type, **candidate.params}
+                )
+                backtest = await backtesting_service.run_backtest(
+                    db,
+                    request.store_id,
+                    request.product_id,
+                    request.selection_window.start_date,
+                    request.selection_window.end_date,
+                    BacktestConfig(
+                        split_config=request.split_config,
+                        model_config_main=cfg,  # type: ignore[arg-type]
+                        include_baselines=False,
+                        store_fold_details=True,
+                    ),
+                )
+                results.append(self._shape_candidate(candidate, backtest))
+                logger.info(
+                    "model_selection.candidate_completed",
+                    selection_id=row.selection_id,
+                    model_type=candidate.model_type,
+                )
+            except Exception as exc:  # never hide a failed candidate
+                results.append(self._shape_failed_candidate(candidate, exc))
+                logger.warning(
+                    "model_selection.candidate_failed",
+                    selection_id=row.selection_id,
+                    model_type=candidate.model_type,
+                    error=str(exc),
+                )
+
+        row.candidate_results = [r.model_dump(mode="json") for r in results]
+        ranking = rank_candidates(
+            results, request.ranking_policy, request.ranking_metric, availability.status
+        )
+        row.ranking_result = ranking.model_dump(mode="json")
+
+        if ranking.winner is None:  # LOCKED #3 — persist failed, return 200
+            row.status = ModelSelectionStatus.FAILED.value
+            row.error_message = "No candidate produced a valid backtest."
+            row.business_summary = explain_winner(ranking, availability)
+            row.completed_at = datetime.now(UTC)
+            await db.flush()
+            await db.refresh(row)
+            logger.warning(
+                "model_selection.run_failed",
+                selection_id=row.selection_id,
+                reason="no_valid_winner",
+            )
+            return self._response(row, ranking)
+
+        winner_cfg = adapter.validate_python(
+            {"model_type": ranking.winner.model_type, **ranking.winner.params}
+        )
+
+        if request.auto_train_winner:
+            from app.features.forecasting.service import ForecastingService  # lazy
+
+            train = await ForecastingService().train_model(
+                db,
+                request.store_id,
+                request.product_id,
+                request.selection_window.start_date,
+                request.selection_window.end_date,
+                winner_cfg,  # type: ignore[arg-type]
+                feature_frame_version=request.feature_frame_version,
+                feature_groups=request.feature_groups,
+            )
+            row.final_model_path = train.model_path
+
+        forecast_warning: str | None = None
+        if request.auto_predict and row.final_model_path:
+            from app.features.forecasting.service import ForecastingService  # lazy
+
+            try:
+                prediction = await ForecastingService().predict(
+                    request.store_id,
+                    request.product_id,
+                    request.forecast_horizon,
+                    row.final_model_path,
+                )
+                row.forecast_result = self._forecast_summary(
+                    prediction, request.forecast_horizon
+                ).model_dump(mode="json")
+            except Exception as exc:  # e.g. feature-aware predict reject — warn, don't fail
+                forecast_warning = f"Auto-predict skipped: {exc}"
+                logger.warning(
+                    "model_selection.predict_skipped",
+                    selection_id=row.selection_id,
+                    error=str(exc),
+                )
+
+        row.winner_model_type = ranking.winner.model_type
+        row.winner_metrics = ranking.winner.metrics
+        row.chart_data = build_chart_data(results, ranking).model_dump(mode="json")
+        business = explain_winner(ranking, availability)
+        if forecast_warning is not None:
+            business["forecast_warning"] = forecast_warning
+        row.business_summary = business
+        row.status = (
+            ModelSelectionStatus.PARTIAL.value
+            if any(r.failed for r in results)
+            else ModelSelectionStatus.COMPLETED.value
+        )
+        row.completed_at = datetime.now(UTC)
+        await db.flush()
+        await db.refresh(row)
+        logger.info(
+            "model_selection.run_completed",
+            selection_id=row.selection_id,
+            status=row.status,
+            winner=row.winner_model_type,
+        )
+        return self._response(row, ranking)
+
+    # -------------------------------------------------------------------------
+    # Async orchestration (Slice B) — fire-and-forget LRO
+    # -------------------------------------------------------------------------
+
+    async def submit_run(
+        self, db: AsyncSession, request: ModelSelectionRunRequest
+    ) -> SubmitRunResponse:
+        """Submit an async selection run: insert parent + children, detach worker.
+
+        Returns 202-shaped ``SubmitRunResponse`` (status=running) IMMEDIATELY —
+        the candidate backtests run in a detached :func:`asyncio.create_task`
+        that uses its OWN sessions (never this request ``db``).
+        """
+        availability = await self.get_availability(
+            db,
+            request.store_id,
+            request.product_id,
+            request.forecast_horizon,
+            request.split_config,
+        )
+
+        selection_id = uuid.uuid4().hex
+        now = datetime.now(UTC)
+        row = ModelSelectionRun(
+            selection_id=selection_id,
+            status=ModelSelectionStatus.RUNNING.value,
+            store_id=request.store_id,
+            product_id=request.product_id,
+            start_date=request.selection_window.start_date,
+            end_date=request.selection_window.end_date,
+            forecast_horizon=request.forecast_horizon,
+            ranking_metric=request.ranking_metric,
+            candidate_models=[c.model_dump() for c in request.candidate_models],
+            policy_snapshot=request.ranking_policy.model_dump(mode="json"),
+            availability_snapshot=availability.model_dump(mode="json"),
+            started_at=now,
+            total_candidates=len(request.candidate_models),
+            feature_frame_version=request.feature_frame_version,
+        )
+        db.add(row)
+        # Flush the parent INSERT before the children — there is no ORM
+        # ``relationship`` and the FK targets the non-PK ``selection_id``, so the
+        # unit-of-work would not otherwise order parent-before-child.
+        await db.flush()
+
+        # Fail fast on unusable availability (LOCKED #2 parity with the sync path)
+        # — persist a failed parent (no children, no worker) and raise 400.
+        if availability.status == "unusable":
+            message = "Insufficient data for model selection (availability unusable)."
+            row.status = ModelSelectionStatus.FAILED.value
+            row.error_message = message
+            row.completed_at = now
+            await db.commit()
+            logger.warning(
+                "model_selection.run_failed",
+                selection_id=selection_id,
+                reason="unusable_availability",
+            )
+            raise BadRequestError(message=message)
+
+        candidates: list[ModelSelectionCandidate] = []
+        for ordinal, candidate in enumerate(request.candidate_models):
+            cand = ModelSelectionCandidate(
+                candidate_id=uuid.uuid4().hex,
+                selection_id=selection_id,
+                ordinal=ordinal,
+                model_type=candidate.model_type,
+                params=candidate.params,
+                status=CandidateStatus.PENDING.value,
+            )
+            db.add(cand)
+            candidates.append(cand)
+        await db.commit()
+        await db.refresh(row)  # populate server-default created_at for the 202 body
+
+        logger.info(
+            "model_selection.run_submitted",
+            selection_id=selection_id,
+            store_id=request.store_id,
+            product_id=request.product_id,
+            n_candidates=len(candidates),
+        )
+
+        # Eagerly register the cancel handle so a DELETE arriving before the
+        # detached worker starts still finds it (avoids a false "already settled"
+        # 409). The worker's setdefault reuses this same handle.
+        runner.register_selection(selection_id)
+
+        # Detach the worker — hold a strong ref so it cannot be GC'd mid-run.
+        task = asyncio.create_task(
+            self._run_in_background(selection_id, request),
+            name=f"model_selection_worker:{selection_id}",
+        )
+        _BACKGROUND_TASKS.add(task)
+        task.add_done_callback(_BACKGROUND_TASKS.discard)
+
+        candidate_progress = [
+            CandidateProgress(
+                candidate_id=c.candidate_id,
+                ordinal=c.ordinal,
+                model_type=c.model_type,
+                status="pending",
+            )
+            for c in candidates
+        ]
+        progress = SelectionProgress(
+            total=len(candidates),
+            pending=len(candidates),
+            running=0,
+            completed=0,
+            failed=0,
+            cancelled=0,
+        )
+        return SubmitRunResponse(
+            selection_id=selection_id,
+            store_id=request.store_id,
+            product_id=request.product_id,
+            status="running",
+            selection_window=request.selection_window,
+            forecast_horizon=request.forecast_horizon,
+            ranking_metric=request.ranking_metric,
+            availability=availability,
+            ranking=[],
+            winner=None,
+            recommendation_confidence=None,
+            confidence_reasons=[],
+            chart_data=None,
+            final_model=None,
+            forecast=None,
+            business_summary=None,
+            error_message=None,
+            created_at=row.created_at,
+            started_at=now,
+            completed_at=None,
+            progress=progress,
+            candidate_progress=candidate_progress,
+            monitor_url=f"/model-selection/{selection_id}",
+            cancel_url=f"/model-selection/{selection_id}",
+        )
+
+    async def _run_in_background(
+        self, selection_id: str, request: ModelSelectionRunRequest
+    ) -> None:
+        """Detached worker — runs candidate backtests, then settles the parent.
+
+        Uses ONLY sessions from ``get_session_maker()`` (the request session is
+        long gone). Never raises out — settles the parent to its observed state.
+        """
+        session_maker = get_session_maker()
+        settings = get_settings()
+
+        async def _exec(candidate_id: str) -> None:
+            from pydantic import TypeAdapter  # lazy
+
+            from app.features.backtesting.schemas import BacktestConfig  # lazy
+            from app.features.backtesting.service import BacktestingService  # lazy
+            from app.features.forecasting.schemas import ModelConfig  # lazy
+
+            async with session_maker() as session:
+                cand = await session.scalar(
+                    select(ModelSelectionCandidate).where(
+                        ModelSelectionCandidate.candidate_id == candidate_id
+                    )
+                )
+                if cand is None:  # deleted-parent race — survivable
+                    return
+                started = datetime.now(UTC)
+                cand.status = CandidateStatus.RUNNING.value
+                cand.started_at = started
+                await session.commit()
+                logger.info(
+                    "model_selection.candidate_started",
+                    selection_id=selection_id,
+                    model_type=cand.model_type,
+                )
+                try:
+                    adapter: TypeAdapter[object] = TypeAdapter(ModelConfig)
+                    cfg = adapter.validate_python({"model_type": cand.model_type, **cand.params})
+                    backtest = await BacktestingService().run_backtest(
+                        session,
+                        request.store_id,
+                        request.product_id,
+                        request.selection_window.start_date,
+                        request.selection_window.end_date,
+                        BacktestConfig(
+                            split_config=request.split_config,
+                            model_config_main=cfg,  # type: ignore[arg-type]
+                            include_baselines=False,
+                            store_fold_details=True,
+                        ),
+                    )
+                    result = self._shape_candidate(
+                        CandidateModelConfig.model_validate(
+                            {"model_type": cand.model_type, "params": cand.params}
+                        ),
+                        backtest,
+                    )
+                    cand.result = result.model_dump(mode="json")
+                    cand.status = CandidateStatus.COMPLETED.value
+                    logger.info(
+                        "model_selection.candidate_completed",
+                        selection_id=selection_id,
+                        model_type=cand.model_type,
+                    )
+                except Exception as exc:  # never hide a failed candidate
+                    cand.status = CandidateStatus.FAILED.value
+                    cand.error_message = str(exc)[:2000]
+                    cand.error_type = type(exc).__name__
+                    logger.warning(
+                        "model_selection.candidate_failed",
+                        selection_id=selection_id,
+                        model_type=cand.model_type,
+                        error=str(exc),
+                    )
+                finished = datetime.now(UTC)
+                cand.completed_at = finished
+                cand.duration_ms = int((finished - started).total_seconds() * 1000)
+                await session.commit()
+
+        try:
+            candidate_ids = await self._candidate_ids(session_maker, selection_id)
+            await runner.run_selection_candidates(
+                selection_id=selection_id,
+                candidate_ids=candidate_ids,
+                max_parallel=settings.model_selection_global_max_parallel,
+                global_max_parallel=settings.model_selection_global_max_parallel,
+                session_maker=session_maker,
+                execute_candidate=_exec,
+            )
+        finally:
+            # Always settle + unblock any DELETE drain, even if loading the
+            # candidate ids or the runner itself raised unexpectedly.
+            await self._settle(selection_id, request, session_maker)
+            runner.mark_completed(selection_id)
+
+    async def _candidate_ids(
+        self, session_maker: async_sessionmaker[AsyncSession], selection_id: str
+    ) -> list[str]:
+        """Load this run's candidate ids in submit (ordinal) order."""
+        async with session_maker() as session:
+            rows = (
+                await session.execute(
+                    select(ModelSelectionCandidate.candidate_id)
+                    .where(ModelSelectionCandidate.selection_id == selection_id)
+                    .order_by(ModelSelectionCandidate.ordinal)
+                )
+            ).all()
+        return [r[0] for r in rows]
+
+    async def _settle(
+        self,
+        selection_id: str,
+        request: ModelSelectionRunRequest,
+        session_maker: async_sessionmaker[AsyncSession],
+    ) -> None:
+        """Aggregate terminal children → ranking/chart/business + final status.
+
+        REUSES the pure ``rank_candidates`` / ``build_chart_data`` /
+        ``explain_winner`` so the terminal GET output is byte-compatible with
+        the synchronous ``/run`` path (LOCKED #7).
+        """
+        async with session_maker() as session:
+            row = await session.scalar(
+                select(ModelSelectionRun).where(ModelSelectionRun.selection_id == selection_id)
+            )
+            if row is None:  # deleted-parent race
+                return
+            children = (
+                (
+                    await session.execute(
+                        select(ModelSelectionCandidate)
+                        .where(ModelSelectionCandidate.selection_id == selection_id)
+                        .order_by(ModelSelectionCandidate.ordinal)
+                    )
+                )
+                .scalars()
+                .all()
+            )
+
+            results: list[CandidateResult] = []
+            for child in children:
+                if child.status == CandidateStatus.COMPLETED.value and child.result:
+                    results.append(CandidateResult.model_validate(child.result))
+                elif child.status == CandidateStatus.CANCELLED.value:
+                    results.append(
+                        CandidateResult(
+                            model_type=child.model_type,
+                            params=child.params,
+                            failed=True,
+                            error="cancelled",
+                            aggregated_metrics=None,
+                            sample_size=0,
+                            folds=[],
+                        )
+                    )
+                else:  # failed (or any non-completed leftover)
+                    results.append(
+                        CandidateResult(
+                            model_type=child.model_type,
+                            params=child.params,
+                            failed=True,
+                            error=child.error_message or "candidate failed",
+                            aggregated_metrics=None,
+                            sample_size=0,
+                            folds=[],
+                        )
+                    )
+
+            availability = (
+                PairAvailabilityResponse.model_validate(row.availability_snapshot)
+                if row.availability_snapshot
+                else None
+            )
+            availability_status: AvailabilityStatus = (
+                availability.status if availability is not None else "ready"
+            )
+            ranking = rank_candidates(
+                results, request.ranking_policy, row.ranking_metric, availability_status
+            )
+            row.candidate_results = [r.model_dump(mode="json") for r in results]
+            row.ranking_result = ranking.model_dump(mode="json")
+            if ranking.winner is not None:
+                row.winner_model_type = ranking.winner.model_type
+                row.winner_metrics = ranking.winner.metrics
+                row.chart_data = build_chart_data(results, ranking).model_dump(mode="json")
+            if availability is not None:
+                row.business_summary = explain_winner(ranking, availability)
+
+            counts = self._status_counts(children)
+            row.completed_candidates = counts["completed"]
+            row.failed_candidates = counts["failed"]
+            row.cancelled_candidates = counts["cancelled"]
+            row.status = self._terminal_status(counts).value
+            row.completed_at = datetime.now(UTC)
+            await session.commit()
+            logger.info(
+                "model_selection.run_settled",
+                selection_id=selection_id,
+                status=row.status,
+                winner=row.winner_model_type,
+            )
+
+    async def cancel_run(self, db: AsyncSession, selection_id: str) -> ModelSelectionRunResponse:
+        """Cooperatively cancel + drain an in-flight selection run."""
+        row = await self._load(db, selection_id)
+        if row.status in TERMINAL_SELECTION_STATES:
+            raise ConflictError(
+                message=f"Selection run already terminal: {row.status}",
+                details={"selection_id": selection_id, "status": row.status},
+            )
+        logger.info("model_selection.run_cancel_requested", selection_id=selection_id)
+        fired = runner.cancel_selection(selection_id)
+        if not fired:
+            # Race: the worker settled between our load and the cancel.
+            raise ConflictError(
+                message="Selection run settled before cancel could fire",
+                details={"selection_id": selection_id},
+            )
+        settings = get_settings()
+        drained = await runner.await_drain(
+            selection_id,
+            timeout_seconds=float(settings.model_selection_cancel_drain_timeout_seconds),
+        )
+        if not drained:
+            raise GatewayTimeoutError(
+                message=(
+                    f"Drain exceeded {settings.model_selection_cancel_drain_timeout_seconds}s; "
+                    "in-flight sklearn / LightGBM fits are uncancellable mid-call — "
+                    "retry once the fit completes."
+                ),
+                details={"selection_id": selection_id},
+            )
+        # Re-load through a fresh read so the settled state is visible.
+        await db.commit()
+        refreshed = await self._load(db, selection_id)
+        logger.info(
+            "model_selection.run_cancel_drained",
+            selection_id=selection_id,
+            status=refreshed.status,
+        )
+        response = self._response(refreshed, self._load_ranking(refreshed))
+        await self._attach_progress(db, selection_id, response)
+        return response
+
+    @staticmethod
+    def _status_counts(children: Sequence[ModelSelectionCandidate]) -> dict[str, int]:
+        """Tally child statuses into the five count buckets."""
+        counts = {"pending": 0, "running": 0, "completed": 0, "failed": 0, "cancelled": 0}
+        for child in children:
+            counts[child.status] = counts.get(child.status, 0) + 1
+        return counts
+
+    @staticmethod
+    def _terminal_status(counts: dict[str, int]) -> ModelSelectionStatus:
+        """Terminal-status rule at settle (mirror ``batch.service._settle``)."""
+        completed = counts.get("completed", 0)
+        failed = counts.get("failed", 0)
+        cancelled = counts.get("cancelled", 0)
+        if cancelled > 0 and completed == 0 and failed == 0:
+            return ModelSelectionStatus.CANCELLED
+        if completed > 0 and failed == 0 and cancelled == 0:
+            return ModelSelectionStatus.COMPLETED
+        if failed > 0 and completed == 0 and cancelled == 0:
+            return ModelSelectionStatus.FAILED
+        if completed > 0 or failed > 0:
+            return ModelSelectionStatus.PARTIAL
+        return ModelSelectionStatus.FAILED
+
+    async def _attach_progress(
+        self, db: AsyncSession, selection_id: str, response: ModelSelectionRunResponse
+    ) -> None:
+        """Attach live ``progress`` + ``candidate_progress`` to a response.
+
+        A legacy synchronous ``/run`` row has no children → ``progress`` stays
+        ``None`` and ``candidate_progress`` stays ``[]``.
+        """
+        children = (
+            (
+                await db.execute(
+                    select(ModelSelectionCandidate)
+                    .where(ModelSelectionCandidate.selection_id == selection_id)
+                    .order_by(ModelSelectionCandidate.ordinal)
+                )
+            )
+            .scalars()
+            .all()
+        )
+        if not children:
+            return
+        counts = self._status_counts(children)
+        response.progress = SelectionProgress(
+            total=len(children),
+            pending=counts["pending"],
+            running=counts["running"],
+            completed=counts["completed"],
+            failed=counts["failed"],
+            cancelled=counts["cancelled"],
+        )
+        response.candidate_progress = [
+            CandidateProgress(
+                candidate_id=child.candidate_id,
+                ordinal=child.ordinal,
+                model_type=child.model_type,
+                status=child.status,  # type: ignore[arg-type]
+                error=child.error_message,
+                started_at=child.started_at,
+                completed_at=child.completed_at,
+                duration_ms=child.duration_ms,
+            )
+            for child in children
+        ]
+
+    # -------------------------------------------------------------------------
+    # Read / re-run helpers
+    # -------------------------------------------------------------------------
+
+    async def get_selection(self, db: AsyncSession, selection_id: str) -> ModelSelectionRunResponse:
+        """Return a persisted selection run by id (404 when missing).
+
+        Attaches live async progress (Slice B) when the run has child rows; a
+        legacy synchronous ``/run`` row has none and reads as before.
+        """
+        row = await self._load(db, selection_id)
+        response = self._response(row, self._load_ranking(row))
+        await self._attach_progress(db, selection_id, response)
+        return response
+
+    async def get_ranking(self, db: AsyncSession, selection_id: str) -> RankingResult:
+        """Return just the ranking block for a selection run."""
+        row = await self._load(db, selection_id)
+        return self._load_ranking(row)
+
+    async def train_winner(self, db: AsyncSession, selection_id: str) -> TrainWinnerResponse:
+        """Train the winning model for a completed selection (V1 contract)."""
+        from pydantic import TypeAdapter  # lazy
+
+        from app.features.forecasting.schemas import ModelConfig  # lazy
+        from app.features.forecasting.service import ForecastingService  # lazy
+
+        row = await self._load(db, selection_id)
+        ranking = self._load_ranking(row)
+        if ranking.winner is None:
+            raise BadRequestError(message="Selection has no winning model to train.")
+
+        adapter: TypeAdapter[object] = TypeAdapter(ModelConfig)
+        cfg = adapter.validate_python(
+            {"model_type": ranking.winner.model_type, **ranking.winner.params}
+        )
+        train = await ForecastingService().train_model(
+            db,
+            row.store_id,
+            row.product_id,
+            row.start_date,
+            row.end_date,
+            cfg,  # type: ignore[arg-type]
+            feature_frame_version=row.feature_frame_version,  # M1 — train as configured (V1/V2)
+        )
+        row.final_model_path = train.model_path
+        # Slice C — additive: the winner is the trained model and is NOT an
+        # override. The response shape is unchanged (is_override/override_warning
+        # default to False/None).
+        row.trained_model_type = ranking.winner.model_type
+        row.is_override = False
+        row.override_reason = None
+        await db.flush()
+        logger.info(
+            "model_selection.winner_trained",
+            selection_id=row.selection_id,
+            model_type=ranking.winner.model_type,
+        )
+        return TrainWinnerResponse(
+            selection_id=row.selection_id,
+            model_type=ranking.winner.model_type,
+            model_path=train.model_path,
+        )
+
+    async def train_selected(
+        self,
+        db: AsyncSession,
+        selection_id: str,
+        model_type: str,
+        override_reason: str | None,
+    ) -> TrainWinnerResponse:
+        """Train a USER-CHOSEN candidate (override) — Slice C.
+
+        ``model_type`` must be one of the run's CONFIGURED candidates
+        (``candidate_models``), NOT only the ranked/included entries: a candidate
+        that FAILED its backtest is still override-trainable (training is
+        independent of backtesting). A model never offered as a candidate → 400.
+        """
+        from pydantic import TypeAdapter  # lazy
+
+        from app.features.forecasting.schemas import ModelConfig  # lazy
+        from app.features.forecasting.service import ForecastingService  # lazy
+
+        row = await self._load(db, selection_id)
+        ranking = self._load_ranking(row)
+
+        configured = {
+            str(c.get("model_type")) for c in (row.candidate_models or []) if c.get("model_type")
+        }
+        if model_type not in configured:
+            raise BadRequestError(
+                message=(
+                    f"Model '{model_type}' was not a candidate in this selection. "
+                    f"Candidates: {sorted(configured)}."
+                )
+            )
+
+        params = self._params_for_trained_type(row, model_type)
+        adapter: TypeAdapter[object] = TypeAdapter(ModelConfig)
+        cfg = adapter.validate_python({"model_type": model_type, **params})
+        train = await ForecastingService().train_model(
+            db,
+            row.store_id,
+            row.product_id,
+            row.start_date,
+            row.end_date,
+            cfg,  # type: ignore[arg-type]
+            feature_frame_version=row.feature_frame_version,  # M1 — V1/V2 as configured
+        )
+        row.final_model_path = train.model_path
+        row.trained_model_type = model_type
+        winner_type = ranking.winner.model_type if ranking.winner else None
+        row.is_override = (model_type != winner_type) if winner_type is not None else True
+        row.override_reason = override_reason
+        await db.flush()
+
+        warning = self._override_warning(model_type, ranking) if row.is_override else None
+        logger.info(
+            "model_selection.winner_selected_override",
+            selection_id=row.selection_id,
+            model_type=model_type,
+            is_override=row.is_override,
+        )
+        return TrainWinnerResponse(
+            selection_id=row.selection_id,
+            model_type=model_type,
+            model_path=train.model_path,
+            is_override=row.is_override,
+            override_warning=warning,
+        )
+
+    async def predict_winner(
+        self,
+        db: AsyncSession,
+        selection_id: str,
+        lead_time_days: int,
+        service_level: float,
+    ) -> tuple[ForecastSummary, ForecastDecision | None]:
+        """Forecast with the trained model + compute the decision heuristic.
+
+        Returns a ``(forecast, decision)`` tuple — the ROUTE assembles the
+        ``PredictWinnerResponse``. ``decision`` (safety stock etc.) NEVER feeds
+        ranking. A feature-aware model 400s inside ``ForecastingService.predict``
+        (bubbles as ``ValueError`` → 400).
+        """
+        from app.features.forecasting.service import ForecastingService  # lazy
+
+        row = await self._load(db, selection_id)
+        if not row.final_model_path:
+            raise BadRequestError(
+                message="No trained model for this selection; call train-winner first."
+            )
+        prediction = await ForecastingService().predict(
+            row.store_id, row.product_id, row.forecast_horizon, row.final_model_path
+        )
+        summary = self._forecast_summary(prediction, row.forecast_horizon)
+        winner_bias: float | None = None
+        if row.winner_metrics is not None and row.winner_metrics.get("bias") is not None:
+            winner_bias = float(row.winner_metrics["bias"])
+        decision = compute_forecast_decision(
+            summary.points,
+            summary.average_demand,
+            lead_time_days,
+            service_level,
+            winner_bias,
+        )
+        row.forecast_result = summary.model_dump(mode="json")
+        await db.flush()
+        logger.info(
+            "model_selection.winner_predicted",
+            selection_id=row.selection_id,
+            horizon=row.forecast_horizon,
+            lead_time_days=lead_time_days,
+        )
+        return summary, decision
+
+    async def promote(
+        self, db: AsyncSession, selection_id: str, req: PromoteRequest
+    ) -> PromoteResponse:
+        """Approval-gated, audited promotion of a trained champion (Slice C).
+
+        Orchestrates the registry in ONE request transaction (create_run →
+        RUNNING → register artifact → SUCCESS → create_alias), then persists the
+        audit record on ``model_selection_run``. Promotion is NEVER automatic and
+        performs NO comparison.
+        """
+        from app.features.registry.schemas import (  # lazy
+            AliasCreate,
+            RunCreate,
+            RunStatus,
+            RunUpdate,
+        )
+        from app.features.registry.service import RegistryService  # lazy
+
+        row = await self._load(db, selection_id)
+        if not row.final_model_path or not row.trained_model_type:
+            raise UnprocessableEntityError(message="Train the model before promoting.")
+        if row.is_override and not req.acknowledge_non_recommended:
+            raise UnprocessableEntityError(
+                message=(
+                    "Promoting a non-recommended model requires acknowledge_non_recommended=true."
+                )
+            )
+
+        registry = RegistryService()
+        params = self._params_for_trained(row)
+        # ``RunCreate``/``RunUpdate`` use Pydantic ``Field(None, ...)`` defaults +
+        # the ``model_config`` alias; mypy's pydantic plugin resolves these but
+        # pyright (no plugin) cannot — mirror the established
+        # ``registry_tools.py`` suppression. ``model_config_data=`` is the field
+        # name (populate_by_name=True), NOT the ``model_config`` ConfigDict alias.
+        run = await registry.create_run(
+            db,
+            RunCreate(  # pyright: ignore[reportCallIssue]
+                model_type=row.trained_model_type,
+                model_config_data={  # pyright: ignore[reportCallIssue]
+                    "model_type": row.trained_model_type,
+                    **params,
+                },
+                data_window_start=row.start_date,
+                data_window_end=row.end_date,
+                store_id=row.store_id,
+                product_id=row.product_id,
+                runtime_info_extras={"feature_frame_version": row.feature_frame_version},
+            ),
+        )
+        await registry.update_run(
+            db,
+            run.run_id,
+            RunUpdate(status=RunStatus.RUNNING),  # pyright: ignore[reportCallIssue]
+        )
+        artifact_uri, artifact_hash, artifact_size = self._register_artifact(
+            row.final_model_path, run.run_id
+        )
+        await registry.update_run(
+            db,
+            run.run_id,
+            RunUpdate(  # pyright: ignore[reportCallIssue]
+                status=RunStatus.SUCCESS,
+                metrics=row.winner_metrics,
+                artifact_uri=artifact_uri,
+                artifact_hash=artifact_hash,
+                artifact_size_bytes=artifact_size,
+            ),
+        )
+        alias = await registry.create_alias(
+            db,
+            AliasCreate(alias_name=req.alias_name, run_id=run.run_id, description=req.description),
+        )
+
+        promoted_at = datetime.now(UTC)
+        row.champion_run_id = run.run_id
+        row.promoted_alias = alias.alias_name
+        row.promotion_decision = {
+            "decision_id": uuid.uuid4().hex,
+            "alias": alias.alias_name,
+            "champion_run_id": run.run_id,
+            "approved_by": req.approved_by,
+            "approved_at": promoted_at.isoformat(),
+            "decision": "promoted",
+            "reason": req.description,
+            "trained_model_type": row.trained_model_type,
+            "is_override": row.is_override,
+        }
+        await db.flush()
+        logger.info(
+            "model_selection.champion_promoted",
+            selection_id=row.selection_id,
+            alias=alias.alias_name,
+            run_id=run.run_id,
+            approved_by=req.approved_by,
+        )
+        return PromoteResponse(
+            selection_id=row.selection_id,
+            alias_name=alias.alias_name,
+            run_id=run.run_id,
+            run_status=alias.run_status.value,
+            model_type=row.trained_model_type,
+            is_override=row.is_override,
+            promoted_at=promoted_at,
+        )
+
+    # -------------------------------------------------------------------------
+    # Pure mappers
+    # -------------------------------------------------------------------------
+
+    def _shape_candidate(
+        self, candidate: CandidateModelConfig, backtest: BacktestResponse
+    ) -> CandidateResult:
+        main = backtest.main_model_results
+        sample_size = sum(len(fold.actuals) for fold in main.fold_results)
+        folds = [
+            FoldChart(
+                fold_index=fold.fold_index,
+                dates=fold.dates,
+                actuals=fold.actuals,
+                predictions=fold.predictions,
+            )
+            for fold in main.fold_results
+        ]
+        return CandidateResult(
+            model_type=candidate.model_type,
+            params=candidate.params,
+            failed=False,
+            aggregated_metrics=main.aggregated_metrics,
+            sample_size=sample_size,
+            config_hash=backtest.config_hash,
+            folds=folds,
+        )
+
+    def _shape_failed_candidate(
+        self, candidate: CandidateModelConfig, exc: Exception
+    ) -> CandidateResult:
+        return CandidateResult(
+            model_type=candidate.model_type,
+            params=candidate.params,
+            failed=True,
+            error=str(exc),
+            aggregated_metrics=None,
+            sample_size=0,
+            folds=[],
+        )
+
+    def _forecast_summary(self, prediction: PredictResponse, horizon: int) -> ForecastSummary:
+        points = [point.model_dump(mode="json") for point in prediction.forecasts]
+        total = float(sum(point.forecast for point in prediction.forecasts))
+        average = total / len(prediction.forecasts) if prediction.forecasts else 0.0
+        peak_date, peak_demand, low_date, low_demand = forecast_peak_low(points)
+        return ForecastSummary(
+            points=points,
+            total_demand=total,
+            average_demand=average,
+            horizon=horizon,
+            peak_date=peak_date,
+            peak_demand=peak_demand,
+            low_date=low_date,
+            low_demand=low_demand,
+        )
+
+    @staticmethod
+    def _params_for_trained_type(row: ModelSelectionRun, model_type: str) -> dict[str, Any]:
+        """Return the configured params for a candidate ``model_type`` (or {})."""
+        for candidate in row.candidate_models or []:
+            if candidate.get("model_type") == model_type:
+                params = candidate.get("params") or {}
+                return dict(params)
+        return {}
+
+    def _params_for_trained(self, row: ModelSelectionRun) -> dict[str, Any]:
+        """Return the params of the model actually trained on this run."""
+        if row.trained_model_type is None:
+            return {}
+        return self._params_for_trained_type(row, row.trained_model_type)
+
+    @staticmethod
+    def _override_warning(chosen_type: str, ranking: RankingResult) -> str:
+        """Deterministic warning copy when a non-recommended model is trained."""
+        winner = ranking.winner
+        if winner is None:
+            return f"You trained '{chosen_type}', but no model was recommended for this selection."
+        chosen_entry = next(
+            (e for e in ranking.entries if e.model_type == chosen_type and e.included),
+            None,
+        )
+        winner_wape = (winner.metrics or {}).get("wape")
+        if chosen_entry and chosen_entry.metrics and winner_wape is not None:
+            chosen_wape = chosen_entry.metrics.get("wape")
+            if chosen_wape is not None:
+                gap = chosen_wape - winner_wape
+                return (
+                    f"You trained '{chosen_type}' instead of the recommended "
+                    f"'{winner.model_type}'. Its backtest WAPE is {chosen_wape:.1f}% "
+                    f"vs the recommended {winner_wape:.1f}% "
+                    f"(a {gap:+.1f} percentage-point gap)."
+                )
+        return (
+            f"You trained '{chosen_type}' instead of the recommended "
+            f"'{winner.model_type}'. '{chosen_type}' was not successfully evaluated "
+            "in the backtest, so no WAPE comparison is available."
+        )
+
+    @staticmethod
+    def _register_artifact(final_model_path: str, run_id: str) -> tuple[str, str, int]:
+        """Copy the trained bundle into registry storage and return (uri, hash, size).
+
+        Mirrors the demo pipeline's register step (``demo/pipeline.py``): the
+        forecasting bundle lives under ``forecast_model_artifacts_dir``; copying
+        it into ``registry_artifact_root`` makes the promoted run's artifact
+        verifiable via ``GET /registry/runs/{id}/verify``.
+        """
+        from app.features.registry.storage import LocalFSProvider  # lazy
+
+        source = Path(final_model_path)
+        if not source.exists():
+            raise BadRequestError(message=f"Trained artifact missing at {final_model_path}")
+        artifact_uri = f"champion-selector/{run_id}-{source.name}"
+        file_hash, file_size = LocalFSProvider().save(source, artifact_uri)
+        return artifact_uri, file_hash, file_size
+
+    async def _load(self, db: AsyncSession, selection_id: str) -> ModelSelectionRun:
+        row = await db.scalar(
+            select(ModelSelectionRun).where(ModelSelectionRun.selection_id == selection_id)
+        )
+        if row is None:
+            raise NotFoundError(message=f"Selection run {selection_id} not found")
+        return row
+
+    def _load_ranking(self, row: ModelSelectionRun) -> RankingResult:
+        if row.ranking_result:
+            return RankingResult.model_validate(row.ranking_result)
+        return RankingResult(winner=None, entries=[], confidence="low", reasons=[])
+
+    def _response(
+        self, row: ModelSelectionRun, ranking: RankingResult
+    ) -> ModelSelectionRunResponse:
+        availability = (
+            PairAvailabilityResponse.model_validate(row.availability_snapshot)
+            if row.availability_snapshot
+            else None
+        )
+        chart_data = ChartData.model_validate(row.chart_data) if row.chart_data else None
+        forecast = (
+            ForecastSummary.model_validate(row.forecast_result) if row.forecast_result else None
+        )
+        winner: WinnerSummary | None = None
+        if ranking.winner is not None and row.status in _TERMINAL_WITH_WINNER:
+            winner = WinnerSummary(
+                model_type=ranking.winner.model_type,
+                params=ranking.winner.params,
+                metrics=ranking.winner.metrics or {},
+                rank=1,
+            )
+        confidence = ranking.confidence if (ranking.entries or ranking.winner) else None
+        final_model = {"model_path": row.final_model_path} if row.final_model_path else None
+        return ModelSelectionRunResponse(
+            selection_id=row.selection_id,
+            store_id=row.store_id,
+            product_id=row.product_id,
+            status=row.status,  # type: ignore[arg-type]
+            selection_window=SelectionWindow(start_date=row.start_date, end_date=row.end_date),
+            forecast_horizon=row.forecast_horizon,
+            ranking_metric=row.ranking_metric,
+            availability=availability,
+            ranking=ranking.entries,
+            winner=winner,
+            recommendation_confidence=confidence,
+            confidence_reasons=ranking.reasons,
+            chart_data=chart_data,
+            final_model=final_model,
+            forecast=forecast,
+            business_summary=row.business_summary,
+            error_message=row.error_message,
+            created_at=row.created_at,
+            started_at=row.started_at,
+            completed_at=row.completed_at,
+        )
diff --git a/app/features/model_selection/tests/__init__.py b/app/features/model_selection/tests/__init__.py
new file mode 100644
index 00000000..1dd09b80
--- /dev/null
+++ b/app/features/model_selection/tests/__init__.py
@@ -0,0 +1 @@
+"""Tests for the Forecast Champion Selector slice (issue #353)."""
diff --git a/app/features/model_selection/tests/conftest.py b/app/features/model_selection/tests/conftest.py
new file mode 100644
index 00000000..0a417631
--- /dev/null
+++ b/app/features/model_selection/tests/conftest.py
@@ -0,0 +1,331 @@
+"""Test fixtures + factories for the model_selection slice (issue #353).
+
+Unit helpers build ``CandidateResult`` / fake backtest+predict responses and a
+mock ``AsyncSession`` whose ``flush`` stamps ``created_at`` (so the response
+mapper, which reads it, works without a real DB). Integration fixtures
+(``@pytest.mark.integration``) seed a real ``docker compose`` Postgres and clean
+up after themselves with prefix-scoped teardown.
+"""
+
+from __future__ import annotations
+
+import uuid
+from collections.abc import AsyncGenerator
+from datetime import UTC, date, datetime, timedelta
+from decimal import Decimal
+from types import SimpleNamespace
+from typing import Any
+from unittest.mock import AsyncMock, MagicMock
+
+import pytest
+from httpx import ASGITransport, AsyncClient
+from sqlalchemy import delete, select
+from sqlalchemy.ext.asyncio import AsyncSession, async_sessionmaker, create_async_engine
+
+from app.core.config import get_settings
+from app.core.database import get_db
+from app.features.backtesting.schemas import SplitConfig
+from app.features.data_platform.models import Calendar, Product, SalesDaily, Store
+from app.features.model_selection.models import ModelSelectionRun
+from app.features.model_selection.schemas import (
+    CandidateResult,
+    FoldChart,
+    PairAvailabilityResponse,
+)
+from app.features.registry.models import DeploymentAlias, ModelRun
+from app.main import app
+
+# Integration test window.
+TEST_START = date(2024, 1, 1)
+# Largest ``n_days`` any seeding fixture below uses (``ready_pair`` = 120). The
+# teardown deletes Calendar over ``[TEST_START, TEST_START + _MAX_SEED_DAYS)``;
+# keep this >= the biggest ``_seed_pair`` call so no seeded calendar row leaks.
+_MAX_SEED_DAYS = 120
+
+
+# =============================================================================
+# Unit factories
+# =============================================================================
+
+
+def make_candidate_result(
+    model_type: str,
+    *,
+    wape: float = 20.0,
+    smape: float = 15.0,
+    mae: float = 5.0,
+    rmse: float = 6.0,
+    bias: float = 0.5,
+    sample_size: int = 28,
+    n_folds: int = 2,
+    points_per_fold: int = 14,
+    params: dict[str, Any] | None = None,
+    failed: bool = False,
+    error: str | None = None,
+    aggregated_metrics: dict[str, float] | None = None,
+) -> CandidateResult:
+    """Build a ``CandidateResult`` for ranking/chart unit tests."""
+    if failed:
+        return CandidateResult(
+            model_type=model_type,
+            params=params or {},
+            failed=True,
+            error=error or "boom",
+            aggregated_metrics=None,
+            sample_size=0,
+            folds=[],
+        )
+    folds = [
+        FoldChart(
+            fold_index=i,
+            dates=[
+                TEST_START + timedelta(days=i * points_per_fold + j) for j in range(points_per_fold)
+            ],
+            actuals=[10.0 + j for j in range(points_per_fold)],
+            predictions=[10.5 + j for j in range(points_per_fold)],
+        )
+        for i in range(n_folds)
+    ]
+    metrics = aggregated_metrics or {
+        "mae": mae,
+        "rmse": rmse,
+        "smape": smape,
+        "wape": wape,
+        "bias": bias,
+    }
+    return CandidateResult(
+        model_type=model_type,
+        params=params or {},
+        failed=False,
+        aggregated_metrics=metrics,
+        sample_size=sample_size,
+        config_hash="cafef00d",
+        folds=folds,
+    )
+
+
+def make_backtest_response(
+    *,
+    wape: float = 20.0,
+    smape: float = 15.0,
+    mae: float = 5.0,
+    rmse: float = 6.0,
+    bias: float = 0.5,
+    n_folds: int = 2,
+    points_per_fold: int = 14,
+) -> SimpleNamespace:
+    """A duck-typed stand-in for ``BacktestResponse`` (what _shape_candidate reads)."""
+    folds = [
+        SimpleNamespace(
+            fold_index=i,
+            dates=[
+                TEST_START + timedelta(days=i * points_per_fold + j) for j in range(points_per_fold)
+            ],
+            actuals=[10.0 + j for j in range(points_per_fold)],
+            predictions=[10.5 + j for j in range(points_per_fold)],
+        )
+        for i in range(n_folds)
+    ]
+    main = SimpleNamespace(
+        fold_results=folds,
+        aggregated_metrics={
+            "mae": mae,
+            "rmse": rmse,
+            "smape": smape,
+            "wape": wape,
+            "bias": bias,
+        },
+        metric_std={},
+    )
+    return SimpleNamespace(main_model_results=main, config_hash="bt00deadbeef", backtest_id="bt")
+
+
+def make_availability(
+    *,
+    status: str = "ready",
+    store_id: int = 1,
+    product_id: int = 1,
+    horizon: int = 14,
+) -> PairAvailabilityResponse:
+    """A ready/limited/unusable availability response for service unit tests."""
+    return PairAvailabilityResponse(
+        store_id=store_id,
+        product_id=product_id,
+        first_sales_date=TEST_START,
+        last_sales_date=TEST_START + timedelta(days=119),
+        observed_days=120,
+        expected_calendar_days=120,
+        coverage_ratio=1.0,
+        missing_days=0,
+        zero_sale_days=0,
+        promotion_days=0,
+        average_daily_demand=12.0,
+        status=status,  # type: ignore[arg-type]
+        recommended_split_config=SplitConfig(
+            strategy="expanding", n_splits=5, min_train_size=30, gap=0, horizon=horizon
+        ),
+        warnings=[],
+    )
+
+
+def make_mock_db() -> AsyncMock:
+    """Mock ``AsyncSession`` whose flush stamps ``created_at`` on added rows."""
+    db = AsyncMock()
+    added: list[Any] = []
+
+    def _add(obj: Any) -> None:
+        added.append(obj)
+
+    async def _flush() -> None:
+        for obj in added:
+            if isinstance(obj, ModelSelectionRun) and obj.created_at is None:
+                obj.created_at = datetime.now(UTC)
+
+    db.add = MagicMock(side_effect=_add)
+    db.flush = AsyncMock(side_effect=_flush)
+    db.refresh = AsyncMock()
+    return db
+
+
+# =============================================================================
+# Integration fixtures — real Postgres
+# =============================================================================
+
+
+@pytest.fixture
+async def db_session() -> AsyncGenerator[AsyncSession, None]:
+    """Yield an async session; wipe model_selection + test data on teardown."""
+    settings = get_settings()
+    engine = create_async_engine(settings.database_url, echo=False)
+    session_maker = async_sessionmaker(engine, class_=AsyncSession, expire_on_commit=False)
+
+    async with session_maker() as session:
+        try:
+            yield session
+        finally:
+            store_ids = _registered_store_ids()
+            if store_ids:
+                # Slice C — clean up registry runs/aliases a promote() created
+                # (cross-slice teardown). Delete aliases first (FK to
+                # model_run.id), then the runs, scoped to the seeded store ids.
+                run_id_rows = await session.execute(
+                    select(ModelRun.id).where(ModelRun.store_id.in_(store_ids))
+                )
+                run_ids = [r[0] for r in run_id_rows]
+                if run_ids:
+                    await session.execute(
+                        delete(DeploymentAlias).where(DeploymentAlias.run_id.in_(run_ids))
+                    )
+                    await session.execute(delete(ModelRun).where(ModelRun.id.in_(run_ids)))
+                await session.execute(
+                    delete(ModelSelectionRun).where(ModelSelectionRun.store_id.in_(store_ids))
+                )
+            await session.execute(
+                delete(SalesDaily).where(SalesDaily.unit_price == Decimal("3.33"))
+            )
+            await session.execute(delete(Product).where(Product.sku.like("TMSEL-%")))
+            await session.execute(delete(Store).where(Store.code.like("TMSEL-%")))
+            # Clean up the Calendar rows the fixtures seeded — leaving them
+            # orphaned poisons the shared integration DB: the seeder's
+            # calendar-seed step skips when the calendar is already non-empty,
+            # so downstream phase-2 enrichment (replenishment_event → calendar
+            # FK) fails on dates this partial calendar never covered. The
+            # seeded sales rows above are already gone, so this delete is
+            # FK-safe (scoped to exactly the dates _seed_pair creates).
+            await session.execute(
+                delete(Calendar).where(
+                    Calendar.date >= TEST_START,
+                    Calendar.date <= TEST_START + timedelta(days=_MAX_SEED_DAYS - 1),
+                )
+            )
+            await session.commit()
+
+    await engine.dispose()
+
+
+# Track store ids created by the seeding fixtures so teardown can scope the
+# model_selection_run cleanup precisely.
+_SEEDED_STORE_IDS: list[int] = []
+
+
+def _registered_store_ids() -> list[int]:
+    return list(_SEEDED_STORE_IDS)
+
+
+@pytest.fixture
+async def client(db_session: AsyncSession) -> AsyncGenerator[AsyncClient, None]:
+    """Test client with the database dependency overridden."""
+
+    async def override_get_db() -> AsyncGenerator[AsyncSession, None]:
+        yield db_session
+
+    app.dependency_overrides[get_db] = override_get_db
+    async with AsyncClient(transport=ASGITransport(app=app), base_url="http://test") as ac:
+        yield ac
+    app.dependency_overrides.pop(get_db, None)
+
+
+async def _seed_pair(db: AsyncSession, n_days: int) -> dict[str, Any]:
+    """Seed a store/product/calendar + a clean weekly sales series of n_days."""
+    suffix = uuid.uuid4().hex[:8]
+    store = Store(code=f"TMSEL-{suffix}", name="MSel Store", region="R", store_type="x")
+    product = Product(
+        sku=f"TMSEL-{suffix}",
+        name="MSel Product",
+        category="C",
+        base_price=Decimal("3.33"),
+        launch_date=TEST_START,
+    )
+    db.add_all([store, product])
+    await db.commit()
+    await db.refresh(store)
+    await db.refresh(product)
+    _SEEDED_STORE_IDS.append(store.id)
+
+    weekly = [10.0, 20.0, 30.0, 40.0, 50.0, 60.0, 70.0]
+    for i in range(n_days):
+        d = TEST_START + timedelta(days=i)
+        await db.merge(
+            Calendar(
+                date=d,
+                day_of_week=d.weekday(),
+                month=d.month,
+                quarter=(d.month - 1) // 3 + 1,
+                year=d.year,
+                is_holiday=False,
+            )
+        )
+    await db.commit()
+
+    for i in range(n_days):
+        qty = int(weekly[i % 7])
+        db.add(
+            SalesDaily(
+                date=TEST_START + timedelta(days=i),
+                store_id=store.id,
+                product_id=product.id,
+                quantity=qty,
+                unit_price=Decimal("3.33"),
+                total_amount=Decimal("3.33") * qty,
+            )
+        )
+    await db.commit()
+    return {
+        "store_id": store.id,
+        "product_id": product.id,
+        "start_date": TEST_START.isoformat(),
+        "end_date": (TEST_START + timedelta(days=n_days - 1)).isoformat(),
+        "n_days": n_days,
+    }
+
+
+@pytest.fixture
+async def ready_pair(db_session: AsyncSession) -> dict[str, Any]:
+    """A 120-day pair — ``ready`` for horizon=14, n_splits=5 (threshold 100)."""
+    return await _seed_pair(db_session, 120)
+
+
+@pytest.fixture
+async def limited_pair(db_session: AsyncSession) -> dict[str, Any]:
+    """A 50-day pair — ``limited`` (>= 44, < 100)."""
+    return await _seed_pair(db_session, 50)
diff --git a/app/features/model_selection/tests/test_async_routes.py b/app/features/model_selection/tests/test_async_routes.py
new file mode 100644
index 00000000..6d0f3532
--- /dev/null
+++ b/app/features/model_selection/tests/test_async_routes.py
@@ -0,0 +1,180 @@
+"""Unit route tests for the Slice B async endpoints (service mocked).
+
+Mirrors ``test_routes.py``: ``get_db`` overridden with a mock session, the
+service patched at the class level. Asserts the 202 shape + headers and the
+DELETE 404/409 mapping over the HTTP boundary.
+"""
+
+from __future__ import annotations
+
+from collections.abc import AsyncGenerator
+from contextlib import asynccontextmanager
+from datetime import UTC, datetime
+from typing import Any
+from unittest.mock import AsyncMock
+
+import pytest
+from httpx import ASGITransport, AsyncClient
+
+from app.core.database import get_db
+from app.core.exceptions import ConflictError, NotFoundError
+from app.features.model_selection.schemas import (
+    CandidateProgress,
+    ModelSelectionRunResponse,
+    SelectionProgress,
+    SelectionWindow,
+    SubmitRunResponse,
+)
+from app.features.model_selection.service import ModelSelectionService
+from app.main import app
+
+
+@asynccontextmanager
+async def _client() -> AsyncGenerator[AsyncClient, None]:
+    async def override_get_db() -> AsyncGenerator[AsyncMock, None]:
+        yield AsyncMock()
+
+    app.dependency_overrides[get_db] = override_get_db
+    try:
+        async with AsyncClient(transport=ASGITransport(app=app), base_url="http://test") as ac:
+            yield ac
+    finally:
+        app.dependency_overrides.pop(get_db, None)
+
+
+def _assert_problem_detail(body: dict[str, Any], expected_status: int) -> None:
+    for key in ("type", "title", "status", "detail"):
+        assert key in body, f"missing RFC 7807 field: {key}"
+    assert body["status"] == expected_status
+
+
+def _valid_run_body(**overrides: Any) -> dict[str, Any]:
+    body: dict[str, Any] = {
+        "store_id": 5,
+        "product_id": 8,
+        "selection_window": {"start_date": "2026-01-01", "end_date": "2026-05-31"},
+        "forecast_horizon": 14,
+        "split_config": {
+            "strategy": "expanding",
+            "n_splits": 5,
+            "min_train_size": 30,
+            "gap": 0,
+            "horizon": 14,
+        },
+        "candidate_models": [
+            {"model_type": "naive", "params": {}},
+            {"model_type": "seasonal_naive", "params": {"season_length": 7}},
+        ],
+    }
+    body.update(overrides)
+    return body
+
+
+def _running_submit_response(selection_id: str = "sel_async") -> SubmitRunResponse:
+    return SubmitRunResponse(
+        selection_id=selection_id,
+        store_id=5,
+        product_id=8,
+        status="running",
+        selection_window=SelectionWindow(start_date="2026-01-01", end_date="2026-05-31"),  # type: ignore[arg-type]
+        forecast_horizon=14,
+        ranking_metric="wape",
+        availability=None,
+        ranking=[],
+        winner=None,
+        recommendation_confidence=None,
+        confidence_reasons=[],
+        chart_data=None,
+        final_model=None,
+        forecast=None,
+        business_summary=None,
+        error_message=None,
+        created_at=datetime.now(UTC),
+        started_at=datetime.now(UTC),
+        completed_at=None,
+        progress=SelectionProgress(
+            total=2, pending=2, running=0, completed=0, failed=0, cancelled=0
+        ),
+        candidate_progress=[
+            CandidateProgress(candidate_id="c0", ordinal=0, model_type="naive", status="pending"),
+            CandidateProgress(
+                candidate_id="c1", ordinal=1, model_type="seasonal_naive", status="pending"
+            ),
+        ],
+        monitor_url=f"/model-selection/{selection_id}",
+        cancel_url=f"/model-selection/{selection_id}",
+    )
+
+
+async def test_submit_runs_returns_202_with_headers_and_running_body(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    monkeypatch.setattr(
+        ModelSelectionService,
+        "submit_run",
+        AsyncMock(return_value=_running_submit_response()),
+    )
+    async with _client() as ac:
+        response = await ac.post("/model-selection/runs", json=_valid_run_body())
+    assert response.status_code == 202
+    body = response.json()
+    assert body["status"] == "running"
+    assert body["monitor_url"] == "/model-selection/sel_async"
+    assert body["cancel_url"] == "/model-selection/sel_async"
+    assert body["progress"]["pending"] == 2
+    assert len(body["candidate_progress"]) == 2
+    # LRO status-monitor headers.
+    assert response.headers.get("location") == "/model-selection/sel_async"
+    assert response.headers.get("retry-after") == "2"
+
+
+async def test_submit_runs_validation_error_returns_problem_json() -> None:
+    """A horizon mismatch is rejected by the request validator (422)."""
+    bad = _valid_run_body(forecast_horizon=14)
+    bad["split_config"] = {
+        "strategy": "expanding",
+        "n_splits": 5,
+        "min_train_size": 30,
+        "gap": 0,
+        "horizon": 7,
+    }
+    async with _client() as ac:
+        response = await ac.post("/model-selection/runs", json=bad)
+    assert response.status_code == 422
+    _assert_problem_detail(response.json(), 422)
+
+
+async def test_delete_run_404_when_missing(monkeypatch: pytest.MonkeyPatch) -> None:
+    monkeypatch.setattr(
+        ModelSelectionService,
+        "cancel_run",
+        AsyncMock(side_effect=NotFoundError(message="Selection run missing not found")),
+    )
+    async with _client() as ac:
+        response = await ac.delete("/model-selection/missing")
+    assert response.status_code == 404
+    _assert_problem_detail(response.json(), 404)
+
+
+async def test_delete_run_409_when_terminal(monkeypatch: pytest.MonkeyPatch) -> None:
+    monkeypatch.setattr(
+        ModelSelectionService,
+        "cancel_run",
+        AsyncMock(side_effect=ConflictError(message="Selection run already terminal: completed")),
+    )
+    async with _client() as ac:
+        response = await ac.delete("/model-selection/sel_done")
+    assert response.status_code == 409
+    _assert_problem_detail(response.json(), 409)
+
+
+async def test_delete_run_returns_settled_200(monkeypatch: pytest.MonkeyPatch) -> None:
+    settled = _running_submit_response("sel_cancel")
+    settled_resp = ModelSelectionRunResponse.model_validate(
+        {**settled.model_dump(), "status": "cancelled"}
+    )
+    monkeypatch.setattr(ModelSelectionService, "cancel_run", AsyncMock(return_value=settled_resp))
+    async with _client() as ac:
+        response = await ac.delete("/model-selection/sel_cancel")
+    assert response.status_code == 200
+    assert response.json()["status"] == "cancelled"
diff --git a/app/features/model_selection/tests/test_capabilities.py b/app/features/model_selection/tests/test_capabilities.py
new file mode 100644
index 00000000..3ff73804
--- /dev/null
+++ b/app/features/model_selection/tests/test_capabilities.py
@@ -0,0 +1,102 @@
+"""Unit tests for the pure model-capability catalog (issue #356, Slice A).
+
+No DB, no I/O — exercises ``build_model_catalog`` directly, mirroring
+``test_ranking.py``. These pin the BACKEND-OWNED capability contract the
+frontend consumes read-only.
+"""
+
+from __future__ import annotations
+
+import typing
+
+from app.features.model_selection.capabilities import (
+    DEFAULT_CANDIDATE_MODEL_TYPES,
+    build_model_catalog,
+)
+from app.features.model_selection.schemas import ModelType
+
+_EXPECTED_MODEL_TYPES = set(typing.get_args(ModelType))
+
+
+def test_catalog_model_types_match_literal() -> None:
+    """The catalog covers EXACTLY the ``ModelType`` Literal — no drift."""
+    catalog = build_model_catalog()
+    catalog_types = {m.model_type for m in catalog.models}
+    assert catalog_types == _EXPECTED_MODEL_TYPES
+    # 11 models, no duplicates.
+    assert len(catalog.models) == len(_EXPECTED_MODEL_TYPES) == 11
+
+
+def test_catalog_families_are_valid_literals() -> None:
+    """Every family is one of the three lowercase literals from forecasting."""
+    catalog = build_model_catalog()
+    for model in catalog.models:
+        assert model.family in {"baseline", "tree", "additive"}
+
+
+def test_requires_extra_flags_lightgbm_xgboost_only() -> None:
+    """Only the opt-in extras (lightgbm/xgboost) carry requires_extra=True."""
+    catalog = build_model_catalog()
+    extras = {m.model_type for m in catalog.models if m.requires_extra}
+    assert extras == {"lightgbm", "xgboost"}
+
+
+def test_feature_aware_set_matches_predict_reject_set() -> None:
+    """feature_aware == the forecasters with requires_features=True."""
+    catalog = build_model_catalog()
+    feature_aware = {m.model_type for m in catalog.models if m.feature_aware}
+    assert feature_aware == {
+        "regression",
+        "prophet_like",
+        "lightgbm",
+        "xgboost",
+        "random_forest",
+    }
+
+
+def test_feature_aware_models_do_not_support_auto_predict() -> None:
+    """supports_auto_predict is the strict negation of feature_aware."""
+    catalog = build_model_catalog()
+    for model in catalog.models:
+        assert model.supports_auto_predict == (not model.feature_aware)
+
+
+def test_default_candidate_model_types_are_the_default_five() -> None:
+    """The pre-selected defaults match the backend /run contract example."""
+    catalog = build_model_catalog()
+    assert catalog.default_candidate_model_types == [
+        "naive",
+        "seasonal_naive",
+        "moving_average",
+        "regression",
+        "prophet_like",
+    ]
+    # The exported constant and the response agree.
+    assert DEFAULT_CANDIDATE_MODEL_TYPES == catalog.default_candidate_model_types
+    # Every default is a real catalog entry.
+    catalog_types = {m.model_type for m in catalog.models}
+    assert set(catalog.default_candidate_model_types) <= catalog_types
+
+
+def test_default_params_match_forecasting_defaults() -> None:
+    """default_params are pinned to the live forecasting ModelConfig defaults."""
+    by_type = {m.model_type: m.default_params for m in build_model_catalog().models}
+    assert by_type["naive"] == {}
+    assert by_type["seasonal_naive"] == {"season_length": 7}
+    assert by_type["moving_average"] == {"window_size": 7}
+    assert by_type["regression"] == {
+        "max_iter": 200,
+        "learning_rate": 0.05,
+        "max_depth": 6,
+    }
+    # No internal/meta fields leak into the catalog.
+    for params in by_type.values():
+        assert "schema_version" not in params
+        assert "feature_config_hash" not in params
+
+
+def test_labels_and_descriptions_are_non_empty() -> None:
+    """Each entry carries human-facing label + description copy."""
+    for model in build_model_catalog().models:
+        assert model.label.strip()
+        assert model.description.strip()
diff --git a/app/features/model_selection/tests/test_decision.py b/app/features/model_selection/tests/test_decision.py
new file mode 100644
index 00000000..f1ab66b2
--- /dev/null
+++ b/app/features/model_selection/tests/test_decision.py
@@ -0,0 +1,155 @@
+"""Unit tests for the pure forecast-decision module (Slice C).
+
+``decision.py`` has NO DB/IO — every function is deterministic and tested here
+directly (z-table, safety-stock formula, peak/low, bias wording).
+"""
+
+from __future__ import annotations
+
+import statistics
+from datetime import date
+
+import pytest
+
+from app.features.model_selection.decision import (
+    BIAS_EXPLANATION,
+    compute_forecast_decision,
+    forecast_peak_low,
+    z_for_service_level,
+)
+
+
+def _points(values: list[float], start: date = date(2026, 1, 1)) -> list[dict[str, object]]:
+    """Build forecast points (JSON-mode shape: ISO date string + forecast)."""
+    return [
+        {
+            "date": (start.fromordinal(start.toordinal() + i)).isoformat(),
+            "forecast": v,
+            "lower_bound": None,
+            "upper_bound": None,
+        }
+        for i, v in enumerate(values)
+    ]
+
+
+# -----------------------------------------------------------------------------
+# z-table
+# -----------------------------------------------------------------------------
+
+
+@pytest.mark.parametrize(
+    ("service_level", "expected_z"),
+    [(0.90, 1.2816), (0.95, 1.6449), (0.975, 1.9600), (0.99, 2.3263)],
+)
+def test_decision_z_table_exact(service_level: float, expected_z: float) -> None:
+    assert z_for_service_level(service_level) == expected_z
+
+
+@pytest.mark.parametrize(
+    ("service_level", "expected_z"),
+    [(0.92, 1.2816), (0.93, 1.6449), (0.96, 1.6449), (0.98, 1.9600)],
+)
+def test_decision_z_table_nearest(service_level: float, expected_z: float) -> None:
+    """In-between service levels snap to the nearest table key."""
+    assert z_for_service_level(service_level) == expected_z
+
+
+# -----------------------------------------------------------------------------
+# Safety stock
+# -----------------------------------------------------------------------------
+
+
+def test_safety_stock_formula_matches_z_sigma_sqrt_l() -> None:
+    values = [10.0, 12.0, 8.0, 11.0, 9.0]
+    decision = compute_forecast_decision(
+        _points(values), average_demand=10.0, lead_time_days=7, service_level=0.95, winner_bias=0.5
+    )
+    sigma = statistics.pstdev(values)
+    expected_ss = 1.6449 * sigma * (7**0.5)
+    assert decision.method == "heuristic"
+    assert decision.z_value == 1.6449
+    assert decision.sigma_daily_demand == pytest.approx(sigma)
+    assert decision.safety_stock == pytest.approx(expected_ss)
+    assert decision.expected_demand_over_lead_time == pytest.approx(70.0)
+    assert decision.reorder_point == pytest.approx(70.0 + expected_ss)
+    assert decision.caveats  # always carries a caveat
+
+
+def test_flat_forecast_safety_stock_zero() -> None:
+    """A flat (zero-variance) forecast → sigma 0 → safety stock 0 (honest)."""
+    decision = compute_forecast_decision(
+        _points([10.0, 10.0, 10.0]),
+        average_demand=10.0,
+        lead_time_days=7,
+        service_level=0.95,
+        winner_bias=0.0,
+    )
+    assert decision.sigma_daily_demand == 0.0
+    assert decision.safety_stock == 0.0
+
+
+def test_single_point_forecast_safety_stock_zero() -> None:
+    decision = compute_forecast_decision(
+        _points([42.0]),
+        average_demand=42.0,
+        lead_time_days=3,
+        service_level=0.95,
+        winner_bias=None,
+    )
+    assert decision.sigma_daily_demand == 0.0
+    assert decision.safety_stock == 0.0
+
+
+# -----------------------------------------------------------------------------
+# Peak / low
+# -----------------------------------------------------------------------------
+
+
+def test_forecast_peak_low_picks_max_and_min() -> None:
+    points = _points([10.0, 25.0, 5.0, 18.0])
+    peak_date, peak_demand, low_date, low_demand = forecast_peak_low(points)
+    assert peak_demand == 25.0
+    assert low_demand == 5.0
+    assert peak_date == date(2026, 1, 2)
+    assert low_date == date(2026, 1, 3)
+
+
+def test_forecast_peak_low_empty_returns_none() -> None:
+    assert forecast_peak_low([]) == (None, None, None, None)
+
+
+# -----------------------------------------------------------------------------
+# Bias wording (LOCKED #4 — reuses BIAS_EXPLANATION)
+# -----------------------------------------------------------------------------
+
+
+@pytest.mark.parametrize(
+    ("bias", "fragment"),
+    [
+        (1.5, "under-forecasts (risk of stockouts)"),
+        (-1.5, "over-forecasts (risk of overstock)"),
+        (0.0, "roughly unbiased"),
+    ],
+)
+def test_bias_risk_text_under_over_neutral(bias: float, fragment: str) -> None:
+    decision = compute_forecast_decision(
+        _points([10.0, 12.0]),
+        average_demand=11.0,
+        lead_time_days=7,
+        service_level=0.95,
+        winner_bias=bias,
+    )
+    assert BIAS_EXPLANATION in decision.bias_risk_text
+    assert fragment in decision.bias_risk_text
+
+
+def test_bias_risk_text_handles_missing_bias() -> None:
+    decision = compute_forecast_decision(
+        _points([10.0, 12.0]),
+        average_demand=11.0,
+        lead_time_days=7,
+        service_level=0.95,
+        winner_bias=None,
+    )
+    assert BIAS_EXPLANATION in decision.bias_risk_text
+    assert "no recorded bias" in decision.bias_risk_text
diff --git a/app/features/model_selection/tests/test_explanations.py b/app/features/model_selection/tests/test_explanations.py
new file mode 100644
index 00000000..040b8aa3
--- /dev/null
+++ b/app/features/model_selection/tests/test_explanations.py
@@ -0,0 +1,44 @@
+"""Unit tests for the deterministic business-explanation layer."""
+
+from __future__ import annotations
+
+from app.features.model_selection.explanations import explain_winner
+from app.features.model_selection.ranking import rank_candidates
+from app.features.model_selection.schemas import RankingPolicy
+from app.features.model_selection.tests.conftest import make_availability, make_candidate_result
+
+
+def test_explain_winner_produces_deterministic_summary() -> None:
+    results = [
+        make_candidate_result("winner", wape=10.0),
+        make_candidate_result("second", wape=20.0),
+    ]
+    ranking = rank_candidates(results, RankingPolicy(), "wape", availability_status="ready")
+    summary = explain_winner(ranking, make_availability(status="ready"))
+
+    assert "winner" in summary["headline"]
+    assert summary["winner"]["model_type"] == "winner"
+    assert summary["recommendation_confidence"] == ranking.confidence
+    assert summary["confidence_reasons"] == ranking.reasons
+    assert summary["comparison"]["runner_up_model_type"] == "second"
+    assert any("coverage" in note.lower() for note in summary["data_notes"])
+    assert summary["caveats"]
+
+
+def test_explain_winner_is_deterministic() -> None:
+    """Same input → byte-identical output (no LLM, no randomness)."""
+    results = [
+        make_candidate_result("winner", wape=10.0),
+        make_candidate_result("second", wape=20.0),
+    ]
+    ranking = rank_candidates(results, RankingPolicy(), "wape", availability_status="ready")
+    availability = make_availability(status="ready")
+    assert explain_winner(ranking, availability) == explain_winner(ranking, availability)
+
+
+def test_explain_winner_handles_no_winner() -> None:
+    results = [make_candidate_result("x", failed=True, error="boom")]
+    ranking = rank_candidates(results, RankingPolicy(), "wape")
+    summary = explain_winner(ranking, make_availability(status="limited"))
+    assert summary["winner"] is None
+    assert "No model" in summary["headline"]
diff --git a/app/features/model_selection/tests/test_models.py b/app/features/model_selection/tests/test_models.py
new file mode 100644
index 00000000..589d7630
--- /dev/null
+++ b/app/features/model_selection/tests/test_models.py
@@ -0,0 +1,115 @@
+"""Tests for the ModelSelectionRun ORM model + status enum.
+
+The status CHECK-constraint enforcement is exercised in the integration suite
+(it requires the real Postgres CHECK); here we cover the enum values and the
+in-Python ORM construction.
+"""
+
+from __future__ import annotations
+
+from datetime import date
+
+from app.features.model_selection.models import (
+    TERMINAL_SELECTION_STATES,
+    CandidateStatus,
+    ModelSelectionCandidate,
+    ModelSelectionRun,
+    ModelSelectionStatus,
+)
+
+
+def test_status_enum_values() -> None:
+    assert {s.value for s in ModelSelectionStatus} == {
+        "pending",
+        "running",
+        "completed",
+        "partial",
+        "failed",
+        "cancelled",
+    }
+
+
+def test_candidate_status_enum_values() -> None:
+    assert {s.value for s in CandidateStatus} == {
+        "pending",
+        "running",
+        "completed",
+        "failed",
+        "cancelled",
+    }
+
+
+def test_terminal_selection_states() -> None:
+    assert TERMINAL_SELECTION_STATES == {"completed", "partial", "failed", "cancelled"}
+    assert "running" not in TERMINAL_SELECTION_STATES
+    assert "pending" not in TERMINAL_SELECTION_STATES
+
+
+def test_model_selection_run_construction_defaults() -> None:
+    row = ModelSelectionRun(
+        selection_id="abc123",
+        store_id=1,
+        product_id=2,
+        start_date=date(2026, 1, 1),
+        end_date=date(2026, 5, 31),
+        forecast_horizon=14,
+        ranking_metric="wape",
+        status=ModelSelectionStatus.RUNNING.value,
+        candidate_models=[{"model_type": "naive", "params": {}}],
+        policy_snapshot={"minimum_sample_size": 0},
+    )
+    assert row.selection_id == "abc123"
+    assert row.status == "running"
+    assert row.winner_model_type is None
+    assert row.final_model_path is None
+
+
+def test_model_selection_candidate_construction() -> None:
+    cand = ModelSelectionCandidate(
+        candidate_id="cand1",
+        selection_id="abc123",
+        ordinal=0,
+        model_type="naive",
+        params={},
+        status=CandidateStatus.PENDING.value,
+    )
+    assert cand.candidate_id == "cand1"
+    assert cand.selection_id == "abc123"
+    assert cand.status == "pending"
+    assert cand.result is None
+    assert cand.error_message is None
+
+
+# =============================================================================
+# Slice C — decision + promotion columns (in-Python construction)
+# =============================================================================
+
+
+def test_model_selection_run_slice_c_columns_construct() -> None:
+    run = ModelSelectionRun(
+        selection_id="selC",
+        status=ModelSelectionStatus.COMPLETED.value,
+        store_id=3,
+        product_id=8,
+        start_date=date(2026, 1, 1),
+        end_date=date(2026, 5, 31),
+        forecast_horizon=14,
+        ranking_metric="wape",
+        candidate_models=[{"model_type": "naive", "params": {}}],
+        policy_snapshot={},
+        trained_model_type="naive",
+        is_override=True,
+        override_reason="domain seasonality",
+        champion_run_id="run_abc123",
+        promoted_alias="champion-test",
+        promotion_decision={"decision": "promoted", "approved_by": "gabor"},
+        feature_frame_version=2,
+    )
+    assert run.trained_model_type == "naive"
+    assert run.is_override is True
+    assert run.override_reason == "domain seasonality"
+    assert run.champion_run_id == "run_abc123"
+    assert run.promoted_alias == "champion-test"
+    assert run.promotion_decision is not None
+    assert run.promotion_decision["approved_by"] == "gabor"
+    assert run.feature_frame_version == 2
diff --git a/app/features/model_selection/tests/test_ranking.py b/app/features/model_selection/tests/test_ranking.py
new file mode 100644
index 00000000..3c01b25a
--- /dev/null
+++ b/app/features/model_selection/tests/test_ranking.py
@@ -0,0 +1,205 @@
+"""Unit tests for the pure ranking + chart logic."""
+
+from __future__ import annotations
+
+import math
+
+from app.features.model_selection.ranking import (
+    build_chart_data,
+    normalize_metrics,
+    rank_candidates,
+)
+from app.features.model_selection.schemas import RankingPolicy
+from app.features.model_selection.tests.conftest import make_candidate_result
+
+
+def test_rank_candidates_wape_smape_abs_bias_mae_tie_break() -> None:
+    """Default sort key is (wape, smape, abs(bias), mae, model_type) (LOCKED #6)."""
+    # Same wape; B wins on smape; C loses smape but would win mae (irrelevant).
+    results = [
+        make_candidate_result("a_model", wape=10.0, smape=20.0, bias=1.0, mae=9.0),
+        make_candidate_result("b_model", wape=10.0, smape=15.0, bias=5.0, mae=8.0),
+        make_candidate_result("c_model", wape=10.0, smape=18.0, bias=0.0, mae=1.0),
+    ]
+    ranking = rank_candidates(results, RankingPolicy(), "wape")
+    order = [e.model_type for e in ranking.entries if e.included]
+    assert order == ["b_model", "c_model", "a_model"]
+    assert ranking.winner is not None
+    assert ranking.winner.model_type == "b_model"
+    assert ranking.winner.rank == 1
+
+
+def test_rank_candidates_model_type_breaks_full_tie() -> None:
+    """Identical metrics fall back to model_type alphabetical for determinism."""
+    results = [
+        make_candidate_result("zeta", wape=5.0, smape=5.0, bias=0.0, mae=1.0),
+        make_candidate_result("alpha", wape=5.0, smape=5.0, bias=0.0, mae=1.0),
+    ]
+    ranking = rank_candidates(results, RankingPolicy(), "wape")
+    assert ranking.winner is not None
+    assert ranking.winner.model_type == "alpha"
+
+
+def test_rank_candidates_non_default_metric_puts_it_first() -> None:
+    """ranking_metric='mae' ranks by mae first."""
+    results = [
+        make_candidate_result("high_wape_low_mae", wape=50.0, mae=1.0),
+        make_candidate_result("low_wape_high_mae", wape=5.0, mae=99.0),
+    ]
+    ranking = rank_candidates(results, RankingPolicy(), "mae")
+    assert ranking.winner is not None
+    assert ranking.winner.model_type == "high_wape_low_mae"
+
+
+def test_rank_candidates_excludes_missing_or_nan_metrics() -> None:
+    """A NaN/None primary metric drops the candidate to an excluded entry."""
+    good = make_candidate_result("good", wape=10.0)
+    nan_metrics = make_candidate_result("nan_model", wape=float("nan"))
+    no_metrics = make_candidate_result("no_metrics", failed=False)
+    no_metrics.aggregated_metrics = None
+    ranking = rank_candidates([good, nan_metrics, no_metrics], RankingPolicy(), "wape")
+
+    assert ranking.winner is not None
+    assert ranking.winner.model_type == "good"
+    excluded = {e.model_type: e for e in ranking.entries if not e.included}
+    assert set(excluded) == {"nan_model", "no_metrics"}
+    assert excluded["nan_model"].rank is None
+    assert excluded["nan_model"].exclusion_reason is not None
+
+
+def test_rank_candidates_normalizes_five_metric_keys_including_rmse() -> None:
+    """normalize_metrics carries all five keys incl. rmse; entries echo them."""
+    metrics = normalize_metrics(
+        {"mae": 1.0, "rmse": 2.0, "smape": 3.0, "wape": 4.0, "bias": 5.0}, sample_size=20
+    )
+    assert metrics is not None
+    assert metrics.rmse == 2.0
+    as_dict = metrics.as_dict()
+    assert set(as_dict) == {"wape", "smape", "mae", "rmse", "bias", "sample_size"}
+
+    ranking = rank_candidates([make_candidate_result("m", rmse=7.5)], RankingPolicy(), "wape")
+    assert ranking.entries[0].metrics is not None
+    assert ranking.entries[0].metrics["rmse"] == 7.5
+
+
+def test_normalize_metrics_rejects_inf_wape() -> None:
+    """An inf WAPE (all-zero actuals) is unrankable."""
+    assert (
+        normalize_metrics(
+            {"mae": 1.0, "rmse": 2.0, "smape": 3.0, "wape": math.inf, "bias": 0.0}, 10
+        )
+        is None
+    )
+
+
+def test_rank_candidates_excludes_below_minimum_sample_size() -> None:
+    """A candidate below the policy sample floor is excluded."""
+    results = [
+        make_candidate_result("ok", wape=10.0, sample_size=40),
+        make_candidate_result("tiny", wape=1.0, sample_size=5),
+    ]
+    ranking = rank_candidates(results, RankingPolicy(minimum_sample_size=30), "wape")
+    assert ranking.winner is not None
+    assert ranking.winner.model_type == "ok"
+    excluded = [e for e in ranking.entries if not e.included]
+    assert excluded[0].model_type == "tiny"
+
+
+def test_confidence_high_when_winner_beats_second_by_10_percent() -> None:
+    """A >=10% relative WAPE lead with acceptable bias yields HIGH confidence."""
+    results = [
+        make_candidate_result("winner", wape=10.0, bias=0.1),
+        make_candidate_result("second", wape=20.0, bias=0.1),
+    ]
+    ranking = rank_candidates(results, RankingPolicy(), "wape", availability_status="ready")
+    assert ranking.winner is not None
+    assert ranking.winner.model_type == "winner"
+    assert ranking.confidence == "high"
+
+
+def test_confidence_low_for_single_valid_candidate() -> None:
+    ranking = rank_candidates([make_candidate_result("solo", wape=10.0)], RankingPolicy(), "wape")
+    assert ranking.confidence == "low"
+
+
+def test_confidence_low_for_near_tie() -> None:
+    """A sub-epsilon lead is a near tie → LOW."""
+    results = [
+        make_candidate_result("a", wape=10.0),
+        make_candidate_result("b", wape=10.05),
+    ]
+    ranking = rank_candidates(results, RankingPolicy(), "wape", availability_status="ready")
+    assert ranking.confidence == "low"
+
+
+def test_confidence_medium_when_lead_below_high_threshold() -> None:
+    """A 5% lead (between epsilon and 10%) is MEDIUM."""
+    results = [
+        make_candidate_result("a", wape=9.5),
+        make_candidate_result("b", wape=10.0),
+    ]
+    ranking = rank_candidates(results, RankingPolicy(), "wape", availability_status="ready")
+    assert ranking.confidence == "medium"
+
+
+def test_confidence_low_when_availability_limited() -> None:
+    """Limited availability caps confidence at LOW even with a clear lead."""
+    results = [
+        make_candidate_result("winner", wape=10.0),
+        make_candidate_result("second", wape=20.0),
+    ]
+    ranking = rank_candidates(results, RankingPolicy(), "wape", availability_status="limited")
+    assert ranking.confidence == "low"
+
+
+def test_confidence_low_when_bias_over_threshold() -> None:
+    """A winner bias above the policy bound caps confidence at LOW."""
+    results = [
+        make_candidate_result("winner", wape=10.0, bias=50.0),
+        make_candidate_result("second", wape=20.0, bias=0.0),
+    ]
+    ranking = rank_candidates(
+        results, RankingPolicy(max_acceptable_abs_bias=1.0), "wape", availability_status="ready"
+    )
+    assert ranking.confidence == "low"
+
+
+def test_all_failed_candidates_yield_no_winner() -> None:
+    results = [
+        make_candidate_result("x", failed=True, error="train error"),
+        make_candidate_result("y", failed=True, error="value error"),
+    ]
+    ranking = rank_candidates(results, RankingPolicy(), "wape")
+    assert ranking.winner is None
+    assert ranking.confidence == "low"
+    assert all(not e.included for e in ranking.entries)
+
+
+def test_winner_entry_carries_params_for_rebuild() -> None:
+    """The winner entry preserves the original candidate params."""
+    results = [
+        make_candidate_result("seasonal_naive", wape=10.0, params={"season_length": 7}),
+        make_candidate_result("naive", wape=20.0, params={}),
+    ]
+    ranking = rank_candidates(results, RankingPolicy(), "wape")
+    assert ranking.winner is not None
+    assert ranking.winner.model_type == "seasonal_naive"
+    assert ranking.winner.params == {"season_length": 7}
+
+
+def test_chart_data_has_wape_bias_fold_stability_and_winner_actual_vs_predicted() -> None:
+    """build_chart_data populates all four chart series."""
+    results = [
+        make_candidate_result("winner", wape=10.0, n_folds=3),
+        make_candidate_result("second", wape=20.0, n_folds=3),
+    ]
+    ranking = rank_candidates(results, RankingPolicy(), "wape")
+    chart = build_chart_data(results, ranking)
+
+    assert set(chart.wape_by_model) == {"winner", "second"}
+    assert chart.wape_by_model["winner"] == 10.0
+    assert set(chart.bias_by_model) == {"winner", "second"}
+    assert len(chart.fold_stability["winner"]) == 3
+    assert all(isinstance(v, float) for v in chart.fold_stability["winner"])
+    assert len(chart.winner_actual_vs_predicted) == 3
+    assert chart.winner_actual_vs_predicted[0].actuals
diff --git a/app/features/model_selection/tests/test_routes.py b/app/features/model_selection/tests/test_routes.py
new file mode 100644
index 00000000..6193012d
--- /dev/null
+++ b/app/features/model_selection/tests/test_routes.py
@@ -0,0 +1,407 @@
+"""Unit route tests — service methods mocked, exercised over the HTTP boundary.
+
+``get_db`` is overridden with a mock session; the service is patched at the
+class level so the routes are tested in isolation. Error paths assert the
+RFC 7807 problem-detail shape.
+"""
+
+from __future__ import annotations
+
+from collections.abc import AsyncGenerator
+from contextlib import asynccontextmanager
+from datetime import UTC, date, datetime
+from typing import Any
+from unittest.mock import AsyncMock
+
+import pytest
+from httpx import ASGITransport, AsyncClient
+
+from app.core.database import get_db
+from app.core.exceptions import BadRequestError, NotFoundError
+from app.features.model_selection.schemas import (
+    ModelRankEntry,
+    ModelSelectionRunResponse,
+    SelectionWindow,
+    WinnerSummary,
+)
+from app.features.model_selection.service import ModelSelectionService
+from app.main import app
+
+
+@asynccontextmanager
+async def _client() -> AsyncGenerator[AsyncClient, None]:
+    async def override_get_db() -> AsyncGenerator[AsyncMock, None]:
+        yield AsyncMock()
+
+    app.dependency_overrides[get_db] = override_get_db
+    try:
+        async with AsyncClient(transport=ASGITransport(app=app), base_url="http://test") as ac:
+            yield ac
+    finally:
+        app.dependency_overrides.pop(get_db, None)
+
+
+def _assert_problem_detail(body: dict[str, Any], expected_status: int) -> None:
+    for key in ("type", "title", "status", "detail"):
+        assert key in body, f"missing RFC 7807 field: {key}"
+    assert body["status"] == expected_status
+
+
+def _run_response() -> ModelSelectionRunResponse:
+    metrics = {
+        "wape": 10.0,
+        "smape": 8.0,
+        "mae": 4.0,
+        "rmse": 5.0,
+        "bias": 0.1,
+        "sample_size": 28.0,
+    }
+    return ModelSelectionRunResponse(
+        selection_id="sel123",
+        store_id=1,
+        product_id=1,
+        status="completed",
+        selection_window=SelectionWindow(start_date=date(2026, 1, 1), end_date=date(2026, 5, 31)),
+        forecast_horizon=14,
+        ranking_metric="wape",
+        availability=None,
+        ranking=[
+            ModelRankEntry(rank=1, model_type="naive", params={}, included=True, metrics=metrics)
+        ],
+        winner=WinnerSummary(model_type="naive", params={}, metrics=metrics, rank=1),
+        recommendation_confidence="high",
+        confidence_reasons=["clear lead"],
+        chart_data=None,
+        final_model=None,
+        forecast=None,
+        business_summary=None,
+        error_message=None,
+        created_at=datetime.now(UTC),
+        completed_at=None,
+    )
+
+
+def _valid_run_body(**overrides: Any) -> dict[str, Any]:
+    body: dict[str, Any] = {
+        "store_id": 1,
+        "product_id": 1,
+        "selection_window": {"start_date": "2026-01-01", "end_date": "2026-05-31"},
+        "forecast_horizon": 14,
+        "split_config": {
+            "strategy": "expanding",
+            "n_splits": 5,
+            "min_train_size": 30,
+            "gap": 0,
+            "horizon": 14,
+        },
+        "candidate_models": [{"model_type": "naive", "params": {}}],
+    }
+    body.update(overrides)
+    return body
+
+
+async def test_run_returns_200(monkeypatch: pytest.MonkeyPatch) -> None:
+    monkeypatch.setattr(
+        ModelSelectionService, "run_selection", AsyncMock(return_value=_run_response())
+    )
+    async with _client() as ac:
+        response = await ac.post("/model-selection/run", json=_valid_run_body())
+    assert response.status_code == 200
+    body = response.json()
+    assert body["selection_id"] == "sel123"
+    assert body["recommendation_confidence"] == "high"
+    assert "confidence" not in body
+
+
+async def test_run_validation_error_returns_problem_json() -> None:
+    """auto_predict without auto_train_winner is rejected by the validator (422)."""
+    async with _client() as ac:
+        response = await ac.post(
+            "/model-selection/run",
+            json=_valid_run_body(auto_predict=True, auto_train_winner=False),
+        )
+    assert response.status_code == 422
+    _assert_problem_detail(response.json(), 422)
+
+
+async def test_routes_return_problem_json_on_bad_request(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    monkeypatch.setattr(
+        ModelSelectionService,
+        "run_selection",
+        AsyncMock(side_effect=BadRequestError(message="availability unusable")),
+    )
+    async with _client() as ac:
+        response = await ac.post("/model-selection/run", json=_valid_run_body())
+    assert response.status_code == 400
+    _assert_problem_detail(response.json(), 400)
+
+
+async def test_get_selection_not_found_returns_problem_json(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    monkeypatch.setattr(
+        ModelSelectionService,
+        "get_selection",
+        AsyncMock(side_effect=NotFoundError(message="Selection run missing not found")),
+    )
+    async with _client() as ac:
+        response = await ac.get("/model-selection/missing")
+    assert response.status_code == 404
+    _assert_problem_detail(response.json(), 404)
+
+
+async def test_availability_returns_200(monkeypatch: pytest.MonkeyPatch) -> None:
+    from app.features.model_selection.tests.conftest import make_availability
+
+    monkeypatch.setattr(
+        ModelSelectionService,
+        "get_availability",
+        AsyncMock(return_value=make_availability(status="ready")),
+    )
+    async with _client() as ac:
+        response = await ac.get(
+            "/model-selection/availability",
+            params={"store_id": 1, "product_id": 1, "forecast_horizon": 14},
+        )
+    assert response.status_code == 200
+    assert response.json()["status"] == "ready"
+
+
+async def test_availability_rejects_bad_query() -> None:
+    """store_id < 1 fails Query validation → 422 problem+json."""
+    async with _client() as ac:
+        response = await ac.get(
+            "/model-selection/availability",
+            params={"store_id": 0, "product_id": 1},
+        )
+    assert response.status_code == 422
+    _assert_problem_detail(response.json(), 422)
+
+
+async def test_get_models_returns_catalog_200() -> None:
+    """GET /model-selection/models returns the static catalog (no mock needed)."""
+    async with _client() as ac:
+        response = await ac.get("/model-selection/models")
+    assert response.status_code == 200
+    body = response.json()
+    assert isinstance(body["models"], list)
+    assert len(body["models"]) == 11
+    # Each entry carries the backend-owned capability contract.
+    first = body["models"][0]
+    for key in (
+        "model_type",
+        "label",
+        "family",
+        "feature_aware",
+        "requires_extra",
+        "default_params",
+        "supports_auto_predict",
+        "description",
+    ):
+        assert key in first, f"missing catalog field: {key}"
+    assert body["default_candidate_model_types"] == [
+        "naive",
+        "seasonal_naive",
+        "moving_average",
+        "regression",
+        "prophet_like",
+    ]
+
+
+async def test_models_route_not_captured_by_selection_id(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """Literal /models must NOT be matched as GET /{selection_id}.
+
+    If route ordering regressed, the request would hit ``get_selection`` (here
+    forced to 404) instead of the catalog handler. We assert the catalog shape
+    comes back, proving the literal-before-path-param ordering holds.
+    """
+    monkeypatch.setattr(
+        ModelSelectionService,
+        "get_selection",
+        AsyncMock(side_effect=NotFoundError(message="selection run models not found")),
+    )
+    async with _client() as ac:
+        response = await ac.get("/model-selection/models")
+    assert response.status_code == 200
+    assert "models" in response.json()
+
+
+# =============================================================================
+# Slice C — train-selected / predict-with-decision / promote routes
+# =============================================================================
+
+from app.core.exceptions import UnprocessableEntityError  # noqa: E402
+from app.features.model_selection.schemas import (  # noqa: E402
+    ForecastDecision,
+    ForecastSummary,
+    PromoteResponse,
+    TrainWinnerResponse,
+)
+
+
+def _forecast_summary() -> ForecastSummary:
+    return ForecastSummary(
+        points=[{"date": "2026-06-01", "forecast": 10.0}],
+        total_demand=10.0,
+        average_demand=10.0,
+        horizon=14,
+        peak_date=date(2026, 6, 1),
+        peak_demand=10.0,
+        low_date=date(2026, 6, 1),
+        low_demand=10.0,
+    )
+
+
+def _forecast_decision() -> ForecastDecision:
+    return ForecastDecision(
+        lead_time_days=7,
+        service_level=0.95,
+        z_value=1.6449,
+        sigma_daily_demand=0.0,
+        expected_demand_over_lead_time=70.0,
+        safety_stock=0.0,
+        reorder_point=70.0,
+        bias_risk_text="bias text",
+        caveats=["heuristic"],
+    )
+
+
+async def test_train_selected_returns_200(monkeypatch: pytest.MonkeyPatch) -> None:
+    monkeypatch.setattr(
+        ModelSelectionService,
+        "train_selected",
+        AsyncMock(
+            return_value=TrainWinnerResponse(
+                selection_id="sel123",
+                model_type="seasonal_naive",
+                model_path="artifacts/models/model_x.joblib",
+                is_override=True,
+                override_warning="you overrode the recommendation",
+            )
+        ),
+    )
+    async with _client() as ac:
+        response = await ac.post(
+            "/model-selection/sel123/train-selected",
+            json={"model_type": "seasonal_naive", "override_reason": "domain"},
+        )
+    assert response.status_code == 200
+    body = response.json()
+    assert body["is_override"] is True
+    assert body["override_warning"]
+
+
+async def test_train_selected_bad_model_type_returns_400(monkeypatch: pytest.MonkeyPatch) -> None:
+    monkeypatch.setattr(
+        ModelSelectionService,
+        "train_selected",
+        AsyncMock(side_effect=BadRequestError(message="not a candidate")),
+    )
+    async with _client() as ac:
+        response = await ac.post(
+            "/model-selection/sel123/train-selected",
+            json={"model_type": "naive"},
+        )
+    assert response.status_code == 400
+    _assert_problem_detail(response.json(), 400)
+
+
+async def test_predict_no_body_uses_defaults_returns_200(monkeypatch: pytest.MonkeyPatch) -> None:
+    """Empty body → ForecastDecisionParams defaults → 200 with a decision."""
+    predict_mock = AsyncMock(return_value=(_forecast_summary(), _forecast_decision()))
+    monkeypatch.setattr(ModelSelectionService, "predict_winner", predict_mock)
+    async with _client() as ac:
+        response = await ac.post("/model-selection/sel123/predict")
+    assert response.status_code == 200
+    body = response.json()
+    assert body["decision"]["lead_time_days"] == 7
+    assert body["forecast"]["peak_demand"] == 10.0
+    # service called with the default lead time + service level
+    assert predict_mock.await_args is not None
+    assert predict_mock.await_args.args[2] == 7
+    assert predict_mock.await_args.args[3] == 0.95
+
+
+async def test_predict_with_body_returns_200(monkeypatch: pytest.MonkeyPatch) -> None:
+    predict_mock = AsyncMock(return_value=(_forecast_summary(), _forecast_decision()))
+    monkeypatch.setattr(ModelSelectionService, "predict_winner", predict_mock)
+    async with _client() as ac:
+        response = await ac.post(
+            "/model-selection/sel123/predict",
+            json={"lead_time_days": 14, "service_level": 0.99},
+        )
+    assert response.status_code == 200
+    assert predict_mock.await_args is not None
+    assert predict_mock.await_args.args[2] == 14
+    assert predict_mock.await_args.args[3] == 0.99
+
+
+async def test_predict_feature_aware_returns_400(monkeypatch: pytest.MonkeyPatch) -> None:
+    monkeypatch.setattr(
+        ModelSelectionService,
+        "predict_winner",
+        AsyncMock(side_effect=ValueError("Feature-aware models forecast through /scenarios")),
+    )
+    async with _client() as ac:
+        response = await ac.post("/model-selection/sel123/predict")
+    assert response.status_code == 400
+    _assert_problem_detail(response.json(), 400)
+
+
+async def test_promote_returns_200(monkeypatch: pytest.MonkeyPatch) -> None:
+    monkeypatch.setattr(
+        ModelSelectionService,
+        "promote",
+        AsyncMock(
+            return_value=PromoteResponse(
+                selection_id="sel123",
+                alias_name="champion-test",
+                run_id="run_abc",
+                run_status="success",
+                model_type="naive",
+                is_override=False,
+                promoted_at=datetime(2026, 6, 1, tzinfo=UTC),
+            )
+        ),
+    )
+    async with _client() as ac:
+        response = await ac.post(
+            "/model-selection/sel123/promote",
+            json={"alias_name": "champion-test", "approved_by": "gabor"},
+        )
+    assert response.status_code == 200
+    body = response.json()
+    assert body["alias_name"] == "champion-test"
+    assert body["run_status"] == "success"
+
+
+async def test_promote_bad_alias_name_returns_422() -> None:
+    """A bad alias_name is rejected by the schema regex (422) before the service."""
+    async with _client() as ac:
+        response = await ac.post(
+            "/model-selection/sel123/promote",
+            json={"alias_name": "Bad Alias!", "approved_by": "gabor"},
+        )
+    assert response.status_code == 422
+    _assert_problem_detail(response.json(), 422)
+
+
+async def test_promote_before_train_returns_422(monkeypatch: pytest.MonkeyPatch) -> None:
+    monkeypatch.setattr(
+        ModelSelectionService,
+        "promote",
+        AsyncMock(
+            side_effect=UnprocessableEntityError(message="Train the model before promoting.")
+        ),
+    )
+    async with _client() as ac:
+        response = await ac.post(
+            "/model-selection/sel123/promote",
+            json={"alias_name": "champion-test", "approved_by": "gabor"},
+        )
+    assert response.status_code == 422
+    _assert_problem_detail(response.json(), 422)
diff --git a/app/features/model_selection/tests/test_routes_integration.py b/app/features/model_selection/tests/test_routes_integration.py
new file mode 100644
index 00000000..bc03d122
--- /dev/null
+++ b/app/features/model_selection/tests/test_routes_integration.py
@@ -0,0 +1,403 @@
+"""Integration tests for the model_selection slice against real Postgres.
+
+Marked ``@pytest.mark.integration`` — require ``docker compose up -d`` + an
+applied ``alembic upgrade head``.
+"""
+
+from __future__ import annotations
+
+import asyncio
+from typing import Any
+
+import pytest
+from httpx import AsyncClient
+from sqlalchemy import text
+from sqlalchemy.ext.asyncio import AsyncSession
+
+pytestmark = pytest.mark.integration
+
+_TERMINAL = {"completed", "partial", "failed", "cancelled"}
+
+
+async def _poll_until_terminal(
+    client: AsyncClient, selection_id: str, *, attempts: int = 60, delay: float = 0.5
+) -> dict[str, Any]:
+    """Poll GET /{id} until the run reaches a terminal status (or attempts run out)."""
+    body: dict[str, Any] = {}
+    for _ in range(attempts):
+        response = await client.get(f"/model-selection/{selection_id}")
+        assert response.status_code == 200
+        body = response.json()
+        if body["status"] in _TERMINAL:
+            return body
+        await asyncio.sleep(delay)
+    raise AssertionError(f"run {selection_id} did not settle: last status {body.get('status')}")
+
+
+def _run_body(
+    pair: dict[str, Any], extra_candidates: list[dict[str, Any]] | None = None
+) -> dict[str, Any]:
+    candidates = [
+        {"model_type": "naive", "params": {}},
+        {"model_type": "seasonal_naive", "params": {"season_length": 7}},
+        {"model_type": "moving_average", "params": {"window_size": 7}},
+    ]
+    if extra_candidates:
+        candidates.extend(extra_candidates)
+    return {
+        "store_id": pair["store_id"],
+        "product_id": pair["product_id"],
+        "selection_window": {"start_date": pair["start_date"], "end_date": pair["end_date"]},
+        "forecast_horizon": 14,
+        "ranking_metric": "wape",
+        "split_config": {
+            "strategy": "expanding",
+            "n_splits": 5,
+            "min_train_size": 30,
+            "gap": 0,
+            "horizon": 14,
+        },
+        "candidate_models": candidates,
+        "auto_train_winner": False,
+        "auto_predict": False,
+    }
+
+
+async def test_table_has_named_indexes(db_session: AsyncSession) -> None:
+    rows = await db_session.execute(
+        text("SELECT indexname FROM pg_indexes WHERE tablename = 'model_selection_run'")
+    )
+    names = {row[0] for row in rows}
+    assert "ix_model_selection_run_selection_id" in names
+    assert "ix_model_selection_run_store_product_created" in names
+    assert "ix_model_selection_run_status_created" in names
+
+
+async def test_availability_ready_pair(client: AsyncClient, ready_pair: dict[str, Any]) -> None:
+    response = await client.get(
+        "/model-selection/availability",
+        params={
+            "store_id": ready_pair["store_id"],
+            "product_id": ready_pair["product_id"],
+            "forecast_horizon": 14,
+        },
+    )
+    assert response.status_code == 200
+    body = response.json()
+    assert body["status"] == "ready"
+    assert body["observed_days"] == ready_pair["n_days"]
+    assert body["recommended_split_config"]["horizon"] == 14
+
+
+async def test_availability_limited_pair(client: AsyncClient, limited_pair: dict[str, Any]) -> None:
+    response = await client.get(
+        "/model-selection/availability",
+        params={
+            "store_id": limited_pair["store_id"],
+            "product_id": limited_pair["product_id"],
+            "forecast_horizon": 14,
+        },
+    )
+    assert response.status_code == 200
+    assert response.json()["status"] == "limited"
+
+
+async def test_availability_unknown_pair_returns_404(client: AsyncClient) -> None:
+    response = await client.get(
+        "/model-selection/availability",
+        params={"store_id": 999999, "product_id": 999999, "forecast_horizon": 14},
+    )
+    assert response.status_code == 404
+    assert response.json()["status"] == 404
+
+
+async def test_run_persists_and_get_returns_same(
+    client: AsyncClient, ready_pair: dict[str, Any]
+) -> None:
+    run = await client.post("/model-selection/run", json=_run_body(ready_pair))
+    assert run.status_code == 200
+    body = run.json()
+    assert body["status"] in {"completed", "partial"}
+    assert body["winner"] is not None
+    assert body["recommendation_confidence"] in {"high", "medium", "low"}
+    assert body["chart_data"] is not None
+    assert body["ranking"]
+    selection_id = body["selection_id"]
+
+    fetched = await client.get(f"/model-selection/{selection_id}")
+    assert fetched.status_code == 200
+    assert fetched.json()["selection_id"] == selection_id
+
+    ranking = await client.get(f"/model-selection/{selection_id}/ranking")
+    assert ranking.status_code == 200
+    assert ranking.json()["winner"] is not None
+
+
+async def test_run_partial_with_bad_candidate(
+    client: AsyncClient, ready_pair: dict[str, Any]
+) -> None:
+    """An invalid candidate param surfaces as a failed entry, not a 500."""
+    body = _run_body(
+        ready_pair,
+        extra_candidates=[{"model_type": "moving_average", "params": {"window_size": 0}}],
+    )
+    response = await client.post("/model-selection/run", json=body)
+    assert response.status_code == 200
+    payload = response.json()
+    assert payload["status"] == "partial"
+    excluded = [e for e in payload["ranking"] if not e["included"]]
+    assert excluded
+    assert payload["winner"] is not None
+
+
+async def test_get_missing_selection_returns_404(client: AsyncClient) -> None:
+    response = await client.get("/model-selection/does-not-exist")
+    assert response.status_code == 404
+    assert response.json()["status"] == 404
+
+
+# --------------------------------------------------------------------- Slice B
+
+
+async def test_async_runs_submits_202_and_polls_to_terminal_with_winner(
+    client: AsyncClient, ready_pair: dict[str, Any]
+) -> None:
+    """POST /runs returns 202 running immediately; polling settles with a winner."""
+    submit = await client.post("/model-selection/runs", json=_run_body(ready_pair))
+    assert submit.status_code == 202
+    body = submit.json()
+    assert body["status"] == "running"
+    selection_id = body["selection_id"]
+    assert body["monitor_url"] == f"/model-selection/{selection_id}"
+    assert body["cancel_url"] == f"/model-selection/{selection_id}"
+    assert body["progress"]["total"] == 3
+    assert submit.headers.get("location") == f"/model-selection/{selection_id}"
+    assert submit.headers.get("retry-after") == "2"
+
+    terminal = await _poll_until_terminal(client, selection_id)
+    assert terminal["status"] in {"completed", "partial"}
+    assert terminal["winner"] is not None
+    assert terminal["chart_data"] is not None
+    assert terminal["ranking"]
+    assert terminal["progress"]["total"] == 3
+    # Terminal GET output is byte-compatible with the sync /run shape.
+    assert terminal["recommendation_confidence"] in {"high", "medium", "low"}
+
+
+async def test_async_runs_failed_candidate_stays_visible(
+    client: AsyncClient, ready_pair: dict[str, Any]
+) -> None:
+    """An invalid candidate surfaces as a failed/excluded entry, not a 500."""
+    body = _run_body(
+        ready_pair,
+        extra_candidates=[{"model_type": "moving_average", "params": {"window_size": 0}}],
+    )
+    submit = await client.post("/model-selection/runs", json=body)
+    assert submit.status_code == 202
+    selection_id = submit.json()["selection_id"]
+
+    terminal = await _poll_until_terminal(client, selection_id)
+    assert terminal["status"] == "partial"
+    excluded = [e for e in terminal["ranking"] if not e["included"]]
+    assert excluded
+    assert terminal["winner"] is not None
+    # The failed candidate is visible in candidate_progress too.
+    failed = [c for c in terminal["candidate_progress"] if c["status"] == "failed"]
+    assert failed
+
+
+async def test_cancel_leaves_no_candidate_running(
+    client: AsyncClient, ready_pair: dict[str, Any], db_session: AsyncSession
+) -> None:
+    """DELETE cooperatively cancels + drains — no candidate left 'running'."""
+    submit = await client.post("/model-selection/runs", json=_run_body(ready_pair))
+    assert submit.status_code == 202
+    selection_id = submit.json()["selection_id"]
+
+    # Cancel almost immediately. Fast baseline fits are uncancellable mid-call
+    # and may settle the whole run before the DELETE arrives — an HONEST race:
+    #   200 = the cancel fired and drained;
+    #   409 = the run had already settled (so nothing was left to cancel).
+    # Either way the LOAD-BEARING invariant below must hold.
+    cancel = await client.delete(f"/model-selection/{selection_id}")
+    assert cancel.status_code in {200, 409}
+
+    # Ensure the run is terminal before asserting the invariant (covers the 200
+    # path where the worker just settled, and the 409 already-settled path).
+    await _poll_until_terminal(client, selection_id)
+
+    # The load-bearing invariant: after the drain, no candidate row is 'running'.
+    rows = await db_session.execute(
+        text(
+            "SELECT count(*) FROM model_selection_candidate "
+            "WHERE selection_id = :sid AND status = 'running'"
+        ),
+        {"sid": selection_id},
+    )
+    assert rows.scalar() == 0
+
+
+async def test_cancel_terminal_run_returns_409(
+    client: AsyncClient, ready_pair: dict[str, Any]
+) -> None:
+    """Cancelling an already-settled run returns 409."""
+    submit = await client.post("/model-selection/runs", json=_run_body(ready_pair))
+    selection_id = submit.json()["selection_id"]
+    await _poll_until_terminal(client, selection_id)
+
+    cancel = await client.delete(f"/model-selection/{selection_id}")
+    assert cancel.status_code == 409
+    assert cancel.json()["status"] == 409
+
+
+async def test_candidate_table_has_named_indexes(db_session: AsyncSession) -> None:
+    rows = await db_session.execute(
+        text("SELECT indexname FROM pg_indexes WHERE tablename = 'model_selection_candidate'")
+    )
+    names = {row[0] for row in rows}
+    assert "ix_model_selection_candidate_candidate_id" in names
+    assert "ix_model_selection_candidate_selection_status" in names
+
+
+async def test_legacy_sync_run_has_no_progress_children(
+    client: AsyncClient, ready_pair: dict[str, Any]
+) -> None:
+    """A legacy synchronous /run row carries no async progress."""
+    run = await client.post("/model-selection/run", json=_run_body(ready_pair))
+    assert run.status_code == 200
+    selection_id = run.json()["selection_id"]
+    fetched = await client.get(f"/model-selection/{selection_id}")
+    body = fetched.json()
+    assert body["progress"] is None
+    assert body["candidate_progress"] == []
+
+
+# --------------------------------------------------------------------- Slice C
+
+from uuid import uuid4  # noqa: E402
+
+
+async def test_decision_journey_override_predict(
+    client: AsyncClient, ready_pair: dict[str, Any]
+) -> None:
+    """Sync run → train-selected (override) → predict (decision + peak/low)."""
+    run = await client.post("/model-selection/run", json=_run_body(ready_pair))
+    assert run.status_code == 200
+    body = run.json()
+    selection_id = body["selection_id"]
+    winner_type = body["winner"]["model_type"]
+
+    # Pick a candidate that is NOT the winner to exercise the override path.
+    candidate_types = [c["model_type"] for c in _run_body(ready_pair)["candidate_models"]]
+    override_type = next(t for t in candidate_types if t != winner_type)
+
+    trained = await client.post(
+        f"/model-selection/{selection_id}/train-selected",
+        json={"model_type": override_type, "override_reason": "domain seasonality"},
+    )
+    assert trained.status_code == 200
+    tbody = trained.json()
+    assert tbody["is_override"] is True
+    assert tbody["override_warning"]
+
+    predicted = await client.post(
+        f"/model-selection/{selection_id}/predict",
+        json={"lead_time_days": 7, "service_level": 0.95},
+    )
+    assert predicted.status_code == 200
+    pbody = predicted.json()
+    assert pbody["forecast"]["peak_demand"] is not None
+    assert pbody["forecast"]["low_demand"] is not None
+    assert pbody["decision"]["method"] == "heuristic"
+    assert pbody["decision"]["lead_time_days"] == 7
+    assert "safety_stock" in pbody["decision"]
+    assert "reorder_point" in pbody["decision"]
+
+
+async def test_promote_creates_registry_run_and_alias_with_real_v(
+    client: AsyncClient, ready_pair: dict[str, Any], db_session: AsyncSession
+) -> None:
+    """V2-configured run → train-winner → promote → SUCCESS registry run + alias.
+
+    Asserts the registry run's runtime_info carries the REAL feature_frame_version
+    (2), and the selection persisted champion_run_id/promoted_alias/decision.
+    """
+    body = _run_body(ready_pair)
+    body["feature_frame_version"] = 2  # baseline winner ignores V at train, column persists 2
+    run = await client.post("/model-selection/run", json=body)
+    assert run.status_code == 200
+    selection_id = run.json()["selection_id"]
+
+    trained = await client.post(f"/model-selection/{selection_id}/train-winner")
+    assert trained.status_code == 200
+
+    alias_name = f"champ-{uuid4().hex[:8]}"
+    promoted = await client.post(
+        f"/model-selection/{selection_id}/promote",
+        json={"alias_name": alias_name, "approved_by": "integration", "description": "Q3"},
+    )
+    assert promoted.status_code == 200
+    pbody = promoted.json()
+    assert pbody["alias_name"] == alias_name
+    assert pbody["run_status"] == "success"
+    run_id = pbody["run_id"]
+
+    # The alias resolves to the SUCCESS run via the registry endpoint.
+    alias_resp = await client.get(f"/registry/aliases/{alias_name}")
+    assert alias_resp.status_code == 200
+    assert alias_resp.json()["run_status"] == "success"
+
+    # The registry run carries the REAL feature_frame_version (2).
+    run_detail = await client.get(f"/registry/runs/{run_id}")
+    assert run_detail.status_code == 200
+    assert run_detail.json()["runtime_info"]["feature_frame_version"] == 2
+
+    # The selection persisted the promotion audit.
+    selection = await client.get(f"/model-selection/{selection_id}")
+    sbody = selection.json()
+    rows = await db_session.execute(
+        text(
+            "SELECT champion_run_id, promoted_alias, promotion_decision "
+            "FROM model_selection_run WHERE selection_id = :sid"
+        ),
+        {"sid": selection_id},
+    )
+    champion_run_id, promoted_alias, promotion_decision = rows.one()
+    assert champion_run_id == run_id
+    assert promoted_alias == alias_name
+    assert promotion_decision["approved_by"] == "integration"
+    assert promotion_decision["decision"] == "promoted"
+    assert sbody["status"] in {"completed", "partial"}
+
+
+async def test_promote_before_train_returns_422(
+    client: AsyncClient, ready_pair: dict[str, Any]
+) -> None:
+    run = await client.post("/model-selection/run", json=_run_body(ready_pair))
+    selection_id = run.json()["selection_id"]
+    promoted = await client.post(
+        f"/model-selection/{selection_id}/promote",
+        json={"alias_name": f"champ-{uuid4().hex[:8]}", "approved_by": "x"},
+    )
+    assert promoted.status_code == 422
+    assert promoted.json()["status"] == 422
+
+
+async def test_seven_decision_columns_exist(db_session: AsyncSession) -> None:
+    rows = await db_session.execute(
+        text(
+            "SELECT column_name FROM information_schema.columns "
+            "WHERE table_name = 'model_selection_run'"
+        )
+    )
+    cols = {row[0] for row in rows}
+    for col in (
+        "trained_model_type",
+        "is_override",
+        "override_reason",
+        "champion_run_id",
+        "promoted_alias",
+        "promotion_decision",
+        "feature_frame_version",
+    ):
+        assert col in cols, f"missing Slice C column: {col}"
diff --git a/app/features/model_selection/tests/test_runner.py b/app/features/model_selection/tests/test_runner.py
new file mode 100644
index 00000000..9421d303
--- /dev/null
+++ b/app/features/model_selection/tests/test_runner.py
@@ -0,0 +1,238 @@
+"""Unit tests for the Slice B bounded-concurrency candidate runner.
+
+The runner's DB helpers are monkeypatched to awaitable no-ops so the asyncio
+orchestration is exercised without docker-compose. The DB invariants (no
+candidate left ``running`` after a cancel drain) are covered in the integration
+suite. Mirrors ``app/features/batch/tests/test_runner.py``.
+"""
+
+from __future__ import annotations
+
+import asyncio
+from contextlib import asynccontextmanager
+from typing import Any, cast
+from unittest.mock import AsyncMock
+
+import pytest
+
+from app.features.model_selection import runner
+
+
+@pytest.fixture(autouse=True)
+def _clear_registry() -> Any:
+    runner._ACTIVE_SELECTIONS.clear()
+    yield
+    runner._ACTIVE_SELECTIONS.clear()
+
+
+@pytest.fixture
+def patch_db_helpers(monkeypatch: pytest.MonkeyPatch) -> dict[str, list[Any]]:
+    """Replace runner DB helpers with awaitable no-ops + a call tracker."""
+    calls: dict[str, list[Any]] = {
+        "mark_cancelled_skipped": [],
+        "mark_cancelled_running": [],
+        "mark_failed_unexpected": [],
+    }
+
+    async def _mark_cancelled_skipped(_session: Any, candidate_id: str) -> None:
+        calls["mark_cancelled_skipped"].append(candidate_id)
+
+    async def _mark_cancelled_running(_session: Any, candidate_id: str) -> None:
+        calls["mark_cancelled_running"].append(candidate_id)
+
+    async def _mark_failed_unexpected(_session: Any, candidate_id: str) -> None:
+        calls["mark_failed_unexpected"].append(candidate_id)
+
+    monkeypatch.setattr(runner, "_mark_cancelled_skipped", _mark_cancelled_skipped)
+    monkeypatch.setattr(runner, "_mark_cancelled_running", _mark_cancelled_running)
+    monkeypatch.setattr(runner, "_mark_failed_unexpected", _mark_failed_unexpected)
+    return calls
+
+
+def _fake_session_maker() -> Any:
+    @asynccontextmanager
+    async def _ctx() -> Any:
+        yield AsyncMock()
+
+    def _maker() -> Any:
+        return _ctx()
+
+    return cast(Any, _maker)
+
+
+# ---------------------------------------------------------------- semaphore
+
+
+async def test_runner_semaphore_caps_concurrency(
+    patch_db_helpers: dict[str, list[Any]],
+) -> None:
+    """5 candidates with max_parallel=2 — observed concurrent peak == 2."""
+    in_flight = 0
+    peak = 0
+
+    async def child(_cid: str) -> None:
+        nonlocal in_flight, peak
+        in_flight += 1
+        peak = max(peak, in_flight)
+        try:
+            await asyncio.sleep(0.02)
+        finally:
+            in_flight -= 1
+
+    effective = await runner.run_selection_candidates(
+        selection_id="s_sem",
+        candidate_ids=[f"c{i}" for i in range(5)],
+        max_parallel=2,
+        global_max_parallel=10,
+        session_maker=_fake_session_maker(),
+        execute_candidate=child,
+    )
+    runner.mark_completed("s_sem")
+    assert effective == 2
+    assert peak == 2, f"observed peak {peak}, expected exactly 2"
+
+
+async def test_runner_global_cap_clamps_max_parallel(
+    patch_db_helpers: dict[str, list[Any]],
+) -> None:
+    """max_parallel=32 clamped by global_max_parallel=1 → sequential (peak 1)."""
+    in_flight = 0
+    peak = 0
+
+    async def child(_cid: str) -> None:
+        nonlocal in_flight, peak
+        in_flight += 1
+        peak = max(peak, in_flight)
+        try:
+            await asyncio.sleep(0.01)
+        finally:
+            in_flight -= 1
+
+    effective = await runner.run_selection_candidates(
+        selection_id="s_seq",
+        candidate_ids=[f"c{i}" for i in range(4)],
+        max_parallel=32,
+        global_max_parallel=1,
+        session_maker=_fake_session_maker(),
+        execute_candidate=child,
+    )
+    runner.mark_completed("s_seq")
+    assert effective == 1
+    assert peak == 1, f"global cap of 1 must serialize; observed peak {peak}"
+
+
+# ---------------------------------------------------- per-child failure isolation
+
+
+async def test_runner_child_failure_does_not_abort_siblings(
+    patch_db_helpers: dict[str, list[Any]],
+) -> None:
+    completed: list[str] = []
+
+    async def child(cid: str) -> None:
+        if cid == "c2":
+            raise RuntimeError("synthetic failure")
+        await asyncio.sleep(0.01)
+        completed.append(cid)
+
+    await runner.run_selection_candidates(
+        selection_id="s_fail",
+        candidate_ids=[f"c{i}" for i in range(5)],
+        max_parallel=5,
+        global_max_parallel=10,
+        session_maker=_fake_session_maker(),
+        execute_candidate=child,
+    )
+    runner.mark_completed("s_fail")
+    assert sorted(completed) == ["c0", "c1", "c3", "c4"]
+    assert patch_db_helpers["mark_failed_unexpected"] == ["c2"]
+
+
+# --------------------------------------------------------------- cancel paths
+
+
+async def test_runner_cancel_before_start_skips(
+    patch_db_helpers: dict[str, list[Any]],
+) -> None:
+    """max_parallel=1, 3 candidates. Cancel after c0 starts → c1/c2 skip."""
+    started: list[str] = []
+
+    async def child(cid: str) -> None:
+        started.append(cid)
+        await asyncio.sleep(0.5)
+
+    task = asyncio.create_task(
+        runner.run_selection_candidates(
+            selection_id="s_pending",
+            candidate_ids=["c0", "c1", "c2"],
+            max_parallel=1,
+            global_max_parallel=10,
+            session_maker=_fake_session_maker(),
+            execute_candidate=child,
+        )
+    )
+    await asyncio.sleep(0.05)
+    fired = runner.cancel_selection("s_pending")
+    await task
+    runner.mark_completed("s_pending")
+
+    assert fired is True
+    assert patch_db_helpers["mark_cancelled_running"] == ["c0"]
+    assert set(patch_db_helpers["mark_cancelled_skipped"]) == {"c1", "c2"}
+    assert started == ["c0"]
+
+
+async def test_runner_cancel_mid_flight_marks_cancelled(
+    patch_db_helpers: dict[str, list[Any]],
+) -> None:
+    cancelled_in_child: list[str] = []
+
+    async def child(cid: str) -> None:
+        try:
+            await asyncio.sleep(1.0)
+        except asyncio.CancelledError:
+            cancelled_in_child.append(cid)
+            raise
+
+    task = asyncio.create_task(
+        runner.run_selection_candidates(
+            selection_id="s_running",
+            candidate_ids=["c0"],
+            max_parallel=1,
+            global_max_parallel=10,
+            session_maker=_fake_session_maker(),
+            execute_candidate=child,
+        )
+    )
+    await asyncio.sleep(0.05)
+    runner.cancel_selection("s_running")
+    await task
+    runner.mark_completed("s_running")
+    assert cancelled_in_child == ["c0"]
+    assert patch_db_helpers["mark_cancelled_running"] == ["c0"]
+
+
+# ------------------------------------------------------------- registry hygiene
+
+
+async def test_mark_completed_unblocks_await_drain() -> None:
+    runner._ACTIVE_SELECTIONS["sx"] = runner.CancelHandle()
+    drain_task = asyncio.create_task(runner.await_drain("sx", timeout_seconds=1.0))
+    await asyncio.sleep(0.01)
+    runner.mark_completed("sx")
+    drained = await drain_task
+    assert drained is True
+    assert "sx" not in runner._ACTIVE_SELECTIONS
+
+
+async def test_cancel_selection_returns_false_when_unregistered() -> None:
+    assert runner.cancel_selection("nope") is False
+
+
+async def test_await_drain_returns_true_when_unregistered() -> None:
+    assert await runner.await_drain("nope", timeout_seconds=0.0) is True
+
+
+async def test_await_drain_times_out_on_stuck_handle() -> None:
+    runner._ACTIVE_SELECTIONS["s_stuck"] = runner.CancelHandle()
+    assert await runner.await_drain("s_stuck", timeout_seconds=0.05) is False
diff --git a/app/features/model_selection/tests/test_schemas.py b/app/features/model_selection/tests/test_schemas.py
new file mode 100644
index 00000000..0ad530de
--- /dev/null
+++ b/app/features/model_selection/tests/test_schemas.py
@@ -0,0 +1,254 @@
+"""Unit tests for model_selection request schemas (strict mode + validators)."""
+
+from __future__ import annotations
+
+from datetime import UTC, datetime
+
+import pytest
+from pydantic import ValidationError
+
+from app.features.model_selection.schemas import (
+    CandidateProgress,
+    ModelSelectionRunRequest,
+    ModelSelectionRunResponse,
+    SelectionProgress,
+    SelectionWindow,
+    SubmitRunResponse,
+)
+
+
+def _base_request_dict(**overrides: object) -> dict[str, object]:
+    payload: dict[str, object] = {
+        "store_id": 1,
+        "product_id": 1,
+        "selection_window": {"start_date": "2026-01-01", "end_date": "2026-05-31"},
+        "forecast_horizon": 14,
+        "split_config": {
+            "strategy": "expanding",
+            "n_splits": 5,
+            "min_train_size": 30,
+            "gap": 0,
+            "horizon": 14,
+        },
+        "candidate_models": [{"model_type": "naive", "params": {}}],
+    }
+    payload.update(overrides)
+    return payload
+
+
+def test_schema_accepts_iso_dates_under_strict_model() -> None:
+    """ISO-string dates validate through the strict ``validate_python`` path."""
+    window = SelectionWindow.model_validate({"start_date": "2026-01-01", "end_date": "2026-02-01"})
+    assert window.start_date.isoformat() == "2026-01-01"
+
+    request = ModelSelectionRunRequest.model_validate(_base_request_dict())
+    assert request.selection_window.end_date.isoformat() == "2026-05-31"
+
+
+def test_schema_rejects_auto_predict_without_train_winner() -> None:
+    """LOCKED #7 — auto_predict requires auto_train_winner."""
+    with pytest.raises(ValidationError, match="auto_predict requires auto_train_winner"):
+        ModelSelectionRunRequest.model_validate(
+            _base_request_dict(auto_predict=True, auto_train_winner=False)
+        )
+
+
+def test_schema_rejects_horizon_mismatch_between_split_and_forecast() -> None:
+    """LOCKED #5 — split_config.horizon must equal forecast_horizon."""
+    bad = _base_request_dict(forecast_horizon=14)
+    bad["split_config"] = {
+        "strategy": "expanding",
+        "n_splits": 5,
+        "min_train_size": 30,
+        "gap": 0,
+        "horizon": 7,
+    }
+    with pytest.raises(ValidationError, match="must equal"):
+        ModelSelectionRunRequest.model_validate(bad)
+
+
+def test_schema_rejects_feature_groups_with_v1() -> None:
+    """V1 must not carry feature_groups (mirrors forecasting TrainRequest)."""
+    with pytest.raises(ValidationError, match="feature_groups is only valid"):
+        ModelSelectionRunRequest.model_validate(
+            _base_request_dict(feature_frame_version=1, feature_groups=["calendar"])
+        )
+
+
+def test_selection_window_rejects_inverted_range() -> None:
+    """An end <= start window is rejected."""
+    with pytest.raises(ValidationError, match="after start_date"):
+        SelectionWindow.model_validate({"start_date": "2026-02-01", "end_date": "2026-01-01"})
+
+
+def test_candidate_models_min_length_enforced() -> None:
+    """At least one candidate is required."""
+    with pytest.raises(ValidationError):
+        ModelSelectionRunRequest.model_validate(_base_request_dict(candidate_models=[]))
+
+
+# --------------------------------------------------------------------- Slice B
+
+
+def _base_response_dict(**overrides: object) -> dict[str, object]:
+    payload: dict[str, object] = {
+        "selection_id": "sel1",
+        "store_id": 1,
+        "product_id": 2,
+        "status": "running",
+        "selection_window": {"start_date": "2026-01-01", "end_date": "2026-05-31"},
+        "forecast_horizon": 14,
+        "ranking_metric": "wape",
+        "availability": None,
+        "ranking": [],
+        "winner": None,
+        "recommendation_confidence": None,
+        "confidence_reasons": [],
+        "chart_data": None,
+        "final_model": None,
+        "forecast": None,
+        "business_summary": None,
+        "error_message": None,
+        "created_at": datetime(2026, 6, 1, 12, 0, 0, tzinfo=UTC),
+        "completed_at": None,
+    }
+    payload.update(overrides)
+    return payload
+
+
+def test_response_progress_fields_default_safely() -> None:
+    """Legacy sync-run rows validate without progress fields (additive defaults)."""
+    resp = ModelSelectionRunResponse.model_validate(_base_response_dict())
+    assert resp.started_at is None
+    assert resp.progress is None
+    assert resp.candidate_progress == []
+
+
+def test_status_literal_accepts_cancelled() -> None:
+    """The 'cancelled' status (Slice B) is accepted by the response literal."""
+    resp = ModelSelectionRunResponse.model_validate(_base_response_dict(status="cancelled"))
+    assert resp.status == "cancelled"
+
+
+def test_selection_and_candidate_progress_models() -> None:
+    progress = SelectionProgress(total=5, pending=3, running=1, completed=1, failed=0, cancelled=0)
+    assert progress.total == 5
+    cand = CandidateProgress(candidate_id="c1", ordinal=0, model_type="naive", status="running")
+    assert cand.status == "running"
+    assert cand.error is None
+
+
+def test_submit_run_response_carries_monitor_and_cancel_urls() -> None:
+    submit = SubmitRunResponse.model_validate(
+        _base_response_dict(
+            monitor_url="/model-selection/sel1",
+            cancel_url="/model-selection/sel1",
+            progress={
+                "total": 1,
+                "pending": 1,
+                "running": 0,
+                "completed": 0,
+                "failed": 0,
+                "cancelled": 0,
+            },
+            candidate_progress=[
+                {"candidate_id": "c1", "ordinal": 0, "model_type": "naive", "status": "pending"}
+            ],
+        )
+    )
+    assert submit.monitor_url == "/model-selection/sel1"
+    assert submit.cancel_url == "/model-selection/sel1"
+    assert submit.progress is not None
+    assert submit.progress.pending == 1
+    assert submit.candidate_progress[0].model_type == "naive"
+
+
+# =============================================================================
+# Slice C — decision + promotion schemas
+# =============================================================================
+
+from app.features.model_selection.schemas import (  # noqa: E402
+    ForecastDecisionParams,
+    ForecastSummary,
+    PredictWinnerResponse,
+    PromoteRequest,
+    TrainSelectedRequest,
+    TrainWinnerResponse,
+)
+
+
+def test_train_selected_request_accepts_model_type() -> None:
+    req = TrainSelectedRequest.model_validate(
+        {"model_type": "seasonal_naive", "override_reason": "domain"}
+    )
+    assert req.model_type == "seasonal_naive"
+    assert req.override_reason == "domain"
+
+
+def test_train_selected_request_rejects_unknown_model_type() -> None:
+    with pytest.raises(ValidationError):
+        TrainSelectedRequest.model_validate({"model_type": "not_a_model"})
+
+
+def test_forecast_decision_params_defaults() -> None:
+    params = ForecastDecisionParams()
+    assert params.lead_time_days == 7
+    assert params.service_level == 0.95
+
+
+@pytest.mark.parametrize("service_level", [0.49, 1.0, 1.5])
+def test_forecast_decision_params_rejects_out_of_bound_service_level(service_level: float) -> None:
+    with pytest.raises(ValidationError):
+        ForecastDecisionParams.model_validate({"service_level": service_level})
+
+
+def test_forecast_decision_params_validate_python_path() -> None:
+    """Exercise the validate_python path (matches FastAPI's body coercion)."""
+    params = ForecastDecisionParams.model_validate({"lead_time_days": 14, "service_level": 0.99})
+    assert params.lead_time_days == 14
+
+
+@pytest.mark.parametrize("alias", ["Bad Alias", "UPPER", "-leading", "has space"])
+def test_promote_request_rejects_bad_alias_name(alias: str) -> None:
+    with pytest.raises(ValidationError):
+        PromoteRequest.model_validate({"alias_name": alias, "approved_by": "gabor"})
+
+
+def test_promote_request_accepts_valid_alias_and_defaults() -> None:
+    req = PromoteRequest.model_validate({"alias_name": "champion-store5", "approved_by": "gabor"})
+    assert req.alias_name == "champion-store5"
+    assert req.acknowledge_non_recommended is False
+    assert req.description is None
+
+
+def test_promote_request_requires_approved_by() -> None:
+    with pytest.raises(ValidationError):
+        PromoteRequest.model_validate({"alias_name": "champion-x"})
+
+
+def test_train_winner_response_back_compat_defaults() -> None:
+    """train-winner callers that omit the Slice C fields still validate."""
+    resp = TrainWinnerResponse.model_validate(
+        {"selection_id": "s", "model_type": "naive", "model_path": "p"}
+    )
+    assert resp.is_override is False
+    assert resp.override_warning is None
+
+
+def test_forecast_summary_peak_low_optional() -> None:
+    """Legacy ForecastSummary (no peak/low) still validates."""
+    summary = ForecastSummary.model_validate(
+        {"points": [], "total_demand": 0.0, "average_demand": 0.0, "horizon": 14}
+    )
+    assert summary.peak_date is None
+    assert summary.peak_demand is None
+
+
+def test_predict_winner_response_decision_optional() -> None:
+    resp = PredictWinnerResponse.model_validate(
+        {
+            "selection_id": "s",
+            "forecast": {"points": [], "total_demand": 0.0, "average_demand": 0.0, "horizon": 14},
+        }
+    )
+    assert resp.decision is None
diff --git a/app/features/model_selection/tests/test_service.py b/app/features/model_selection/tests/test_service.py
new file mode 100644
index 00000000..c60080b1
--- /dev/null
+++ b/app/features/model_selection/tests/test_service.py
@@ -0,0 +1,773 @@
+"""Unit tests for ModelSelectionService orchestration (mocked sibling services)."""
+
+from __future__ import annotations
+
+from datetime import date, timedelta
+from types import SimpleNamespace
+from typing import Any
+from unittest.mock import AsyncMock, MagicMock
+from uuid import uuid4
+
+import pytest
+from pydantic import TypeAdapter
+
+from app.core.exceptions import BadRequestError, NotFoundError
+from app.features.forecasting.schemas import ModelConfig
+from app.features.model_selection.schemas import ModelSelectionRunRequest
+from app.features.model_selection.service import ModelSelectionService
+from app.features.model_selection.tests.conftest import (
+    make_availability,
+    make_backtest_response,
+    make_mock_db,
+)
+
+
+def _request(**overrides: Any) -> ModelSelectionRunRequest:
+    payload: dict[str, Any] = {
+        "store_id": 1,
+        "product_id": 1,
+        "selection_window": {"start_date": "2026-01-01", "end_date": "2026-05-31"},
+        "forecast_horizon": 14,
+        "split_config": {
+            "strategy": "expanding",
+            "n_splits": 5,
+            "min_train_size": 30,
+            "gap": 0,
+            "horizon": 14,
+        },
+        "candidate_models": [{"model_type": "naive", "params": {}}],
+    }
+    payload.update(overrides)
+    return ModelSelectionRunRequest.model_validate(payload)
+
+
+def _patch_backtester(
+    monkeypatch: pytest.MonkeyPatch, *, side_effect: list[Any]
+) -> SimpleNamespace:
+    instance = SimpleNamespace(run_backtest=AsyncMock(side_effect=side_effect))
+    monkeypatch.setattr("app.features.backtesting.service.BacktestingService", lambda: instance)
+    return instance
+
+
+def _patch_availability(monkeypatch: pytest.MonkeyPatch, status: str) -> None:
+    monkeypatch.setattr(
+        ModelSelectionService,
+        "get_availability",
+        AsyncMock(return_value=make_availability(status=status)),
+    )
+
+
+# -----------------------------------------------------------------------------
+# Flattening
+# -----------------------------------------------------------------------------
+
+
+def test_build_model_config_flattens_params() -> None:
+    """The service's flatten-then-validate builds a typed ModelConfig."""
+    adapter: TypeAdapter[Any] = TypeAdapter(ModelConfig)
+    cfg = adapter.validate_python({"model_type": "seasonal_naive", "season_length": 7})
+    assert cfg.model_type == "seasonal_naive"
+    assert cfg.season_length == 7
+
+
+# -----------------------------------------------------------------------------
+# Availability thresholds
+# -----------------------------------------------------------------------------
+
+
+def _availability_db(observed: int) -> AsyncMock:
+    """Mock DB returning a contiguous `observed`-day aggregate for one pair."""
+    first = date(2024, 1, 1) if observed else None
+    last = date(2024, 1, 1) + timedelta(days=observed - 1) if observed else None
+    db = AsyncMock()
+    db.get = AsyncMock(return_value=SimpleNamespace(id=1))
+    result = AsyncMock()
+    result.one = lambda: (first, last, observed, 12.0, 0)
+    db.execute = AsyncMock(return_value=result)
+    db.scalar = AsyncMock(return_value=0)
+    return db
+
+
+@pytest.mark.parametrize(
+    ("observed", "expected"),
+    [(120, "ready"), (50, "limited"), (20, "unusable")],
+)
+async def test_availability_ready_limited_unusable_thresholds(observed: int, expected: str) -> None:
+    service = ModelSelectionService()
+    db = _availability_db(observed)
+    availability = await service.get_availability(db, 1, 1, forecast_horizon=14)
+    assert availability.status == expected
+
+
+async def test_availability_missing_store_raises_not_found() -> None:
+    service = ModelSelectionService()
+    db = AsyncMock()
+    db.get = AsyncMock(return_value=None)
+    with pytest.raises(NotFoundError):
+        await service.get_availability(db, 999, 1, forecast_horizon=14)
+
+
+# -----------------------------------------------------------------------------
+# Orchestration
+# -----------------------------------------------------------------------------
+
+
+async def test_run_selection_partial_success_chooses_valid_winner(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    _patch_availability(monkeypatch, "ready")
+    _patch_backtester(
+        monkeypatch,
+        side_effect=[make_backtest_response(wape=10.0), ValueError("insufficient data")],
+    )
+    request = _request(
+        candidate_models=[
+            {"model_type": "naive", "params": {}},
+            {"model_type": "seasonal_naive", "params": {"season_length": 7}},
+        ]
+    )
+    response = await ModelSelectionService().run_selection(make_mock_db(), request)
+
+    assert response.status == "partial"
+    assert response.winner is not None
+    assert response.winner.model_type == "naive"
+    failed = [e for e in response.ranking if not e.included]
+    assert [e.model_type for e in failed] == ["seasonal_naive"]
+    assert failed[0].exclusion_reason is not None
+
+
+async def test_run_selection_all_candidates_fail_returns_failed_status_not_500(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """LOCKED #3 — every candidate failing persists FAILED and returns (no raise)."""
+    _patch_availability(monkeypatch, "ready")
+    _patch_backtester(monkeypatch, side_effect=[ValueError("boom-1"), ValueError("boom-2")])
+    request = _request(
+        candidate_models=[
+            {"model_type": "naive", "params": {}},
+            {"model_type": "seasonal_naive", "params": {"season_length": 7}},
+        ]
+    )
+    response = await ModelSelectionService().run_selection(make_mock_db(), request)
+
+    assert response.status == "failed"
+    assert response.winner is None
+    assert response.selection_id
+    assert all(not e.included for e in response.ranking)
+
+
+async def test_run_selection_unusable_availability_raises_bad_request(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """LOCKED #2 — unusable availability fails fast with 400."""
+    _patch_availability(monkeypatch, "unusable")
+    with pytest.raises(BadRequestError):
+        await ModelSelectionService().run_selection(make_mock_db(), _request())
+
+
+async def test_run_selection_auto_train_passes_feature_frame_version_and_groups(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    _patch_availability(monkeypatch, "ready")
+    _patch_backtester(monkeypatch, side_effect=[make_backtest_response(wape=10.0)])
+    train_mock = AsyncMock(
+        return_value=SimpleNamespace(model_path="artifacts/models/model_abc.joblib")
+    )
+    monkeypatch.setattr(
+        "app.features.forecasting.service.ForecastingService",
+        lambda: SimpleNamespace(train_model=train_mock),
+    )
+    request = _request(
+        feature_frame_version=2,
+        feature_groups=["calendar"],
+        auto_train_winner=True,
+        auto_predict=False,
+    )
+    response = await ModelSelectionService().run_selection(make_mock_db(), request)
+
+    assert response.final_model == {"model_path": "artifacts/models/model_abc.joblib"}
+    train_mock.assert_awaited_once()
+    assert train_mock.await_args is not None
+    assert train_mock.await_args.kwargs["feature_frame_version"] == 2
+    assert train_mock.await_args.kwargs["feature_groups"] == ["calendar"]
+
+
+async def test_response_uses_recommendation_confidence_key(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """The response carries ``recommendation_confidence`` (not ``confidence``)."""
+    _patch_availability(monkeypatch, "ready")
+    _patch_backtester(
+        monkeypatch,
+        side_effect=[make_backtest_response(wape=10.0), make_backtest_response(wape=20.0)],
+    )
+    request = _request(
+        candidate_models=[
+            {"model_type": "naive", "params": {}},
+            {"model_type": "seasonal_naive", "params": {"season_length": 7}},
+        ]
+    )
+    response = await ModelSelectionService().run_selection(make_mock_db(), request)
+    dumped = response.model_dump()
+    assert "recommendation_confidence" in dumped
+    assert "confidence" not in dumped
+    assert response.recommendation_confidence in {"high", "medium", "low"}
+    assert response.chart_data is not None
+
+
+async def test_get_selection_missing_raises_not_found() -> None:
+    db = AsyncMock()
+    db.scalar = AsyncMock(return_value=None)
+    db.execute = AsyncMock()
+    with pytest.raises(NotFoundError):
+        await ModelSelectionService().get_selection(db, uuid4().hex)
+
+
+# -----------------------------------------------------------------------------
+# Slice B — async submit / settle / cancel (worker mocked or DB-free units)
+# -----------------------------------------------------------------------------
+
+from datetime import UTC, datetime  # noqa: E402
+
+from app.core.exceptions import ConflictError  # noqa: E402
+from app.features.model_selection import runner as _runner  # noqa: E402
+from app.features.model_selection.models import (  # noqa: E402
+    ModelSelectionCandidate,
+    ModelSelectionRun,
+    ModelSelectionStatus,
+)
+
+
+def _submit_mock_db() -> AsyncMock:
+    """Mock ``AsyncSession`` whose ``refresh`` stamps ``created_at`` on the run."""
+    db = AsyncMock()
+    added: list[Any] = []
+
+    def _add(obj: Any) -> None:
+        added.append(obj)
+
+    async def _refresh(obj: Any) -> None:
+        if isinstance(obj, ModelSelectionRun) and obj.created_at is None:
+            obj.created_at = datetime.now(UTC)
+
+    db.add = MagicMock(side_effect=_add)
+    db.commit = AsyncMock()
+    db.refresh = AsyncMock(side_effect=_refresh)
+    db._added = added  # expose for assertions
+    return db
+
+
+async def test_submit_run_inserts_running_parent_and_pending_candidates(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    _patch_availability(monkeypatch, "ready")
+    # Stub the detached worker so create_task schedules a harmless no-op.
+    monkeypatch.setattr(ModelSelectionService, "_run_in_background", AsyncMock())
+
+    request = _request(
+        candidate_models=[
+            {"model_type": "naive", "params": {}},
+            {"model_type": "seasonal_naive", "params": {"season_length": 7}},
+        ]
+    )
+    db = _submit_mock_db()
+    response = await ModelSelectionService().submit_run(db, request)
+
+    assert response.status == "running"
+    assert response.monitor_url == f"/model-selection/{response.selection_id}"
+    assert response.cancel_url == f"/model-selection/{response.selection_id}"
+    assert response.progress is not None
+    assert response.progress.total == 2
+    assert response.progress.pending == 2
+    assert len(response.candidate_progress) == 2
+    assert {c.status for c in response.candidate_progress} == {"pending"}
+
+    parents = [o for o in db._added if isinstance(o, ModelSelectionRun)]
+    children = [o for o in db._added if isinstance(o, ModelSelectionCandidate)]
+    assert len(parents) == 1
+    assert parents[0].status == ModelSelectionStatus.RUNNING.value
+    assert parents[0].started_at is not None
+    assert parents[0].total_candidates == 2
+    assert len(children) == 2
+    assert {c.status for c in children} == {"pending"}
+    assert [c.ordinal for c in children] == [0, 1]
+
+
+async def test_submit_run_unusable_availability_raises_400(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    _patch_availability(monkeypatch, "unusable")
+    monkeypatch.setattr(ModelSelectionService, "_run_in_background", AsyncMock())
+    db = _submit_mock_db()
+    with pytest.raises(BadRequestError):
+        await ModelSelectionService().submit_run(db, _request())
+    # The parent was persisted as failed; no children were inserted.
+    parents = [o for o in db._added if isinstance(o, ModelSelectionRun)]
+    children = [o for o in db._added if isinstance(o, ModelSelectionCandidate)]
+    assert parents[0].status == ModelSelectionStatus.FAILED.value
+    assert children == []
+
+
+def test_terminal_status_rule() -> None:
+    svc = ModelSelectionService()
+    f = svc._terminal_status
+    assert f({"completed": 3, "failed": 0, "cancelled": 0}) is ModelSelectionStatus.COMPLETED
+    assert f({"completed": 0, "failed": 3, "cancelled": 0}) is ModelSelectionStatus.FAILED
+    assert f({"completed": 0, "failed": 0, "cancelled": 3}) is ModelSelectionStatus.CANCELLED
+    assert f({"completed": 2, "failed": 1, "cancelled": 0}) is ModelSelectionStatus.PARTIAL
+    assert f({"completed": 1, "failed": 0, "cancelled": 1}) is ModelSelectionStatus.PARTIAL
+
+
+async def test_cancel_run_404_when_missing() -> None:
+    db = AsyncMock()
+    db.scalar = AsyncMock(return_value=None)
+    with pytest.raises(NotFoundError):
+        await ModelSelectionService().cancel_run(db, uuid4().hex)
+
+
+async def test_cancel_run_409_when_terminal() -> None:
+    row = ModelSelectionRun(
+        selection_id="sel_terminal",
+        status=ModelSelectionStatus.COMPLETED.value,
+        store_id=1,
+        product_id=1,
+        start_date=date(2026, 1, 1),
+        end_date=date(2026, 5, 31),
+        forecast_horizon=14,
+        ranking_metric="wape",
+        candidate_models=[],
+        policy_snapshot={},
+    )
+    db = AsyncMock()
+    db.scalar = AsyncMock(return_value=row)
+    with pytest.raises(ConflictError):
+        await ModelSelectionService().cancel_run(db, "sel_terminal")
+
+
+async def test_cancel_run_409_when_settle_races_cancel(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """If the worker settled (no handle) between load and cancel → 409."""
+    row = ModelSelectionRun(
+        selection_id="sel_race",
+        status=ModelSelectionStatus.RUNNING.value,
+        store_id=1,
+        product_id=1,
+        start_date=date(2026, 1, 1),
+        end_date=date(2026, 5, 31),
+        forecast_horizon=14,
+        ranking_metric="wape",
+        candidate_models=[],
+        policy_snapshot={},
+    )
+    db = AsyncMock()
+    db.scalar = AsyncMock(return_value=row)
+    monkeypatch.setattr(_runner, "cancel_selection", lambda _sid: False)
+    with pytest.raises(ConflictError):
+        await ModelSelectionService().cancel_run(db, "sel_race")
+
+
+# =============================================================================
+# Slice C — train-selected (override) / predict-decision / promote
+# =============================================================================
+
+from app.core.exceptions import UnprocessableEntityError  # noqa: E402
+from app.features.forecasting.schemas import ForecastPoint  # noqa: E402
+from app.features.model_selection.schemas import PromoteRequest  # noqa: E402
+
+
+def _ranking_dict(
+    *,
+    winner_type: str = "naive",
+    extra_included: list[dict[str, Any]] | None = None,
+) -> dict[str, Any]:
+    """A persisted ``ranking_result`` JSONB with a winner + ranked entries."""
+    winner_metrics = {"wape": 10.0, "smape": 8.0, "mae": 4.0, "bias": 0.5}
+    entries: list[dict[str, Any]] = [
+        {
+            "rank": 1,
+            "model_type": winner_type,
+            "params": {},
+            "included": True,
+            "exclusion_reason": None,
+            "metrics": winner_metrics,
+        }
+    ]
+    if extra_included:
+        entries.extend(extra_included)
+    return {
+        "winner": {
+            "rank": 1,
+            "model_type": winner_type,
+            "params": {},
+            "included": True,
+            "exclusion_reason": None,
+            "metrics": winner_metrics,
+        },
+        "entries": entries,
+        "confidence": "high",
+        "reasons": [],
+    }
+
+
+def _decision_row(
+    *,
+    candidate_models: list[dict[str, Any]] | None = None,
+    ranking_result: dict[str, Any] | None = None,
+    feature_frame_version: int = 1,
+    final_model_path: str | None = None,
+    trained_model_type: str | None = None,
+    is_override: bool = False,
+    winner_metrics: dict[str, Any] | None = None,
+) -> ModelSelectionRun:
+    """Build an in-memory ModelSelectionRun for decision-layer unit tests."""
+    return ModelSelectionRun(
+        selection_id="sel_decision",
+        status=ModelSelectionStatus.COMPLETED.value,
+        store_id=3,
+        product_id=8,
+        start_date=date(2026, 1, 1),
+        end_date=date(2026, 5, 31),
+        forecast_horizon=14,
+        ranking_metric="wape",
+        candidate_models=candidate_models or [{"model_type": "naive", "params": {}}],
+        policy_snapshot={},
+        ranking_result=ranking_result,
+        feature_frame_version=feature_frame_version,
+        final_model_path=final_model_path,
+        trained_model_type=trained_model_type,
+        is_override=is_override,
+        winner_metrics=winner_metrics,
+    )
+
+
+def _row_db(row: ModelSelectionRun) -> AsyncMock:
+    db = AsyncMock()
+    db.scalar = AsyncMock(return_value=row)
+    db.flush = AsyncMock()
+    return db
+
+
+def _patch_train(monkeypatch: pytest.MonkeyPatch) -> AsyncMock:
+    train_mock = AsyncMock(
+        return_value=SimpleNamespace(model_path="artifacts/models/model_sel.joblib")
+    )
+    monkeypatch.setattr(
+        "app.features.forecasting.service.ForecastingService",
+        lambda: SimpleNamespace(train_model=train_mock),
+    )
+    return train_mock
+
+
+async def test_train_selected_trains_chosen_candidate(monkeypatch: pytest.MonkeyPatch) -> None:
+    train_mock = _patch_train(monkeypatch)
+    row = _decision_row(
+        candidate_models=[
+            {"model_type": "naive", "params": {}},
+            {"model_type": "seasonal_naive", "params": {"season_length": 7}},
+        ],
+        ranking_result=_ranking_dict(winner_type="naive"),
+    )
+    resp = await ModelSelectionService().train_selected(_row_db(row), "sel_decision", "naive", None)
+    assert resp.model_type == "naive"
+    assert resp.is_override is False
+    assert resp.override_warning is None
+    assert row.trained_model_type == "naive"
+    assert row.is_override is False
+    train_mock.assert_awaited_once()
+
+
+async def test_train_selected_rejects_non_candidate_model_type_400(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    train_mock = _patch_train(monkeypatch)
+    row = _decision_row(
+        candidate_models=[{"model_type": "naive", "params": {}}],
+        ranking_result=_ranking_dict(winner_type="naive"),
+    )
+    with pytest.raises(BadRequestError):
+        await ModelSelectionService().train_selected(_row_db(row), "sel_decision", "lightgbm", None)
+    train_mock.assert_not_awaited()
+
+
+async def test_train_selected_sets_is_override_and_warning_for_non_winner(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    _patch_train(monkeypatch)
+    row = _decision_row(
+        candidate_models=[
+            {"model_type": "naive", "params": {}},
+            {"model_type": "seasonal_naive", "params": {"season_length": 7}},
+        ],
+        ranking_result=_ranking_dict(
+            winner_type="naive",
+            extra_included=[
+                {
+                    "rank": 2,
+                    "model_type": "seasonal_naive",
+                    "params": {"season_length": 7},
+                    "included": True,
+                    "exclusion_reason": None,
+                    "metrics": {"wape": 15.0, "smape": 9.0, "mae": 5.0, "bias": 0.2},
+                }
+            ],
+        ),
+    )
+    resp = await ModelSelectionService().train_selected(
+        _row_db(row), "sel_decision", "seasonal_naive", "domain seasonality"
+    )
+    assert resp.is_override is True
+    assert resp.override_warning is not None
+    assert "seasonal_naive" in resp.override_warning
+    assert "naive" in resp.override_warning
+    assert row.override_reason == "domain seasonality"
+
+
+async def test_train_selected_failed_candidate_still_trainable(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """A candidate that FAILED its backtest (no ranked metrics) stays trainable."""
+    _patch_train(monkeypatch)
+    row = _decision_row(
+        candidate_models=[
+            {"model_type": "naive", "params": {}},
+            {"model_type": "moving_average", "params": {}},
+        ],
+        # moving_average failed its backtest → not in ranking entries.
+        ranking_result=_ranking_dict(winner_type="naive"),
+    )
+    resp = await ModelSelectionService().train_selected(
+        _row_db(row), "sel_decision", "moving_average", None
+    )
+    assert resp.is_override is True
+    assert resp.override_warning is not None
+    assert "not successfully evaluated" in resp.override_warning
+
+
+async def test_train_selected_threads_feature_frame_version_into_train_model(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    train_mock = _patch_train(monkeypatch)
+    row = _decision_row(
+        candidate_models=[{"model_type": "prophet_like", "params": {}}],
+        ranking_result=_ranking_dict(winner_type="prophet_like"),
+        feature_frame_version=2,
+    )
+    await ModelSelectionService().train_selected(_row_db(row), "sel_decision", "prophet_like", None)
+    assert train_mock.await_args is not None
+    assert train_mock.await_args.kwargs["feature_frame_version"] == 2
+
+
+async def test_train_winner_now_persists_trained_model_type_not_override(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """Regression — train-winner persists trained_model_type, is_override=False."""
+    train_mock = _patch_train(monkeypatch)
+    row = _decision_row(
+        candidate_models=[{"model_type": "naive", "params": {}}],
+        ranking_result=_ranking_dict(winner_type="naive"),
+        feature_frame_version=2,
+    )
+    resp = await ModelSelectionService().train_winner(_row_db(row), "sel_decision")
+    assert resp.model_type == "naive"
+    assert resp.is_override is False
+    assert resp.override_warning is None
+    assert row.trained_model_type == "naive"
+    assert row.is_override is False
+    assert train_mock.await_args is not None
+    assert train_mock.await_args.kwargs["feature_frame_version"] == 2
+
+
+def _predict_points() -> list[ForecastPoint]:
+    base = date(2026, 6, 1)
+    values = [10.0, 25.0, 8.0, 12.0]
+    return [
+        ForecastPoint(date=base.fromordinal(base.toordinal() + i), forecast=v)
+        for i, v in enumerate(values)
+    ]
+
+
+async def test_predict_attaches_decision_and_peak_low(monkeypatch: pytest.MonkeyPatch) -> None:
+    predict_mock = AsyncMock(return_value=SimpleNamespace(forecasts=_predict_points()))
+    monkeypatch.setattr(
+        "app.features.forecasting.service.ForecastingService",
+        lambda: SimpleNamespace(predict=predict_mock),
+    )
+    row = _decision_row(
+        final_model_path="artifacts/models/model_sel.joblib",
+        trained_model_type="naive",
+        winner_metrics={"wape": 10.0, "bias": 0.5},
+    )
+    forecast, decision = await ModelSelectionService().predict_winner(
+        _row_db(row), "sel_decision", 7, 0.95
+    )
+    assert decision is not None
+    assert decision.lead_time_days == 7
+    assert decision.method == "heuristic"
+    assert forecast.peak_demand == 25.0
+    assert forecast.low_demand == 8.0
+    assert forecast.peak_date == date(2026, 6, 2)
+
+
+async def test_predict_winner_untrained_raises_400() -> None:
+    row = _decision_row(final_model_path=None)
+    with pytest.raises(BadRequestError):
+        await ModelSelectionService().predict_winner(_row_db(row), "sel_decision", 7, 0.95)
+
+
+def _patch_registry(monkeypatch: pytest.MonkeyPatch) -> dict[str, AsyncMock]:
+    from app.features.registry.schemas import RunStatus
+
+    run_resp = SimpleNamespace(run_id="run_abc123def456")
+    alias_resp = SimpleNamespace(alias_name="champion-test", run_status=RunStatus.SUCCESS)
+    create_run = AsyncMock(return_value=run_resp)
+    update_run = AsyncMock(return_value=run_resp)
+    create_alias = AsyncMock(return_value=alias_resp)
+    monkeypatch.setattr(
+        "app.features.registry.service.RegistryService",
+        lambda: SimpleNamespace(
+            create_run=create_run, update_run=update_run, create_alias=create_alias
+        ),
+    )
+    monkeypatch.setattr(
+        ModelSelectionService,
+        "_register_artifact",
+        staticmethod(lambda final_model_path, run_id: ("champion-selector/x.joblib", "h", 100)),
+    )
+    return {"create_run": create_run, "update_run": update_run, "create_alias": create_alias}
+
+
+async def test_promote_orchestrates_create_run_success_and_alias(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    mocks = _patch_registry(monkeypatch)
+    row = _decision_row(
+        final_model_path="artifacts/models/model_sel.joblib",
+        trained_model_type="naive",
+        is_override=False,
+        winner_metrics={"wape": 10.0},
+        feature_frame_version=1,
+    )
+    req = PromoteRequest(alias_name="champion-test", approved_by="gabor")
+    resp = await ModelSelectionService().promote(_row_db(row), "sel_decision", req)
+    assert resp.run_id == "run_abc123def456"
+    assert resp.run_status == "success"
+    assert resp.alias_name == "champion-test"
+    mocks["create_run"].assert_awaited_once()
+    mocks["create_alias"].assert_awaited_once()
+    # two update_run calls: RUNNING then SUCCESS
+    assert mocks["update_run"].await_count == 2
+
+
+async def test_promote_persists_promotion_decision_audit(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    _patch_registry(monkeypatch)
+    row = _decision_row(
+        final_model_path="artifacts/models/model_sel.joblib",
+        trained_model_type="naive",
+        winner_metrics={"wape": 10.0},
+    )
+    req = PromoteRequest(alias_name="champion-test", approved_by="gabor", description="Q3")
+    await ModelSelectionService().promote(_row_db(row), "sel_decision", req)
+    assert row.champion_run_id == "run_abc123def456"
+    assert row.promoted_alias == "champion-test"
+    assert row.promotion_decision is not None
+    assert row.promotion_decision["approved_by"] == "gabor"
+    assert row.promotion_decision["decision"] == "promoted"
+    assert row.promotion_decision["reason"] == "Q3"
+
+
+async def test_promote_carries_real_feature_frame_version_v2(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    mocks = _patch_registry(monkeypatch)
+    row = _decision_row(
+        final_model_path="artifacts/models/model_sel.joblib",
+        trained_model_type="prophet_like",
+        winner_metrics={"wape": 10.0},
+        feature_frame_version=2,
+    )
+    req = PromoteRequest(alias_name="champion-v2", approved_by="gabor")
+    await ModelSelectionService().promote(_row_db(row), "sel_decision", req)
+    assert mocks["create_run"].await_args is not None
+    run_create = mocks["create_run"].await_args.args[1]
+    assert run_create.runtime_info_extras["feature_frame_version"] == 2
+
+
+async def test_promote_defaults_feature_frame_version_1_for_legacy_run(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    mocks = _patch_registry(monkeypatch)
+    row = _decision_row(
+        final_model_path="artifacts/models/model_sel.joblib",
+        trained_model_type="naive",
+        winner_metrics={"wape": 10.0},
+        feature_frame_version=1,  # legacy / server_default
+    )
+    req = PromoteRequest(alias_name="champion-legacy", approved_by="gabor")
+    await ModelSelectionService().promote(_row_db(row), "sel_decision", req)
+    assert mocks["create_run"].await_args is not None
+    run_create = mocks["create_run"].await_args.args[1]
+    assert run_create.runtime_info_extras["feature_frame_version"] == 1
+
+
+async def test_promote_requires_trained_model_422(monkeypatch: pytest.MonkeyPatch) -> None:
+    _patch_registry(monkeypatch)
+    row = _decision_row(final_model_path=None, trained_model_type=None)
+    req = PromoteRequest(alias_name="champion-test", approved_by="gabor")
+    with pytest.raises(UnprocessableEntityError):
+        await ModelSelectionService().promote(_row_db(row), "sel_decision", req)
+
+
+async def test_promote_non_recommended_requires_ack_422(monkeypatch: pytest.MonkeyPatch) -> None:
+    _patch_registry(monkeypatch)
+    row = _decision_row(
+        final_model_path="artifacts/models/model_sel.joblib",
+        trained_model_type="seasonal_naive",
+        is_override=True,
+        winner_metrics={"wape": 10.0},
+    )
+    req = PromoteRequest(
+        alias_name="champion-test", approved_by="gabor", acknowledge_non_recommended=False
+    )
+    with pytest.raises(UnprocessableEntityError):
+        await ModelSelectionService().promote(_row_db(row), "sel_decision", req)
+
+
+def _capturing_run_db() -> AsyncMock:
+    db = AsyncMock()
+    rows: list[Any] = []
+    db.add = MagicMock(side_effect=lambda o: rows.append(o))
+
+    async def _flush() -> None:
+        for obj in rows:
+            if isinstance(obj, ModelSelectionRun) and obj.created_at is None:
+                obj.created_at = datetime.now(UTC)
+
+    db.flush = AsyncMock(side_effect=_flush)
+    db.refresh = AsyncMock()
+    db._rows = rows
+    return db
+
+
+async def test_run_creation_persists_request_feature_frame_version_sync(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    _patch_availability(monkeypatch, "ready")
+    _patch_backtester(monkeypatch, side_effect=[make_backtest_response(wape=10.0)])
+    db = _capturing_run_db()
+    await ModelSelectionService().run_selection(db, _request(feature_frame_version=2))
+    runs = [r for r in db._rows if isinstance(r, ModelSelectionRun)]
+    assert runs[0].feature_frame_version == 2
+
+
+async def test_run_creation_persists_request_feature_frame_version_async(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    _patch_availability(monkeypatch, "ready")
+    monkeypatch.setattr(ModelSelectionService, "_run_in_background", AsyncMock())
+    db = _submit_mock_db()
+    await ModelSelectionService().submit_run(db, _request(feature_frame_version=2))
+    runs = [o for o in db._added if isinstance(o, ModelSelectionRun)]
+    assert runs[0].feature_frame_version == 2
diff --git a/app/features/ops/service.py b/app/features/ops/service.py
index 43c59318..4ec3af78 100644
--- a/app/features/ops/service.py
+++ b/app/features/ops/service.py
@@ -154,7 +154,10 @@ def _run_feature_frame_version(run: ModelRun) -> int:
     """
     info = run.runtime_info or {}
     value = info.get("feature_frame_version")
-    if isinstance(value, int) and value in (1, 2):
+    # Honor any positive int V (feature_frame_version is an opaque incrementing
+    # integer per docs/_base/DOMAIN_MODEL.md). bool is excluded because it
+    # subclasses int. Missing / invalid value -> V=1 back-compat (#338).
+    if isinstance(value, int) and not isinstance(value, bool) and value >= 1:
         return value
     return 1
 
diff --git a/app/features/ops/tests/test_service.py b/app/features/ops/tests/test_service.py
index fcfb61a7..8a4c107c 100644
--- a/app/features/ops/tests/test_service.py
+++ b/app/features/ops/tests/test_service.py
@@ -188,14 +188,23 @@ def test_run_feature_frame_version_reads_runtime_info() -> None:
     assert _run_feature_frame_version(_make_run(run_id="b")) == 1
 
 
-def test_run_feature_frame_version_rejects_unsupported_value() -> None:
-    """Unknown int (e.g. 3) or non-int values fall back to V=1 (defensive)."""
-    legacy_explicit_v3 = _make_run(run_id="bad-int")
-    legacy_explicit_v3.runtime_info = {"feature_frame_version": 3}
-    legacy_str = _make_run(run_id="bad-str")
-    legacy_str.runtime_info = {"feature_frame_version": "2"}
-    assert _run_feature_frame_version(legacy_explicit_v3) == 1
-    assert _run_feature_frame_version(legacy_str) == 1
+def test_run_feature_frame_version_honors_any_positive_int() -> None:
+    """Any positive int V is honored (e.g. 3); non-int / non-positive / bool -> V=1.
+
+    Regression for #338: feature_frame_version is an opaque incrementing integer
+    (docs/_base/DOMAIN_MODEL.md), so V>=3 must NOT be clamped to 1 — the showcase
+    stale_alias_trigger step registers a V=3 run to fire the
+    feature_frame_version_mismatch verdict.
+    """
+    v3 = _make_run(run_id="v3")
+    v3.runtime_info = {"feature_frame_version": 3}
+    assert _run_feature_frame_version(v3) == 3
+
+    # Non-int / non-positive / bool all fall back to V=1.
+    for bad in ("2", 0, -1, True):
+        run = _make_run(run_id=f"bad-{bad!r}")
+        run.runtime_info = {"feature_frame_version": bad}
+        assert _run_feature_frame_version(run) == 1
 
 
 def test_alias_staleness_legacy_run_treated_as_v1_no_spurious_mismatch() -> None:
@@ -241,6 +250,24 @@ def test_alias_staleness_v_mismatch_wins_over_newer_run() -> None:
     assert comparable_v == 2
 
 
+def test_alias_staleness_v1_alias_v3_latest_reports_mismatch() -> None:
+    """A V1 alias with a newer V3 comparable reports MISMATCH, not NEWER (#338).
+
+    Mirrors the showcase stale_alias_trigger scenario: the demo-production alias
+    points at a V1 run while the grain's newest run is V=3. Before #338 the V=3
+    latest was clamped to V=1, so this fell through to NEWER_SUCCESS_RUN.
+    """
+    older = datetime(2026, 1, 1, tzinfo=UTC)
+    newer = datetime(2026, 5, 1, tzinfo=UTC)
+    run = _make_run(run_id="v1-alias", created_at=older, feature_frame_version=1)
+    latest = _make_run(run_id="v3-latest", created_at=newer, feature_frame_version=3)
+    is_stale, reason, alias_v, comparable_v = _alias_staleness(run, {(1, 1): latest})
+    assert is_stale is True
+    assert reason == StaleReason.FEATURE_FRAME_VERSION_MISMATCH.value
+    assert alias_v == 1
+    assert comparable_v == 3
+
+
 def test_alias_staleness_same_v_newer_run_uses_newer_reason() -> None:
     """V matches but the comparable is newer → NEWER_SUCCESS_RUN reason."""
     older = datetime(2026, 1, 1, tzinfo=UTC)
diff --git a/app/features/rag/embeddings.py b/app/features/rag/embeddings.py
index cffa1b1d..4f5cc5bc 100644
--- a/app/features/rag/embeddings.py
+++ b/app/features/rag/embeddings.py
@@ -16,7 +16,12 @@
 import httpx
 import structlog
 import tiktoken
-from openai import AsyncOpenAI, RateLimitError
+from openai import (
+    AsyncOpenAI,
+    AuthenticationError,
+    PermissionDeniedError,
+    RateLimitError,
+)
 
 from app.core.config import get_settings
 
@@ -32,6 +37,21 @@ class EmbeddingError(Exception):
     pass
 
 
+class EmbeddingAuthError(EmbeddingError):
+    """Embedding provider rejected the credentials (HTTP 401/403).
+
+    A *distinct* subclass of :class:`EmbeddingError` so callers can tell an
+    authentication/authorization failure (invalid or placeholder API key) apart
+    from a transient connection/server failure. The RAG routes map this to a
+    machine-readable ``EMBEDDING_AUTH`` problem so the showcase demo pipeline
+    can SKIP the knowledge phase gracefully instead of hard-failing on a bad
+    key (issue #329). Carries no secret material — only the provider's own
+    error string, which never contains the key value.
+    """
+
+    pass
+
+
 class EmbeddingProvider(ABC):
     """Abstract base class for embedding providers.
 
@@ -293,6 +313,18 @@ async def _embed_batch(
                     await asyncio.sleep(wait_time)
                 continue
 
+            except (AuthenticationError, PermissionDeniedError) as e:
+                # Invalid / placeholder / unauthorized key (401/403). Not
+                # retryable — surface as a distinct auth failure so callers can
+                # classify it (issue #329). Log the type only, never the key.
+                logger.warning(
+                    "rag.embedding_auth_error",
+                    error_type=type(e).__name__,
+                    batch_size=len(texts),
+                    provider="openai",
+                )
+                raise EmbeddingAuthError(f"OpenAI rejected the embedding credentials: {e}") from e
+
             except Exception as e:
                 last_error = e
                 logger.error(
@@ -418,6 +450,19 @@ async def embed_texts(
                         f"Ollama model '{self.settings.ollama_embedding_model}' not found. "
                         f"Run: ollama pull {self.settings.ollama_embedding_model}"
                     ) from e
+                if e.response.status_code in (401, 403):
+                    # Auth rejected (e.g. Ollama behind an authenticating proxy
+                    # with a bad/placeholder credential). Not retryable —
+                    # surface as a distinct auth failure (issue #329).
+                    logger.warning(
+                        "rag.embedding_auth_error",
+                        error_type=type(e).__name__,
+                        status_code=e.response.status_code,
+                        provider="ollama",
+                    )
+                    raise EmbeddingAuthError(
+                        f"Ollama embedding endpoint rejected the credentials: {e}"
+                    ) from e
                 if e.response.status_code >= 500 and attempt < max_retries:
                     # Server error - retry
                     wait_time = retry_delay * (2**attempt)
diff --git a/app/features/rag/routes.py b/app/features/rag/routes.py
index e4474fb2..57d42928 100644
--- a/app/features/rag/routes.py
+++ b/app/features/rag/routes.py
@@ -6,9 +6,9 @@
 
 from app.core.config import get_settings
 from app.core.database import get_db
-from app.core.exceptions import DatabaseError
+from app.core.exceptions import DatabaseError, EmbeddingProviderAuthError
 from app.core.logging import get_logger
-from app.features.rag.embeddings import EmbeddingError
+from app.features.rag.embeddings import EmbeddingAuthError, EmbeddingError
 from app.features.rag.schemas import (
     DeleteResponse,
     IndexProjectDocsRequest,
@@ -26,6 +26,21 @@
 router = APIRouter(prefix="/rag", tags=["rag"])
 
 
+def _embedding_auth_failure(log_event: str, exc: EmbeddingAuthError) -> EmbeddingProviderAuthError:
+    """Map a low-level embedding auth failure to the marked 502 (#329).
+
+    Shared by all three RAG routes (``index_document`` / ``index_project_docs``
+    / ``retrieve``) so the warning log + RFC 7807 ``EMBEDDING_AUTH`` mapping
+    never drift between handlers. The caller passes a route-specific
+    ``log_event`` for tracing and re-raises the returned error ``from`` the
+    original exception. Logs the exception TYPE only, never a key value.
+    """
+    logger.warning(log_event, error_type=type(exc).__name__)
+    return EmbeddingProviderAuthError(
+        message=f"Embedding provider rejected the credentials: {exc}",
+    )
+
+
 # =============================================================================
 # Index Endpoint
 # =============================================================================
@@ -110,6 +125,9 @@ async def index_document(
             detail=str(e),
         ) from e
 
+    except EmbeddingAuthError as e:
+        raise _embedding_auth_failure("rag.index_request_auth_failed", e) from e
+
     except EmbeddingError as e:
         logger.error(
             "rag.index_request_failed",
@@ -195,6 +213,9 @@ async def index_project_docs(
 
         return response
 
+    except EmbeddingAuthError as e:
+        raise _embedding_auth_failure("rag.index_project_docs_request_auth_failed", e) from e
+
     except EmbeddingError as e:
         logger.error(
             "rag.index_project_docs_request_failed",
@@ -298,6 +319,9 @@ async def retrieve(
 
         return response
 
+    except EmbeddingAuthError as e:
+        raise _embedding_auth_failure("rag.retrieve_request_auth_failed", e) from e
+
     except EmbeddingError as e:
         logger.error(
             "rag.retrieve_request_failed",
diff --git a/app/features/rag/tests/test_embeddings.py b/app/features/rag/tests/test_embeddings.py
index 2eb59b70..2783a3af 100644
--- a/app/features/rag/tests/test_embeddings.py
+++ b/app/features/rag/tests/test_embeddings.py
@@ -4,8 +4,10 @@
 
 import httpx
 import pytest
+from openai import AuthenticationError
 
 from app.features.rag.embeddings import (
+    EmbeddingAuthError,
     EmbeddingError,
     EmbeddingProvider,
     EmbeddingService,
@@ -153,6 +155,36 @@ async def test_embed_texts_batching(self):
             assert len(result) == 4
             assert mock_client.embeddings.create.call_count == 2
 
+    @pytest.mark.asyncio
+    async def test_embed_texts_invalid_key_raises_auth_error(self):
+        """#329 — a 401 from OpenAI surfaces as EmbeddingAuthError, not retried."""
+        with patch("app.features.rag.embeddings.get_settings") as mock_settings:
+            mock_settings.return_value.openai_api_key = "sk-placeholder-invalid"
+            mock_settings.return_value.rag_embedding_model = "text-embedding-3-small"
+            mock_settings.return_value.rag_embedding_dimension = 1536
+            mock_settings.return_value.rag_embedding_batch_size = 100
+
+            provider = OpenAIEmbeddingProvider()
+
+            auth_error = AuthenticationError(
+                "Incorrect API key provided",
+                response=httpx.Response(
+                    401,
+                    request=httpx.Request("POST", "https://api.openai.com/v1/embeddings"),
+                ),
+                body=None,
+            )
+            mock_client = MagicMock()
+            mock_client.embeddings.create = AsyncMock(side_effect=auth_error)
+            provider._client = mock_client
+
+            with pytest.raises(EmbeddingAuthError) as exc_info:
+                await provider.embed_texts(["text"])
+            # Subclass of EmbeddingError so existing callers still catch it.
+            assert isinstance(exc_info.value, EmbeddingError)
+            # Not retried: a single create() call, no backoff loop.
+            assert mock_client.embeddings.create.call_count == 1
+
     @pytest.mark.asyncio
     async def test_embed_query_returns_single_embedding(self):
         """Test embed_query returns single embedding."""
@@ -327,6 +359,32 @@ async def test_embed_texts_model_not_found(self):
             assert "not found" in str(exc_info.value).lower()
             assert "ollama pull" in str(exc_info.value)
 
+    @pytest.mark.asyncio
+    async def test_embed_texts_auth_rejected_raises_auth_error(self):
+        """#329 — a 401/403 from the Ollama endpoint surfaces as EmbeddingAuthError."""
+        with patch("app.features.rag.embeddings.get_settings") as mock_settings:
+            mock_settings.return_value.ollama_base_url = "http://localhost:11434"
+            mock_settings.return_value.ollama_embedding_model = "nomic-embed-text"
+            mock_settings.return_value.rag_embedding_dimension = 768
+
+            provider = OllamaEmbeddingProvider()
+
+            mock_response = MagicMock()
+            mock_response.status_code = 401
+            error = httpx.HTTPStatusError(
+                "Unauthorized",
+                request=MagicMock(),
+                response=mock_response,
+            )
+            mock_client = MagicMock(spec=httpx.AsyncClient)
+            mock_client.post = AsyncMock(side_effect=error)
+            provider._client = mock_client
+
+            with pytest.raises(EmbeddingAuthError) as exc_info:
+                await provider.embed_texts(["test"])
+            assert isinstance(exc_info.value, EmbeddingError)
+            assert "rejected the credentials" in str(exc_info.value)
+
     @pytest.mark.asyncio
     async def test_embed_texts_connection_error(self):
         """Test error handling when Ollama not reachable."""
diff --git a/app/features/rag/tests/test_routes.py b/app/features/rag/tests/test_routes.py
index f898a9f1..fa60ac80 100644
--- a/app/features/rag/tests/test_routes.py
+++ b/app/features/rag/tests/test_routes.py
@@ -13,7 +13,7 @@
 import pytest
 from httpx import AsyncClient
 
-from app.features.rag.embeddings import EmbeddingError, EmbeddingService
+from app.features.rag.embeddings import EmbeddingAuthError, EmbeddingError, EmbeddingService
 from app.features.rag.service import RAGService
 
 # =============================================================================
@@ -168,6 +168,42 @@ async def test_index_file_not_found(self, client: AsyncClient):
         )
         assert response.status_code == 404
 
+    @pytest.mark.asyncio
+    async def test_index_embedding_auth_failure_returns_502_with_marker(self, client: AsyncClient):
+        """#329 — /rag/index maps an embedding auth failure to the marked 502.
+
+        Mirrors the /rag/index/project-docs assertion so all three RAG routes
+        stay aligned on the same RFC 7807 type/code.
+        """
+        # MagicMock var (not the EmbeddingService-typed factory return) so mypy
+        # permits the method assignment — same pattern as
+        # test_embedding_failure_returns_502.
+        mock_service = MagicMock(spec=EmbeddingService)
+        mock_service.embed_texts = AsyncMock(
+            side_effect=EmbeddingAuthError("OpenAI rejected the embedding credentials")
+        )
+        mock_service.count_tokens = MagicMock(side_effect=lambda text: len(text.split()))
+        mock_service.truncate_to_tokens = MagicMock(side_effect=lambda text, max_tokens: text)
+
+        with patch(
+            "app.features.rag.service.get_embedding_service",
+            return_value=mock_service,
+        ):
+            response = await client.post(
+                "/rag/index",
+                json={
+                    "source_type": "markdown",
+                    "source_path": "test-index-auth-001",
+                    "content": "# Auth\n\nContent that needs embedding.",
+                },
+            )
+
+        assert response.status_code == 502
+        body = response.json()
+        assert body["code"] == "EMBEDDING_AUTH"
+        assert body["type"].endswith("/embedding-auth")
+        assert body["status"] == 502
+
 
 # =============================================================================
 # Retrieve Endpoint Tests
@@ -281,6 +317,38 @@ async def test_retrieve_validates_query(self, client: AsyncClient):
         )
         assert response.status_code == 422
 
+    @pytest.mark.asyncio
+    async def test_retrieve_embedding_auth_failure_returns_502_with_marker(
+        self, client: AsyncClient
+    ):
+        """#329 — /rag/retrieve maps an embedding auth failure to the marked 502.
+
+        Keeps the retrieve handler aligned with the two index handlers on the
+        same RFC 7807 type/code.
+        """
+        # MagicMock var (not the EmbeddingService-typed factory return) so mypy
+        # permits the method assignment — same pattern as
+        # test_embedding_failure_returns_502.
+        mock_service = MagicMock(spec=EmbeddingService)
+        auth_error = EmbeddingAuthError("OpenAI rejected the embedding credentials")
+        mock_service.embed_query = AsyncMock(side_effect=auth_error)
+        mock_service.embed_texts = AsyncMock(side_effect=auth_error)
+
+        with patch(
+            "app.features.rag.service.get_embedding_service",
+            return_value=mock_service,
+        ):
+            response = await client.post(
+                "/rag/retrieve",
+                json={"query": "anything", "top_k": 5, "similarity_threshold": 0.0},
+            )
+
+        assert response.status_code == 502
+        body = response.json()
+        assert body["code"] == "EMBEDDING_AUTH"
+        assert body["type"].endswith("/embedding-auth")
+        assert body["status"] == 502
+
 
 # =============================================================================
 # Sources Endpoint Tests
@@ -565,3 +633,41 @@ async def test_embedding_failure_returns_502(self, client: AsyncClient, tmp_path
             response = await client.post("/rag/index/project-docs", json={})
 
         assert response.status_code == 502
+
+    @pytest.mark.asyncio
+    async def test_embedding_auth_failure_returns_502_with_marker(
+        self, client: AsyncClient, tmp_path
+    ):
+        """#329 — an embedding auth failure stays 502 but carries the
+
+        machine-readable EMBEDDING_AUTH problem marker so the demo pipeline can
+        classify it (vs a generic embedding 502) without brittle text matching.
+        """
+        (tmp_path / "docs").mkdir()
+        (tmp_path / "docs" / "auth-doc.md").write_text(
+            "# Delta\n\nDelta content.", encoding="utf-8"
+        )
+        mock_service = MagicMock(spec=EmbeddingService)
+        mock_service.embed_texts = AsyncMock(
+            side_effect=EmbeddingAuthError("OpenAI rejected the embedding credentials")
+        )
+
+        with (
+            patch(
+                "app.features.rag.routes.RAGService",
+                partial(RAGService, base_dir=str(tmp_path)),
+            ),
+            patch(
+                "app.features.rag.service.get_embedding_service",
+                return_value=mock_service,
+            ),
+        ):
+            response = await client.post("/rag/index/project-docs", json={})
+
+        # Status stays 502 (public contract stable); body is RFC 7807 with a
+        # stable type/code an automated consumer can branch on.
+        assert response.status_code == 502
+        body = response.json()
+        assert body["code"] == "EMBEDDING_AUTH"
+        assert body["type"].endswith("/embedding-auth")
+        assert body["status"] == 502
diff --git a/app/features/registry/service.py b/app/features/registry/service.py
index 503c45d2..37e8a3fe 100644
--- a/app/features/registry/service.py
+++ b/app/features/registry/service.py
@@ -649,7 +649,10 @@ def _extract_feature_frame_version(
         if not runtime_info_extras:
             return 1
         value = runtime_info_extras.get("feature_frame_version")
-        if isinstance(value, int) and value in (1, 2):
+        # Honor any positive int V (feature_frame_version is an opaque
+        # incrementing integer per docs/_base/DOMAIN_MODEL.md). bool is excluded
+        # because it subclasses int. Missing / invalid value -> V=1 (#338).
+        if isinstance(value, int) and not isinstance(value, bool) and value >= 1:
             return value
         return 1
 
diff --git a/app/features/registry/tests/test_service.py b/app/features/registry/tests/test_service.py
index abd2a2ce..1014d7bc 100644
--- a/app/features/registry/tests/test_service.py
+++ b/app/features/registry/tests/test_service.py
@@ -165,10 +165,19 @@ def test_extract_feature_frame_version_explicit_v2(self) -> None:
         """Explicit feature_frame_version=2 round-trips."""
         assert RegistryService._extract_feature_frame_version({"feature_frame_version": 2}) == 2
 
-    def test_extract_feature_frame_version_rejects_unsupported_value(self) -> None:
-        """Unknown int (e.g. 3) and non-int (e.g. '2') fall back to V1."""
-        assert RegistryService._extract_feature_frame_version({"feature_frame_version": 3}) == 1
+    def test_extract_feature_frame_version_honors_any_positive_int(self) -> None:
+        """Any positive int V is honored (e.g. 3); non-int / non-positive / bool -> V1.
+
+        Regression for #338: feature_frame_version is an opaque incrementing
+        integer, so V>=3 must not be clamped to 1 (the showcase
+        stale_alias_trigger step registers a V=3 run).
+        """
+        assert RegistryService._extract_feature_frame_version({"feature_frame_version": 3}) == 3
+        assert RegistryService._extract_feature_frame_version({"feature_frame_version": 7}) == 7
+        # Non-int / non-positive / bool all fall back to V1.
         assert RegistryService._extract_feature_frame_version({"feature_frame_version": "2"}) == 1
+        assert RegistryService._extract_feature_frame_version({"feature_frame_version": 0}) == 1
+        assert RegistryService._extract_feature_frame_version({"feature_frame_version": True}) == 1
 
 
 class TestRegistryServiceConfigDiff:
diff --git a/app/features/scenarios/agent_tools.py b/app/features/scenarios/agent_tools.py
index ab99c17c..b987afca 100644
--- a/app/features/scenarios/agent_tools.py
+++ b/app/features/scenarios/agent_tools.py
@@ -26,7 +26,7 @@
 from sqlalchemy import select
 from sqlalchemy.ext.asyncio import AsyncSession
 
-from app.features.data_platform.models import SalesDaily
+from app.features.data_platform.models import Product, SalesDaily, Store
 from app.features.scenarios.models import SCENARIO_SOURCE_AGENT
 from app.features.scenarios.schemas import (
     CreateScenarioRequest,
@@ -52,6 +52,27 @@
 AGENT_SAVE_APPROVED_BY = "operator"
 
 
+async def _grain_exists(db: AsyncSession, store_id: int, product_id: int) -> tuple[bool, bool]:
+    """Report whether the store and product dimension rows exist.
+
+    Read-only existence probe against the ``store`` / ``product`` dimension
+    tables. Used to reject a proposal for a grain that does not exist (issue
+    #347 — a weak model derailed into proposing a what-if for a hallucinated
+    ``store_id=123`` / ``product_id=456``).
+
+    Args:
+        db: Database session.
+        store_id: Candidate store id.
+        product_id: Candidate product id.
+
+    Returns:
+        ``(store_exists, product_exists)``.
+    """
+    store_exists = await db.scalar(select(Store.id).where(Store.id == store_id)) is not None
+    product_exists = await db.scalar(select(Product.id).where(Product.id == product_id)) is not None
+    return store_exists, product_exists
+
+
 async def propose_scenario(
     db: AsyncSession,
     store_id: int,
@@ -79,6 +100,12 @@ async def propose_scenario(
         the candidate ``assumptions`` (JSON-mode dump so dates are ISO strings,
         ready to pass straight back into ``save_scenario``), and a
         plain-language ``recommendation``.
+
+        When the ``(store_id, product_id)`` grain does not exist, returns a
+        non-persistable validation error instead — ``{"valid": False,
+        "persistable": False, "error": ..., "missing": [...]}`` — so a
+        hallucinated grain (e.g. store 123 / product 456) never yields a normal
+        proposal (issue #347).
     """
     logger.info(
         "agents.scenario_tool.propose_scenario_called",
@@ -87,6 +114,36 @@ async def propose_scenario(
         horizon=horizon,
     )
 
+    # Reject a grain that does not exist before drafting anything. A weak model
+    # can hallucinate placeholder ids (store 123 / product 456); a proposal for a
+    # non-existent grain is meaningless and must never look like a normal,
+    # save-able candidate (issue #347). This is read-only and persists nothing.
+    store_exists, product_exists = await _grain_exists(db, store_id, product_id)
+    if not (store_exists and product_exists):
+        missing: list[str] = []
+        if not store_exists:
+            missing.append(f"store_id={store_id}")
+        if not product_exists:
+            missing.append(f"product_id={product_id}")
+        logger.info(
+            "agents.scenario_tool.propose_scenario_rejected_unknown_grain",
+            store_id=store_id,
+            product_id=product_id,
+            missing=missing,
+        )
+        return {
+            "valid": False,
+            "persistable": False,
+            "store_id": store_id,
+            "product_id": product_id,
+            "missing": missing,
+            "error": (
+                f"Cannot propose a scenario: {' and '.join(missing)} "
+                "do not exist. Use a real store/product pair (look one up with a "
+                "read-only tool) — do not invent identifiers."
+            ),
+        }
+
     # Read the most recent unit price for a grounded recommendation. Read-only.
     latest_price = await db.scalar(
         select(SalesDaily.unit_price)
diff --git a/app/features/scenarios/tests/conftest.py b/app/features/scenarios/tests/conftest.py
index c5ebc731..0ef3ca06 100644
--- a/app/features/scenarios/tests/conftest.py
+++ b/app/features/scenarios/tests/conftest.py
@@ -66,6 +66,29 @@ async def db_session() -> AsyncGenerator[AsyncSession, None]:
     await engine.dispose()
 
 
+@pytest.fixture
+async def existing_grain(db_session: AsyncSession) -> AsyncGenerator[tuple[int, int], None]:
+    """Insert the Store + Product dimension rows for the test grain; clean up after.
+
+    ``propose_scenario`` now rejects a grain whose store/product do not exist
+    (#347). ``TEST_STORE_ID`` / ``TEST_PRODUCT_ID`` are deliberately high IDs no
+    seeder uses, so a read-only proposal for them needs the dimension rows seeded
+    explicitly. Removed on teardown so the grain stays absent for the
+    rejection-path tests.
+    """
+    from app.features.data_platform.models import Product, Store
+
+    db_session.add(Store(id=TEST_STORE_ID, code=f"S{TEST_STORE_ID}", name="Test Store"))
+    db_session.add(Product(id=TEST_PRODUCT_ID, sku=f"SKU{TEST_PRODUCT_ID}", name="Test Product"))
+    await db_session.commit()
+    try:
+        yield (TEST_STORE_ID, TEST_PRODUCT_ID)
+    finally:
+        await db_session.execute(delete(Product).where(Product.id == TEST_PRODUCT_ID))
+        await db_session.execute(delete(Store).where(Store.id == TEST_STORE_ID))
+        await db_session.commit()
+
+
 @pytest.fixture
 async def client(db_session: AsyncSession) -> AsyncGenerator[AsyncClient, None]:
     """Create a test client with the database dependency overridden."""
diff --git a/app/features/scenarios/tests/test_agent_tools.py b/app/features/scenarios/tests/test_agent_tools.py
index 5f1ba739..95400c92 100644
--- a/app/features/scenarios/tests/test_agent_tools.py
+++ b/app/features/scenarios/tests/test_agent_tools.py
@@ -14,6 +14,7 @@
 
 import uuid
 from datetime import UTC, datetime, timedelta
+from unittest.mock import AsyncMock
 
 import pytest
 from sqlalchemy import delete, func, select
@@ -35,18 +36,85 @@ def test_save_scenario_requires_approval() -> None:
     assert requires_approval("save_scenario") is True
 
 
+class TestProposeScenarioEntityValidation:
+    """propose_scenario rejects a grain whose store/product do not exist (#347).
+
+    Unit-level (mocked DB): the entity-existence probe (`_grain_exists`) issues
+    `db.scalar(...)` for the store id, then the product id, then — only on the
+    valid path — the latest unit price. Driving `db.scalar` with a `side_effect`
+    list exercises every branch with no database. These run in the fast
+    ``not integration`` gate.
+    """
+
+    @staticmethod
+    def _mock_db(scalar_returns: list[object]) -> AsyncMock:
+        """An AsyncSession-shaped mock whose `scalar` yields the given values."""
+        db = AsyncMock(spec=AsyncSession)
+        db.scalar = AsyncMock(side_effect=scalar_returns)
+        return db
+
+    async def test_existing_grain_returns_a_proposal(self) -> None:
+        """A real store/product pair yields a normal, save-able proposal."""
+        db = self._mock_db([5, 8, 12.5])  # store id, product id, latest price
+
+        result = await propose_scenario(
+            db, store_id=5, product_id=8, horizon=14, objective="grow demand"
+        )
+
+        assert result.get("valid") is not False
+        assert "assumptions" in result
+        assert "recommendation" in result
+        ScenarioAssumptions.model_validate(result["assumptions"])
+
+    async def test_nonexistent_grain_is_rejected(self) -> None:
+        """A grain with no store and no product row is rejected, not proposed."""
+        db = self._mock_db([None, None])
+
+        result = await propose_scenario(
+            db, store_id=77001, product_id=77002, horizon=14, objective="x"
+        )
+
+        assert result["valid"] is False
+        assert result["persistable"] is False
+        assert "assumptions" not in result
+        assert "store_id=77001" in result["missing"]
+        assert "product_id=77002" in result["missing"]
+
+    async def test_hallucinated_123_456_is_rejected(self) -> None:
+        """The exact hallucinated store 123 / product 456 case never proposes."""
+        db = self._mock_db([None, None])
+
+        result = await propose_scenario(db, store_id=123, product_id=456, horizon=14, objective="")
+
+        assert result["valid"] is False
+        assert "assumptions" not in result
+        # Read-only rejection — nothing is written.
+        db.add.assert_not_called()
+        db.commit.assert_not_awaited()
+
+    async def test_missing_product_only_is_rejected(self) -> None:
+        """A real store but a missing product is still rejected."""
+        db = self._mock_db([5, None])
+
+        result = await propose_scenario(db, store_id=5, product_id=999999, horizon=7, objective="")
+
+        assert result["valid"] is False
+        assert result["missing"] == ["product_id=999999"]
+
+
 @pytest.mark.integration
 class TestProposeScenario:
-    """propose_scenario drafts a candidate and persists nothing."""
+    """propose_scenario drafts a candidate (for a real grain) and persists nothing."""
 
     async def test_returns_valid_assumptions_and_recommendation(
-        self, db_session: AsyncSession
+        self, db_session: AsyncSession, existing_grain: tuple[int, int]
     ) -> None:
         """A default objective yields a valid price-cut candidate."""
+        store_id, product_id = existing_grain
         result = await propose_scenario(
             db_session,
-            store_id=TEST_STORE_ID,
-            product_id=TEST_PRODUCT_ID,
+            store_id=store_id,
+            product_id=product_id,
             horizon=14,
             objective="grow demand for the summer range",
         )
@@ -58,12 +126,15 @@ async def test_returns_valid_assumptions_and_recommendation(
         assert isinstance(result["recommendation"], str)
         assert result["recommendation"]
 
-    async def test_promotion_keyword_proposes_a_promotion(self, db_session: AsyncSession) -> None:
+    async def test_promotion_keyword_proposes_a_promotion(
+        self, db_session: AsyncSession, existing_grain: tuple[int, int]
+    ) -> None:
         """An objective mentioning a promotion steers the candidate accordingly."""
+        store_id, product_id = existing_grain
         result = await propose_scenario(
             db_session,
-            store_id=TEST_STORE_ID,
-            product_id=TEST_PRODUCT_ID,
+            store_id=store_id,
+            product_id=product_id,
             horizon=7,
             objective="run a promotion next week",
         )
@@ -72,12 +143,15 @@ async def test_promotion_keyword_proposes_a_promotion(self, db_session: AsyncSes
         assert assumptions.promotion is not None
         assert assumptions.price is None
 
-    async def test_persists_no_row(self, db_session: AsyncSession) -> None:
+    async def test_persists_no_row(
+        self, db_session: AsyncSession, existing_grain: tuple[int, int]
+    ) -> None:
         """propose_scenario is read-only — it never writes a scenario_plan row."""
+        store_id, product_id = existing_grain
         await propose_scenario(
             db_session,
-            store_id=TEST_STORE_ID,
-            product_id=TEST_PRODUCT_ID,
+            store_id=store_id,
+            product_id=product_id,
             horizon=10,
             objective="test",
         )
@@ -85,6 +159,31 @@ async def test_persists_no_row(self, db_session: AsyncSession) -> None:
         assert count == 0
 
 
+@pytest.mark.integration
+class TestProposeScenarioRejectsUnknownGrain:
+    """propose_scenario rejects a non-existent grain against a real DB (#347)."""
+
+    async def test_rejects_nonexistent_grain_and_persists_nothing(
+        self, db_session: AsyncSession
+    ) -> None:
+        """A grain with no dimension rows is rejected and writes no plan."""
+        # IDs far above any seeded range — guaranteed absent.
+        result = await propose_scenario(
+            db_session,
+            store_id=9_999_001,
+            product_id=9_999_002,
+            horizon=14,
+            objective="grow demand",
+        )
+
+        assert result["valid"] is False
+        assert result["persistable"] is False
+        assert "assumptions" not in result
+
+        count = await db_session.scalar(select(func.count()).select_from(ScenarioPlan))
+        assert count == 0
+
+
 @pytest.mark.integration
 class TestSaveScenario:
     """save_scenario persists a plan stamped with agent provenance."""
diff --git a/app/main.py b/app/main.py
index eb4f5145..1533ce50 100644
--- a/app/main.py
+++ b/app/main.py
@@ -26,6 +26,7 @@
 from app.features.forecasting.routes import router as forecasting_router
 from app.features.ingest.routes import router as ingest_router
 from app.features.jobs.routes import router as jobs_router
+from app.features.model_selection.routes import router as model_selection_router
 from app.features.ops.routes import router as ops_router
 from app.features.rag.routes import router as rag_router
 from app.features.registry.routes import router as registry_router
@@ -145,6 +146,7 @@ def create_app() -> FastAPI:
     app.include_router(forecasting_router)
     app.include_router(explainability_router)
     app.include_router(backtesting_router)
+    app.include_router(model_selection_router)
     app.include_router(registry_router)
     app.include_router(rag_router)
     app.include_router(scenarios_router)
diff --git a/docs/_base/RUNBOOKS.md b/docs/_base/RUNBOOKS.md
index a3b5b1ba..4ba53dca 100644
--- a/docs/_base/RUNBOOKS.md
+++ b/docs/_base/RUNBOOKS.md
@@ -126,6 +126,7 @@ uv run python scripts/run_demo.py --seed 42 --quiet 2>&1 | tee demo.log
 18. **`scenario_simulate_and_save` step fails with `Cannot parse artifact-key from artifact_uri` (PRP-40, `showcase_rich` only)** — FIXED in #324. The cascade had two root causes: `safer_promote_flow` (PRP-39) swapped the `demo-production` alias to a worse-WAPE run whose placeholder `artifact_uri` (`demo/safer-promote-placeholder.joblib`) the `_parse_artifact_key` regex (`r"model_([0-9a-f]+)(?:\.joblib)?$"`) could not match, and `scenario_simulate_and_save` then resolved that corrupted alias. The fix: the planning step now resolves the champion via `ctx.winning_run_id` (recorded by `register`, never touched by the swap) instead of the live alias, and `safer_promote_flow` writes a real-shape parseable `artifact_uri`. The orchestrator also runs an alias-restore safeguard (`_restore_demo_alias_after_failure`) on any mid-run failure so `demo-production` is never left on the worse-WAPE run. If you still hit this on a forked pipeline, the run's `artifact_uri` is irregular: confirm it matches one of the V1 (`demo/{model_type}-model_{KEY}.joblib`) or V2 (`artifacts/models/model_{KEY}.joblib`) shapes via `GET /registry/runs/{run_id}`, re-run the showcase (the next `register` step rewrites the artifact_uri), or extend `_ARTIFACT_KEY_RE` if a new shape is intentional.
 19. **`multi_plan_compare` step shows ⚠️ with `holiday-plan save failed: ...; price-cut plan still saved` (PRP-40, `showcase_rich` only)** — the second `POST /scenarios` returned 4xx (most likely 422). The price-cut plan was still saved (partial success — R19), so the run keeps going green. Fix: read the RFC 7807 body in the detail; common causes are a horizon out of range or a malformed `holiday.dates` payload. Re-running the showcase regenerates both plans from scratch.
 20. **`embedding_provider_probe` step shows ✅ but `reachable=False` (PRP-40, `showcase_rich` only)** — expected when no embedding provider is configured. The probe always emits PASS so the pipeline still greens; downstream `rag_index_subset` and `rag_retrieve_probe` will emit ⏭️ skip with `detail="embedding provider unreachable"`. Fix only if you want the knowledge phase to run: set `OPENAI_API_KEY` (when `RAG_EMBEDDING_PROVIDER=openai`) or start Ollama on `OLLAMA_BASE_URL` (when `RAG_EMBEDDING_PROVIDER=ollama`), then re-run.
+    - **Invalid / placeholder key (PRP-42, #329):** the probe only checks key *presence*, so a non-empty-but-invalid key (e.g. the `.env.example` placeholder) reports `reachable=true` and the index call then gets a provider **401/403**. As of #329 the RAG routes classify that auth failure as a machine-readable `EMBEDDING_AUTH` problem (RFC 7807 `type=/errors/embedding-auth`, `code="EMBEDDING_AUTH"`) — the public `/rag/index/project-docs` and `/rag/retrieve` endpoints still return **502**, but `rag_index_subset` / `rag_retrieve_probe` now **⏭️ skip** with `detail="embedding provider rejected credentials"` (instead of hard-failing) and the pipeline still greens. Fix only if you want the knowledge phase to run: set a *valid* key for the configured provider and re-run.
 21. **`rag_index_subset` step fails with `path_prefix escapes the project root` (PRP-40, `showcase_rich` only)** — the demo step hard-codes `path_prefix="docs/user-guide"`, so a real-world hit means `RAGService._base_dir` no longer points at the repo root (e.g. a misconfigured container start). Fix: confirm the backend was started from the repo root (or that `RAGService(base_dir=...)` was constructed with the right path); rerun the showcase. The path-traversal guard is load-bearing security — never relax it.
 22. **`rag_retrieve_probe` step shows ⚠️ with `no hits — corpus indexed but query did not match` (PRP-40, `showcase_rich` only)** — the 5-file corpus was indexed (the prior step PASSed) but the canned query `"How do I run the demo pipeline?"` returned zero hits. Common cause: the embedding-provider was switched mid-showcase and indexed chunks are now orphaned (memory anchor: `[[rag-runtime-config-and-corpus-state]]`); the pgvector column has one fixed dimension per provider. Fix: stick to one provider, or clear the RAG corpus (`DELETE /rag/sources/{id}` per source) and re-run.
 23. **`agent_hitl_flow` step shows ⏭️ with `no API key matching agent_default_model provider` (PRP-41, `showcase_rich` only)** — expected when no LLM key is set for the configured `agent_default_model` provider. Pipeline still goes green. Fix only if you want the HITL phase to run: set `OPENAI_API_KEY` / `ANTHROPIC_API_KEY` / `GOOGLE_API_KEY` to match the provider prefix in `agent_default_model` (e.g. `anthropic:claude-...` → `ANTHROPIC_API_KEY`).
diff --git a/docs/user-guide/champion-selector-guide.md b/docs/user-guide/champion-selector-guide.md
new file mode 100644
index 00000000..1bef1afb
--- /dev/null
+++ b/docs/user-guide/champion-selector-guide.md
@@ -0,0 +1,126 @@
+# Champion Selector Guide
+
+The **Champion Selector** turns "which forecasting model is best for this
+store + product?" into a guided, end-to-end workflow: compare candidate models
+on a leakage-safe backtest, read a recommendation, **decide** (accept it or
+override), train the chosen model, generate and interpret its forecast, and —
+only with explicit approval — **promote** it to a registry alias.
+
+It lives at **`/visualize/champion`** in the dashboard and is served by the
+`/model-selection/*` REST API (Swagger at **/docs** is the authoritative
+contract).
+
+> **The golden rule of promotion:** the app *recommends* a champion, but a
+> human *approves* it, and that decision is **recorded**. Promotion is never
+> automatic.
+
+## The journey at a glance
+
+```
+Select → Run comparison → Results → Decide / override → Train → Forecast → Interpret → Promote
+```
+
+### 1 · Select & check availability
+
+Pick a store, a product, a time period, a forecast horizon (1–90 days), and the
+candidate models to compare. The page checks **data availability** for the pair
+and recommends a cross-validation split. A pair with too little history is
+flagged *unusable* and the comparison is refused (`400`).
+
+### 2 · Run the comparison
+
+`POST /model-selection/runs` submits an asynchronous run (returns `202` with a
+monitor URL); the page polls it to a terminal state. Each candidate is
+backtested with time-series cross-validation; results are ranked deterministically.
+
+**Ranking** is by **WAPE** by default, with a fixed tie-break chain:
+*WAPE, then sMAPE, then |bias|, then MAE.* The winner, runners-up, and any
+failed candidates are all shown.
+
+### 3 · Decide — accept or override
+
+The recommended winner is pre-selected. You can:
+
+- **Accept the recommendation** → trains the ranked winner.
+- **Override to another candidate** → you must confirm an explicit warning (the
+  recommended model and the WAPE gap are named) and may record a reason. The
+  override is flagged (`is_override=true`) and audited. A candidate that *failed*
+  its backtest is still override-trainable (training is independent of backtesting).
+
+`POST /model-selection/{id}/train-selected` trains the chosen model;
+`train-winner` trains the recommendation.
+
+### 4 · Forecast
+
+`POST /model-selection/{id}/predict` generates the horizon forecast for the
+trained model. The response carries the **peak** and **low** demand days plus a
+**decision** block (see below).
+
+> **Capability limit.** A *feature-aware* model (`regression`, `prophet_like`,
+> `lightgbm`, `xgboost`, `random_forest`) cannot auto-forecast here — it needs a
+> future feature frame. The page shows a blocked state and routes you to the
+> **What-If Planner** (Scenarios) instead of faking a forecast.
+
+### 5 · Interpret
+
+The **business interpretation** panel restates *why the model won*, the
+**expected demand over the lead time**, and the **bias risk**:
+
+> Positive bias means the model under-forecasts (risk of stockouts); negative
+> bias means it over-forecasts (risk of overstock).
+
+The **safety stock** panel shows a clearly-labeled, deterministic heuristic:
+
+```
+safety_stock        = z(service_level) · σ_daily · √(lead_time_days)
+expected_demand     = average_demand · lead_time_days
+reorder_point       = expected_demand + safety_stock
+```
+
+`σ_daily` is the standard deviation of the daily forecast; `z` comes from a fixed
+service-level table (90% → 1.2816, 95% → 1.6449, 97.5% → 1.9600, 99% → 2.3263),
+snapping to the nearest level in between. Adjust the lead time / service level and
+recompute.
+
+> **This is a heuristic** (demand variability only, constant lead time) — not a
+> full inventory-optimisation model, and it **never** influences the model
+> ranking.
+
+### 6 · Promote (approval-gated, audited)
+
+`POST /model-selection/{id}/promote` registers the trained model as a registry
+`model_run` (transitioned to **SUCCESS** with a verified artifact) and points a
+**registry alias** at it. It records a `promotion_decision` audit
+(`approved_by`, the alias, the run id, the decision, the reason, and whether it
+was an override).
+
+Promotion requires:
+
+- a valid **alias name** (`^[a-z0-9][a-z0-9\-_]*$`) — a bad name is rejected `422`;
+- an **approver** (`approved_by`) — promotion is never anonymous;
+- for a **non-recommended** (override) model, an explicit
+  `acknowledge_non_recommended=true` — else `422`;
+- a **trained** model first — promoting before training is `422`.
+
+Re-promoting the same alias name repoints the existing alias (registry upsert
+semantics). **Compare and promote stay separate** — promote performs no
+ranking or comparison; it only registers and aliases the already-trained champion.
+
+## Endpoint reference
+
+| Method | Path | Purpose |
+|--------|------|---------|
+| POST | `/model-selection/runs` | Submit an async comparison (202) |
+| GET | `/model-selection/{id}` | Poll progress / fetch terminal results |
+| POST | `/model-selection/{id}/train-winner` | Train the ranked winner |
+| POST | `/model-selection/{id}/train-selected` | Train a chosen candidate (override) |
+| POST | `/model-selection/{id}/predict` | Forecast + inventory decision |
+| POST | `/model-selection/{id}/promote` | Promote to a registry alias (audited) |
+
+## Notes & caveats
+
+- Backtest accuracy reflects historical fit, not a guarantee of future
+  performance; metrics measure correlation with past demand, not causation.
+- The decision layer is **deterministic** — no LLM is involved.
+- V2 (richer feature frame) runs promote as V2: the registry run records the
+  real `feature_frame_version`.
diff --git a/docs/user-guide/feature-reference.md b/docs/user-guide/feature-reference.md
index 71e2d21b..521f795b 100644
--- a/docs/user-guide/feature-reference.md
+++ b/docs/user-guide/feature-reference.md
@@ -133,6 +133,23 @@ Tracks every trained model so runs are reproducible and comparable.
 A run moves through `pending → running → success` (or `failed`), and an alias is a
 human-friendly pointer (like `production` or `champion`) to a chosen successful run.
 
+## Champion Selector
+
+An end-to-end "which model is best, and now what?" workflow over one (store,
+product) pair: compare candidate models, accept or override the recommendation,
+train, forecast, interpret, and promote to a registry alias.
+
+- `POST /model-selection/runs` — submit an async candidate comparison (`202`).
+- `GET /model-selection/{id}` — poll progress / fetch the ranked results + winner.
+- `POST /model-selection/{id}/train-winner` — train the ranked winner.
+- `POST /model-selection/{id}/train-selected` — train a chosen candidate (override + audit).
+- `POST /model-selection/{id}/predict` — forecast the trained model + a labeled
+  safety-stock decision heuristic (feature-aware models are blocked → use Scenarios).
+- `POST /model-selection/{id}/promote` — approval-gated, audited promotion to a
+  registry alias (requires an approver; a non-recommended model needs an explicit ack).
+
+See the full walkthrough in **[champion-selector-guide.md](./champion-selector-guide.md)**.
+
 ## Jobs
 
 Long-running work — training, prediction, backtesting — submitted as jobs.
diff --git a/docs/user-guide/img/agent-hitl-approve.png b/docs/user-guide/img/agent-hitl-approve.png
new file mode 100644
index 00000000..d0d4bd2a
Binary files /dev/null and b/docs/user-guide/img/agent-hitl-approve.png differ
diff --git a/docs/user-guide/img/inspect-artifacts-panel.png b/docs/user-guide/img/inspect-artifacts-panel.png
new file mode 100644
index 00000000..f8ed83f9
Binary files /dev/null and b/docs/user-guide/img/inspect-artifacts-panel.png differ
diff --git a/docs/user-guide/img/kpi-strip.png b/docs/user-guide/img/kpi-strip.png
new file mode 100644
index 00000000..abb73afd
Binary files /dev/null and b/docs/user-guide/img/kpi-strip.png differ
diff --git a/docs/user-guide/img/ops-snapshot-tiles.png b/docs/user-guide/img/ops-snapshot-tiles.png
new file mode 100644
index 00000000..35c1724d
Binary files /dev/null and b/docs/user-guide/img/ops-snapshot-tiles.png differ
diff --git a/docs/user-guide/img/run-history-strip.png b/docs/user-guide/img/run-history-strip.png
new file mode 100644
index 00000000..d926a428
Binary files /dev/null and b/docs/user-guide/img/run-history-strip.png differ
diff --git a/docs/user-guide/showcase-walkthrough.md b/docs/user-guide/showcase-walkthrough.md
index 62ea3912..0f63837e 100644
--- a/docs/user-guide/showcase-walkthrough.md
+++ b/docs/user-guide/showcase-walkthrough.md
@@ -156,7 +156,7 @@ run. The Inspect button deep-links to `/chat` where the approved tool
 call is visible in the transcript. See
 [Agents and RAG Guide](./agents-and-rag-guide.md) for the approval gate.
 
-<!-- screenshot: agent-hitl-approve.png -->
+![Agents (HITL) phase — the agent_hitl_flow step card. In this local run the agent answered without calling save_scenario, so the step is skipped by design; the one-click Approve button renders only when the agent triggers the gated save_scenario tool.](./img/agent-hitl-approve.png)
 
 ### Phase: Ops snapshot
 
@@ -168,7 +168,7 @@ endpoints are 200-safe on an empty DB, so the step always reports `pass`
 unless every endpoint fails (then `warn`). The Inspect button deep-links
 to `/ops`.
 
-<!-- screenshot: ops-snapshot-tiles.png -->
+![Ops snapshot step card — the five-tile KPI grid (stale aliases, retraining queue, total runs, total aliases, degrading-health grains) rendered after a green showcase_rich run.](./img/ops-snapshot-tiles.png)
 
 ### Cross-cutting polish
 
@@ -198,9 +198,9 @@ Five chrome-level additions wrap the page:
   phase. Prior behavior pinned the open panel to the running/fallback
   phase.
 
-<!-- screenshot: kpi-strip.png -->
-<!-- screenshot: inspect-artifacts-panel.png -->
-<!-- screenshot: run-history-strip.png -->
+![Showcase KPI strip — five tiles populated after a completed run: runs registered, aliases live, batch items completed, scenario plans saved, RAG chunks indexed.](./img/kpi-strip.png)
+![Inspect-Artifacts panel — the grid of deep-link cards into every dashboard page populated by the run.](./img/inspect-artifacts-panel.png)
+![Run history strip — the most recent runs with scenario, status, wall-clock, and a one-click Replay button.](./img/run-history-strip.png)
 
 ## Performance budgets
 
diff --git a/frontend/src/App.tsx b/frontend/src/App.tsx
index 1ef34bf1..2dc4042f 100644
--- a/frontend/src/App.tsx
+++ b/frontend/src/App.tsx
@@ -26,6 +26,7 @@ const BacktestPage = lazy(() => import('@/pages/visualize/backtest'))
 const DemandPlannerPage = lazy(() => import('@/pages/visualize/demand'))
 const WhatIfPlannerPage = lazy(() => import('@/pages/visualize/planner'))
 const BatchRunnerPage = lazy(() => import('@/pages/visualize/batch'))
+const ChampionSelectorPage = lazy(() => import('@/pages/visualize/champion'))
 const ChatPage = lazy(() => import('@/pages/chat'))
 const KnowledgePage = lazy(() => import('@/pages/knowledge'))
 const GuidePage = lazy(() => import('@/pages/guide'))
@@ -186,6 +187,14 @@ function App() {
                   </Suspense>
                 }
               />
+              <Route
+                path={ROUTES.VISUALIZE.CHAMPION}
+                element={
+                  <Suspense fallback={<PageLoader />}>
+                    <ChampionSelectorPage />
+                  </Suspense>
+                }
+              />
               <Route
                 path={ROUTES.KNOWLEDGE}
                 element={
diff --git a/frontend/src/components/champion-selector/availability-panel.test.tsx b/frontend/src/components/champion-selector/availability-panel.test.tsx
new file mode 100644
index 00000000..0d5171f6
--- /dev/null
+++ b/frontend/src/components/champion-selector/availability-panel.test.tsx
@@ -0,0 +1,76 @@
+import { afterEach, describe, expect, it } from 'vitest'
+import { cleanup, render, screen } from '@testing-library/react'
+import { AvailabilityPanel } from './availability-panel'
+import type { PairAvailability } from '@/types/api'
+
+afterEach(cleanup)
+
+function makeAvailability(overrides: Partial<PairAvailability> = {}): PairAvailability {
+  return {
+    store_id: 7,
+    product_id: 12,
+    first_sales_date: '2026-01-01',
+    last_sales_date: '2026-05-31',
+    observed_days: 150,
+    expected_calendar_days: 151,
+    coverage_ratio: 0.99,
+    missing_days: 1,
+    zero_sale_days: 4,
+    promotion_days: 3,
+    average_daily_demand: 9.2,
+    status: 'ready',
+    recommended_split_config: {
+      strategy: 'expanding',
+      n_splits: 5,
+      min_train_size: 30,
+      gap: 0,
+      horizon: 14,
+    },
+    warnings: [],
+    ...overrides,
+  }
+}
+
+describe('AvailabilityPanel', () => {
+  it('renders status badge + metric tiles for a ready pair', () => {
+    render(
+      <AvailabilityPanel
+        availability={makeAvailability({ status: 'ready' })}
+        isLoading={false}
+        isError={false}
+      />,
+    )
+    expect(screen.getByTestId('availability-panel')).toBeTruthy()
+    expect(screen.getByTestId('availability-status-badge').textContent).toContain('Ready')
+    expect(screen.getByText('Observed days')).toBeTruthy()
+    expect(screen.getByText('Avg daily demand')).toBeTruthy()
+  })
+
+  it('renders the not-enough-data empty state for an unusable pair', () => {
+    render(
+      <AvailabilityPanel
+        availability={makeAvailability({ status: 'unusable' })}
+        isLoading={false}
+        isError={false}
+      />,
+    )
+    expect(screen.queryByTestId('availability-panel')).toBeNull()
+    expect(screen.getByText('Not enough data to model this pair')).toBeTruthy()
+  })
+
+  it('renders an em dash when promotion_days is null', () => {
+    render(
+      <AvailabilityPanel
+        availability={makeAvailability({ promotion_days: null })}
+        isLoading={false}
+        isError={false}
+      />,
+    )
+    expect(screen.getByText('—')).toBeTruthy()
+  })
+
+  it('shows a loading state while assessing', () => {
+    render(<AvailabilityPanel isLoading isError={false} />)
+    expect(screen.getByText('Assessing data availability…')).toBeTruthy()
+  })
+})
diff --git a/frontend/src/components/champion-selector/availability-panel.tsx b/frontend/src/components/champion-selector/availability-panel.tsx
new file mode 100644
index 00000000..3dfa7370
--- /dev/null
+++ b/frontend/src/components/champion-selector/availability-panel.tsx
@@ -0,0 +1,146 @@
+import { AlertTriangle, DatabaseZap } from 'lucide-react'
+import { EmptyState } from '@/components/common/error-display'
+import { LoadingState } from '@/components/common/loading-state'
+import { Badge } from '@/components/ui/badge'
+import { Card, CardContent, CardHeader, CardTitle } from '@/components/ui/card'
+import { formatNumber, formatPercent } from '@/lib/api'
+import type { AvailabilityStatus, PairAvailability } from '@/types/api'
+
+interface AvailabilityPanelProps {
+  availability?: PairAvailability
+  isLoading: boolean
+  isError: boolean
+}
+
+const STATUS_VARIANT: Record<
+  AvailabilityStatus,
+  'default' | 'secondary' | 'destructive'
+> = {
+  ready: 'default',
+  limited: 'secondary',
+  unusable: 'destructive',
+}
+
+const STATUS_LABEL: Record<AvailabilityStatus, string> = {
+  ready: 'Ready',
+  limited: 'Limited',
+  unusable: 'Unusable',
+}
+
+function Metric({ label, value }: { label: string; value: string }) {
+  return (
+    <div className="rounded-md border bg-muted/30 p-3">
+      <p className="text-xs text-muted-foreground">{label}</p>
+      <p className="mt-0.5 text-lg font-semibold tabular-nums">{value}</p>
+    </div>
+  )
+}
+
+/**
+ * Renders the (store, product) data-availability triage for the Champion
+ * Selector. Slice A surfaces the backend assessment only — no run, no charts.
+ */
+export function AvailabilityPanel({
+  availability,
+  isLoading,
+  isError,
+}: AvailabilityPanelProps) {
+  if (isLoading) {
+    return <LoadingState message="Assessing data availability…" />
+  }
+
+  if (isError) {
+    return (
+      <EmptyState
+        title="Could not assess availability"
+        description="The availability check failed for this pair. Try a different store/product or check the backend."
+        icon={<AlertTriangle className="h-12 w-12" />}
+      />
+    )
+  }
+
+  if (!availability) {
+    return (
+      <EmptyState
+        title="Pick a store and product"
+        description="Choose a valid store, product and horizon to see whether the pair has enough history to model."
+        icon={<DatabaseZap className="h-12 w-12" />}
+      />
+    )
+  }
+
+  // Not-enough-data state: an unusable pair or one with zero observed history.
+  if (availability.status === 'unusable' || availability.observed_days === 0) {
+    return (
+      <EmptyState
+        title="Not enough data to model this pair"
+        description="This store/product pair has too little observed sales history for a reliable comparison. Pick a different pair or a longer window."
+        icon={<DatabaseZap className="h-12 w-12" />}
+      />
+    )
+  }
+
+  const split = availability.recommended_split_config
+
+  return (
+    <Card data-testid="availability-panel">
+      <CardHeader>
+        <div className="flex items-center justify-between gap-2">
+          <CardTitle className="text-lg">Data availability</CardTitle>
+          <Badge
+            variant={STATUS_VARIANT[availability.status]}
+            data-testid="availability-status-badge"
+          >
+            {STATUS_LABEL[availability.status]}
+          </Badge>
+        </div>
+      </CardHeader>
+      <CardContent className="space-y-4">
+        <div className="grid grid-cols-2 gap-3 sm:grid-cols-3 lg:grid-cols-5">
+          <Metric label="Observed days" value={formatNumber(availability.observed_days)} />
+          <Metric
+            label="Coverage"
+            value={formatPercent(availability.coverage_ratio * 100)}
+          />
+          <Metric label="Zero-sale days" value={formatNumber(availability.zero_sale_days)} />
+          <Metric
+            label="Promotion days"
+            value={
+              availability.promotion_days === null
+                ? '—'
+                : formatNumber(availability.promotion_days)
+            }
+          />
+          <Metric
+            label="Avg daily demand"
+            value={formatNumber(availability.average_daily_demand, 2)}
+          />
+        </div>
+
+        <div className="rounded-md border p-3">
+          <p className="text-xs font-medium text-muted-foreground">
+            Recommended split
+          </p>
+          <p className="mt-1 text-sm tabular-nums">
+            {split.strategy} · {split.n_splits} splits · min train{' '}
+            {split.min_train_size}d · gap {split.gap}d · horizon {split.horizon}d
+          </p>
+        </div>
+
+        {availability.warnings.length > 0 && (
+          <ul className="space-y-1">
+            {availability.warnings.map((warning, index) => (
+              <li
+                key={index}
+                className="flex items-start gap-2 text-xs text-muted-foreground"
+              >
+                <AlertTriangle className="mt-0.5 h-3.5 w-3.5 shrink-0 text-amber-500" />
+                <span>{warning}</span>
+              </li>
+            ))}
+          </ul>
+        )}
+      </CardContent>
+    </Card>
+  )
+}
diff --git a/frontend/src/components/champion-selector/backtest-settings-form.test.tsx b/frontend/src/components/champion-selector/backtest-settings-form.test.tsx
new file mode 100644
index 00000000..b9df7a2b
--- /dev/null
+++ b/frontend/src/components/champion-selector/backtest-settings-form.test.tsx
@@ -0,0 +1,120 @@
+import { afterEach, beforeAll, describe, expect, it, vi } from 'vitest'
+import { cleanup, fireEvent, render, screen } from '@testing-library/react'
+import { BacktestSettingsForm } from './backtest-settings-form'
+import { splitConfigErrors } from './split-config'
+import type { SplitConfig } from '@/types/api'
+
+// Radix Collapsible/Select need a couple of layout APIs jsdom lacks.
+beforeAll(() => {
+  class ResizeObserverStub {
+    observe() {}
+    unobserve() {}
+    disconnect() {}
+  }
+  vi.stubGlobal('ResizeObserver', ResizeObserverStub)
+  if (!Element.prototype.hasPointerCapture) {
+    Element.prototype.hasPointerCapture = () => false
+  }
+  if (!Element.prototype.scrollIntoView) {
+    Element.prototype.scrollIntoView = () => {}
+  }
+})
+
+afterEach(cleanup)
+
+const VALID: SplitConfig = {
+  strategy: 'expanding',
+  n_splits: 5,
+  min_train_size: 30,
+  gap: 0,
+  horizon: 14,
+}
+
+describe('splitConfigErrors', () => {
+  it('accepts a valid config', () => {
+    expect(splitConfigErrors(VALID)).toEqual([])
+  })
+
+  it('flags out-of-range n_splits and gap >= horizon', () => {
+    const errors = splitConfigErrors({ ...VALID, n_splits: 1, gap: 14 })
+    expect(errors.some((e) => e.includes('Splits'))).toBe(true)
+    expect(errors.some((e) => e.includes('Gap must be smaller'))).toBe(true)
+  })
+})
+
+describe('BacktestSettingsForm', () => {
+  it('reveals the advanced split inputs when toggled', () => {
+    render(
+      <BacktestSettingsForm
+        value={VALID}
+        rankingMetric="wape"
+        forecastHorizon={14}
+        onChange={() => {}}
+        onRankingMetricChange={() => {}}
+      />,
+    )
+    // Hidden until the collapsible opens.
+    expect(screen.queryByTestId('settings-n-splits')).toBeNull()
+    fireEvent.click(screen.getByTestId('advanced-toggle'))
+    expect(screen.getByTestId('settings-n-splits')).toBeTruthy()
+    expect(screen.getByTestId('settings-gap')).toBeTruthy()
+  })
+
+  it('renders validation errors for an invalid config', () => {
+    render(
+      <BacktestSettingsForm
+        value={{ ...VALID, n_splits: 1 }}
+        rankingMetric="wape"
+        forecastHorizon={14}
+        onChange={() => {}}
+        onRankingMetricChange={() => {}}
+      />,
+    )
+    expect(screen.getByTestId('settings-errors')).toBeTruthy()
+    expect(screen.getByText(/Splits must be between 2 and 20/)).toBeTruthy()
+  })
+
+  it('"Use recommended split" emits the recommended config (horizon synced)', () => {
+    const onChange = vi.fn()
+    const recommended: SplitConfig = {
+      strategy: 'sliding',
+      n_splits: 8,
+      min_train_size: 45,
+      gap: 1,
+      horizon: 7, // intentionally different — must be overridden to forecastHorizon
+    }
+    render(
+      <BacktestSettingsForm
+        value={VALID}
+        rankingMetric="wape"
+        forecastHorizon={14}
+        onChange={onChange}
+        onRankingMetricChange={() => {}}
+        recommended={recommended}
+      />,
+    )
+    fireEvent.click(screen.getByTestId('use-recommended-split'))
+    expect(onChange).toHaveBeenCalledWith({
+      strategy: 'sliding',
+      n_splits: 8,
+      min_train_size: 45,
+      gap: 1,
+      horizon: 14, // synced to forecastHorizon
+    })
+  })
+
+  it('keeps the horizon input read-only and equal to the forecast horizon', () => {
+    render(
+      <BacktestSettingsForm
+        value={VALID}
+        rankingMetric="wape"
+        forecastHorizon={21}
+        onChange={() => {}}
+        onRankingMetricChange={() => {}}
+      />,
+    )
+    const horizon = screen.getByTestId('settings-horizon') as HTMLInputElement
+    expect(horizon.value).toBe('21')
+    expect(horizon.readOnly).toBe(true)
+  })
+})
diff --git a/frontend/src/components/champion-selector/backtest-settings-form.tsx b/frontend/src/components/champion-selector/backtest-settings-form.tsx
new file mode 100644
index 00000000..fdaca7f3
--- /dev/null
+++ b/frontend/src/components/champion-selector/backtest-settings-form.tsx
@@ -0,0 +1,206 @@
+import { useState } from 'react'
+import { ChevronDown, Settings2, Wand2 } from 'lucide-react'
+import { Button } from '@/components/ui/button'
+import {
+  Collapsible,
+  CollapsibleContent,
+  CollapsibleTrigger,
+} from '@/components/ui/collapsible'
+import { Input } from '@/components/ui/input'
+import {
+  Select,
+  SelectContent,
+  SelectItem,
+  SelectTrigger,
+  SelectValue,
+} from '@/components/ui/select'
+import { cn } from '@/lib/utils'
+import type { RankingMetric, SplitConfig, SplitStrategy } from '@/types/api'
+import { BIAS_EXPLANATION, RANKING_TIE_BREAK } from './copy'
+import { splitConfigErrors } from './split-config'
+
+interface BacktestSettingsFormProps {
+  value: SplitConfig
+  rankingMetric: RankingMetric
+  forecastHorizon: number
+  onChange: (next: SplitConfig) => void
+  onRankingMetricChange: (metric: RankingMetric) => void
+  recommended?: SplitConfig
+}
+
+const RANKING_METRICS: { value: RankingMetric; label: string }[] = [
+  { value: 'wape', label: 'WAPE (default)' },
+  { value: 'smape', label: 'sMAPE' },
+  { value: 'mae', label: 'MAE' },
+  { value: 'bias', label: 'Bias' },
+]
+
+function Field({
+  label,
+  children,
+  hint,
+}: {
+  label: string
+  children: React.ReactNode
+  hint?: string
+}) {
+  return (
+    <div className="space-y-1">
+      <span className="text-xs text-muted-foreground">{label}</span>
+      {children}
+      {hint && <p className="text-[11px] text-muted-foreground">{hint}</p>}
+    </div>
+  )
+}
+
+/**
+ * Simple/advanced backtest-settings form. The horizon is DERIVED from
+ * `forecastHorizon` (kept equal so the assembled run request is always valid)
+ * and shown read-only. The advanced toggle reveals the split-CV knobs.
+ */
+export function BacktestSettingsForm({
+  value,
+  rankingMetric,
+  forecastHorizon,
+  onChange,
+  onRankingMetricChange,
+  recommended,
+}: BacktestSettingsFormProps) {
+  const [advancedOpen, setAdvancedOpen] = useState(false)
+  const errors = splitConfigErrors(value)
+
+  function patch(partial: Partial<SplitConfig>) {
+    onChange({ ...value, ...partial, horizon: forecastHorizon })
+  }
+
+  return (
+    <div className="space-y-4" data-testid="backtest-settings-form">
+      <div className="grid grid-cols-1 gap-4 sm:grid-cols-2">
+        <Field label="Ranking metric" hint={`${RANKING_TIE_BREAK} ${BIAS_EXPLANATION}`}>
+          <Select
+            value={rankingMetric}
+            onValueChange={(metric) => onRankingMetricChange(metric as RankingMetric)}
+          >
+            <SelectTrigger data-testid="ranking-metric-select">
+              <SelectValue />
+            </SelectTrigger>
+            <SelectContent>
+              {RANKING_METRICS.map((metric) => (
+                <SelectItem key={metric.value} value={metric.value}>
+                  {metric.label}
+                </SelectItem>
+              ))}
+            </SelectContent>
+          </Select>
+        </Field>
+        <Field
+          label="Horizon (days)"
+          hint="Locked to the forecast horizon above so the backtest matches the forecast."
+        >
+          <Input
+            type="number"
+            value={String(forecastHorizon)}
+            readOnly
+            disabled
+            data-testid="settings-horizon"
+          />
+        </Field>
+      </div>
+
+      {recommended && (
+        <Button
+          type="button"
+          variant="outline"
+          size="sm"
+          data-testid="use-recommended-split"
+          onClick={() =>
+            onChange({ ...recommended, horizon: forecastHorizon })
+          }
+        >
+          <Wand2 className="mr-2 h-4 w-4" />
+          Use recommended split
+        </Button>
+      )}
+
+      <Collapsible open={advancedOpen} onOpenChange={setAdvancedOpen}>
+        <CollapsibleTrigger asChild>
+          <Button type="button" variant="ghost" size="sm" data-testid="advanced-toggle">
+            <Settings2 className="mr-2 h-4 w-4" />
+            Advanced split settings
+            <ChevronDown
+              className={cn(
+                'ml-2 h-4 w-4 transition-transform',
+                advancedOpen && 'rotate-180',
+              )}
+            />
+          </Button>
+        </CollapsibleTrigger>
+        <CollapsibleContent className="pt-3">
+          <div className="grid grid-cols-1 gap-4 sm:grid-cols-2 lg:grid-cols-4">
+            <Field label="Strategy">
+              <Select
+                value={value.strategy}
+                onValueChange={(strategy) =>
+                  patch({ strategy: strategy as SplitStrategy })
+                }
+              >
+                <SelectTrigger data-testid="settings-strategy">
+                  <SelectValue />
+                </SelectTrigger>
+                <SelectContent>
+                  <SelectItem value="expanding">Expanding</SelectItem>
+                  <SelectItem value="sliding">Sliding</SelectItem>
+                </SelectContent>
+              </Select>
+            </Field>
+            <Field label="Splits (2–20)">
+              <Input
+                type="number"
+                min={2}
+                max={20}
+                value={String(value.n_splits)}
+                data-testid="settings-n-splits"
+                onChange={(event) =>
+                  patch({ n_splits: Number(event.target.value) || 0 })
+                }
+              />
+            </Field>
+            <Field label="Min train (≥7d)">
+              <Input
+                type="number"
+                min={7}
+                value={String(value.min_train_size)}
+                data-testid="settings-min-train"
+                onChange={(event) =>
+                  patch({ min_train_size: Number(event.target.value) || 0 })
+                }
+              />
+            </Field>
+            <Field label="Gap (0–30d)">
+              <Input
+                type="number"
+                min={0}
+                max={30}
+                value={String(value.gap)}
+                data-testid="settings-gap"
+                onChange={(event) =>
+                  patch({ gap: Number(event.target.value) || 0 })
+                }
+              />
+            </Field>
+          </div>
+        </CollapsibleContent>
+      </Collapsible>
+
+      {errors.length > 0 && (
+        <ul className="space-y-0.5" data-testid="settings-errors">
+          {errors.map((error) => (
+            <li key={error} className="text-xs text-destructive">
+              {error}
+            </li>
+          ))}
+        </ul>
+      )}
+    </div>
+  )
+}
diff --git a/frontend/src/components/champion-selector/candidate-model-picker.test.tsx b/frontend/src/components/champion-selector/candidate-model-picker.test.tsx
new file mode 100644
index 00000000..8c7d171d
--- /dev/null
+++ b/frontend/src/components/champion-selector/candidate-model-picker.test.tsx
@@ -0,0 +1,99 @@
+import { afterEach, describe, expect, it, vi } from 'vitest'
+import { cleanup, fireEvent, render, screen } from '@testing-library/react'
+import { CandidateModelPicker, MAX_CANDIDATES } from './candidate-model-picker'
+import type { CandidateModelInfo, ModelCatalogResponse } from '@/types/api'
+
+afterEach(cleanup)
+
+function model(
+  model_type: string,
+  overrides: Partial<CandidateModelInfo> = {},
+): CandidateModelInfo {
+  return {
+    model_type,
+    label: model_type,
+    family: 'baseline',
+    feature_aware: false,
+    requires_extra: false,
+    default_params: {},
+    supports_auto_predict: true,
+    description: `desc ${model_type}`,
+    ...overrides,
+  }
+}
+
+const CATALOG: ModelCatalogResponse = {
+  models: [
+    model('naive'),
+    model('regression', { family: 'tree', feature_aware: true }),
+    model('lightgbm', { family: 'tree', feature_aware: true, requires_extra: true }),
+    model('xgboost', { family: 'tree', feature_aware: true, requires_extra: true }),
+  ],
+  default_candidate_model_types: ['naive', 'regression'],
+}
+
+describe('CandidateModelPicker', () => {
+  it('toggling a model calls onChange with the new selection', () => {
+    const onChange = vi.fn()
+    render(
+      <CandidateModelPicker
+        catalog={CATALOG}
+        selected={['naive']}
+        onChange={onChange}
+        isLoading={false}
+      />,
+    )
+    fireEvent.click(screen.getByTestId('candidate-checkbox-regression'))
+    expect(onChange).toHaveBeenCalledWith(['naive', 'regression'])
+  })
+
+  it('deselects an already-selected model', () => {
+    const onChange = vi.fn()
+    render(
+      <CandidateModelPicker
+        catalog={CATALOG}
+        selected={['naive', 'regression']}
+        onChange={onChange}
+        isLoading={false}
+      />,
+    )
+    fireEvent.click(screen.getByTestId('candidate-checkbox-naive'))
+    expect(onChange).toHaveBeenCalledWith(['regression'])
+  })
+
+  it('flags opt-in-extra models with an "extra" badge', () => {
+    render(
+      <CandidateModelPicker
+        catalog={CATALOG}
+        selected={[]}
+        onChange={() => {}}
+        isLoading={false}
+      />,
+    )
+    expect(screen.getByTestId('candidate-extra-badge-lightgbm')).toBeTruthy()
+    expect(screen.getByTestId('candidate-extra-badge-xgboost')).toBeTruthy()
+    // A baseline model carries no extra badge.
+    expect(screen.queryByTestId('candidate-extra-badge-naive')).toBeNull()
+  })
+
+  it('caps the selection at MAX_CANDIDATES and disables unselected models', () => {
+    const many = Array.from({ length: MAX_CANDIDATES }, (_, i) => `m${i}`)
+    const onChange = vi.fn()
+    const bigCatalog: ModelCatalogResponse = {
+      models: [...many.map((m) => model(m)), model('extra_model')],
+      default_candidate_model_types: [],
+    }
+    render(
+      <CandidateModelPicker
+        catalog={bigCatalog}
+        selected={many}
+        onChange={onChange}
+        isLoading={false}
+      />,
+    )
+    expect(screen.getByTestId('candidate-cap-badge')).toBeTruthy()
+    // Clicking an unselected model at the cap must NOT add it.
+    fireEvent.click(screen.getByTestId('candidate-checkbox-extra_model'))
+    expect(onChange).not.toHaveBeenCalled()
+  })
+})
diff --git a/frontend/src/components/champion-selector/candidate-model-picker.tsx b/frontend/src/components/champion-selector/candidate-model-picker.tsx
new file mode 100644
index 00000000..6a3b4366
--- /dev/null
+++ b/frontend/src/components/champion-selector/candidate-model-picker.tsx
@@ -0,0 +1,129 @@
+import { LoadingState } from '@/components/common/loading-state'
+import { Badge } from '@/components/ui/badge'
+import { Checkbox } from '@/components/ui/checkbox'
+import { cn } from '@/lib/utils'
+import type { CandidateModelInfo, ModelCatalogResponse, ModelFamily } from '@/types/api'
+
+/** Backend caps `candidate_models` at 10 (ModelSelectionRunRequest.max_length). */
+export const MAX_CANDIDATES = 10
+
+interface CandidateModelPickerProps {
+  catalog?: ModelCatalogResponse
+  selected: string[]
+  onChange: (types: string[]) => void
+  isLoading: boolean
+}
+
+const FAMILY_ORDER: ModelFamily[] = ['baseline', 'additive', 'tree']
+const FAMILY_LABEL: Record<ModelFamily, string> = {
+  baseline: 'Baseline',
+  additive: 'Additive',
+  tree: 'Tree-based',
+}
+
+/**
+ * Candidate-model multi-select fed by the BACKEND catalog (never the hardcoded
+ * `model-type-utils`). Mirrors the batch-matrix-picker conventions: a checkbox
+ * per model grouped by family, opt-in-extra + feature-aware badges, and a
+ * selection cap of 10.
+ */
+export function CandidateModelPicker({
+  catalog,
+  selected,
+  onChange,
+  isLoading,
+}: CandidateModelPickerProps) {
+  if (isLoading) {
+    return <LoadingState message="Loading models…" />
+  }
+  if (!catalog || catalog.models.length === 0) {
+    return (
+      <p className="text-sm text-muted-foreground">No models available.</p>
+    )
+  }
+
+  const selectedSet = new Set(selected)
+  const atCap = selected.length >= MAX_CANDIDATES
+
+  function toggle(modelType: string) {
+    if (selectedSet.has(modelType)) {
+      onChange(selected.filter((type) => type !== modelType))
+    } else if (!atCap) {
+      onChange([...selected, modelType])
+    }
+  }
+
+  const byFamily = new Map<ModelFamily, CandidateModelInfo[]>()
+  for (const model of catalog.models) {
+    const list = byFamily.get(model.family) ?? []
+    list.push(model)
+    byFamily.set(model.family, list)
+  }
+
+  return (
+    <div className="space-y-4" data-testid="candidate-model-picker">
+      <div className="flex items-center justify-between">
+        <span className="text-xs text-muted-foreground">
+          {selected.length} of {MAX_CANDIDATES} selected
+        </span>
+        {atCap && (
+          <Badge variant="secondary" data-testid="candidate-cap-badge">
+            Max {MAX_CANDIDATES} reached
+          </Badge>
+        )}
+      </div>
+
+      {FAMILY_ORDER.filter((family) => byFamily.has(family)).map((family) => (
+        <div key={family} className="space-y-2">
+          <p className="text-xs font-semibold uppercase tracking-wide text-muted-foreground">
+            {FAMILY_LABEL[family]}
+          </p>
+          <div className="grid grid-cols-1 gap-2 sm:grid-cols-2">
+            {(byFamily.get(family) ?? []).map((model) => {
+              const isSelected = selectedSet.has(model.model_type)
+              const disabled = !isSelected && atCap
+              return (
+                <label
+                  key={model.model_type}
+                  data-testid={`candidate-model-${model.model_type}`}
+                  className={cn(
+                    'flex cursor-pointer items-start gap-3 rounded-md border p-3 transition-colors',
+                    isSelected && 'border-primary bg-primary/5',
+                    disabled && 'cursor-not-allowed opacity-50',
+                  )}
+                >
+                  <Checkbox
+                    checked={isSelected}
+                    disabled={disabled}
+                    data-testid={`candidate-checkbox-${model.model_type}`}
+                    onCheckedChange={() => toggle(model.model_type)}
+                    className="mt-0.5"
+                  />
+                  <div className="min-w-0 space-y-1">
+                    <div className="flex flex-wrap items-center gap-1.5">
+                      <span className="text-sm font-medium">{model.label}</span>
+                      {model.requires_extra && (
+                        <Badge
+                          variant="outline"
+                          data-testid={`candidate-extra-badge-${model.model_type}`}
+                        >
+                          extra
+                        </Badge>
+                      )}
+                      {model.feature_aware && (
+                        <Badge variant="outline">feature-aware</Badge>
+                      )}
+                    </div>
+                    <p className="text-xs text-muted-foreground">
+                      {model.description}
+                    </p>
+                  </div>
+                </label>
+              )
+            })}
+          </div>
+        </div>
+      ))}
+    </div>
+  )
+}
diff --git a/frontend/src/components/champion-selector/copy.ts b/frontend/src/components/champion-selector/copy.ts
new file mode 100644
index 00000000..bafbfd53
--- /dev/null
+++ b/frontend/src/components/champion-selector/copy.ts
@@ -0,0 +1,20 @@
+/**
+ * Shared, LOCKED copy for the Champion Selector workflow (Slices A/B/C).
+ *
+ * Kept in a `.ts` (not `.tsx`) module so the `react-refresh/only-export-components`
+ * lint rule never trips on these non-component exports. Slices B and C import
+ * the SAME constants so the bias wording / tie-break explanation never drift.
+ */
+
+/** LOCKED #7 — the canonical bias explanation reused everywhere bias is shown. */
+export const BIAS_EXPLANATION =
+  'Positive bias means the model under-forecasts (risk of stockouts); ' +
+  'negative bias means it over-forecasts (risk of overstock).'
+
+/** LOCKED #8 — the deterministic ranking tie-break chain. */
+export const RANKING_TIE_BREAK =
+  'Ranked by WAPE, then sMAPE, then |bias|, then MAE.'
+
+/** Copy for the disabled Slice-A "Run comparison" CTA. */
+export const RUN_COMPARISON_PENDING =
+  'Model comparison runs in the next update.'
diff --git a/frontend/src/components/champion-selector/decision/business-interpretation-panel.test.tsx b/frontend/src/components/champion-selector/decision/business-interpretation-panel.test.tsx
new file mode 100644
index 00000000..27fd9c50
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/business-interpretation-panel.test.tsx
@@ -0,0 +1,47 @@
+import { afterEach, describe, expect, it } from 'vitest'
+import { cleanup, render, screen } from '@testing-library/react'
+import { BusinessInterpretationPanel } from './business-interpretation-panel'
+import type { ForecastDecision } from '@/types/api'
+
+afterEach(cleanup)
+
+const decision: ForecastDecision = {
+  method: 'heuristic',
+  lead_time_days: 7,
+  service_level: 0.95,
+  z_value: 1.6449,
+  sigma_daily_demand: 1.4,
+  expected_demand_over_lead_time: 70,
+  safety_stock: 6.1,
+  reorder_point: 76.1,
+  bias_risk_text: 'Positive bias means the model under-forecasts (risk of stockouts).',
+  caveats: ['Safety stock is a deterministic heuristic.'],
+}
+
+const businessSummary = {
+  headline: 'Recommended model: naive (high confidence).',
+  winner: { model_type: 'naive', summary: 'WAPE 10.0%' },
+  comparison: { lead_text: '15% lower WAPE than the runner-up' },
+  data_notes: ['Observed 120 of 120 calendar days.'],
+}
+
+describe('BusinessInterpretationPanel', () => {
+  it('renders the headline, expected demand, and bias risk', () => {
+    render(
+      <BusinessInterpretationPanel businessSummary={businessSummary} decision={decision} />,
+    )
+    const text = screen.getByTestId('business-interpretation-panel').textContent ?? ''
+    expect(text).toContain('Recommended model: naive')
+    expect(screen.getByTestId('business-expected-demand').textContent).toContain('70.0')
+    expect(screen.getByTestId('business-bias-risk').textContent).toContain(
+      'under-forecasts',
+    )
+  })
+
+  it('falls back to the bias explanation when no decision is present', () => {
+    render(<BusinessInterpretationPanel businessSummary={businessSummary} decision={null} />)
+    expect(
+      screen.getByText(/Positive bias means the model under-forecasts/),
+    ).toBeTruthy()
+  })
+})
diff --git a/frontend/src/components/champion-selector/decision/business-interpretation-panel.tsx b/frontend/src/components/champion-selector/decision/business-interpretation-panel.tsx
new file mode 100644
index 00000000..5cb9d1d0
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/business-interpretation-panel.tsx
@@ -0,0 +1,84 @@
+import { Card, CardContent, CardDescription, CardHeader, CardTitle } from '@/components/ui/card'
+import { BIAS_EXPLANATION } from '@/components/champion-selector/copy'
+import type { ForecastDecision } from '@/types/api'
+
+interface BusinessInterpretationPanelProps {
+  /** The deterministic backend `business_summary` (read-only). */
+  businessSummary: Record<string, unknown> | null
+  /** The decision heuristic (carries bias-risk text + expected demand). */
+  decision: ForecastDecision | null
+}
+
+function str(value: unknown): string | null {
+  return typeof value === 'string' ? value : null
+}
+
+/**
+ * Slice C — business interpretation. Renders the SAME `business_summary` the
+ * backend computed (read-only — Slice B's winner card owns the headline) and
+ * ADDS the decision-layer fields (expected demand + bias risk + caveats).
+ */
+export function BusinessInterpretationPanel({
+  businessSummary,
+  decision,
+}: BusinessInterpretationPanelProps) {
+  const headline = str(businessSummary?.['headline'])
+  const winner = businessSummary?.['winner'] as Record<string, unknown> | null | undefined
+  const winnerSummary = str(winner?.['summary'])
+  const comparison = businessSummary?.['comparison'] as Record<string, unknown> | null | undefined
+  const leadText = str(comparison?.['lead_text'])
+  const dataNotes = Array.isArray(businessSummary?.['data_notes'])
+    ? (businessSummary?.['data_notes'] as unknown[]).filter((x): x is string => typeof x === 'string')
+    : []
+
+  return (
+    <Card data-testid="business-interpretation-panel">
+      <CardHeader>
+        <CardTitle>Business interpretation</CardTitle>
+        {headline && <CardDescription>{headline}</CardDescription>}
+      </CardHeader>
+      <CardContent className="space-y-4 text-sm">
+        {winnerSummary && (
+          <p>
+            <span className="font-medium">Why it won: </span>
+            {winnerSummary}
+            {leadText ? ` — ${leadText}.` : '.'}
+          </p>
+        )}
+
+        {decision && (
+          <div className="space-y-2">
+            <p data-testid="business-expected-demand">
+              <span className="font-medium">Expected demand over lead time: </span>
+              {decision.expected_demand_over_lead_time.toFixed(1)} units (
+              {decision.lead_time_days} days).
+            </p>
+            <p className="text-muted-foreground" data-testid="business-bias-risk">
+              {decision.bias_risk_text}
+            </p>
+          </div>
+        )}
+
+        {!decision && (
+          <p className="text-xs text-muted-foreground">{BIAS_EXPLANATION}</p>
+        )}
+
+        {dataNotes.length > 0 && (
+          <ul className="list-disc space-y-1 pl-5 text-xs text-muted-foreground">
+            {dataNotes.map((note, i) => (
+              <li key={i}>{note}</li>
+            ))}
+          </ul>
+        )}
+
+        {decision?.caveats?.length ? (
+          <ul className="list-disc space-y-1 pl-5 text-xs text-muted-foreground">
+            {decision.caveats.map((caveat, i) => (
+              <li key={i}>{caveat}</li>
+            ))}
+          </ul>
+        ) : null}
+      </CardContent>
+    </Card>
+  )
+}
diff --git a/frontend/src/components/champion-selector/decision/constants.ts b/frontend/src/components/champion-selector/decision/constants.ts
new file mode 100644
index 00000000..1005d481
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/constants.ts
@@ -0,0 +1,19 @@
+/**
+ * Non-component constants for the Slice C decision panels. Kept in a `.ts`
+ * module so `react-refresh/only-export-components` never trips on them.
+ */
+
+/** Service levels the safety-stock z-table supports exactly (others snap nearest). */
+export const SERVICE_LEVEL_OPTIONS = [0.9, 0.95, 0.975, 0.99] as const
+
+/** Capability-limited blocked state for a feature-aware winner (LOCKED #5). */
+export const FEATURE_AWARE_BLOCKED_COPY =
+  'Forecast not available for feature-aware models — use the What-If Planner ' +
+  '(Scenarios) to forecast through explicit assumptions.'
+
+/** The promotion-is-audited note shown in the promote dialog. */
+export const PROMOTE_AUDIT_NOTE =
+  'Promotion is explicit and recorded — the approver and decision are saved as ' +
+  'an audit record on this run. It is never automatic.'
+
+export const SAFETY_STOCK_HEADER = 'Safety stock (heuristic)'
diff --git a/frontend/src/components/champion-selector/decision/daily-forecast-table.test.tsx b/frontend/src/components/champion-selector/decision/daily-forecast-table.test.tsx
new file mode 100644
index 00000000..c4d2a73b
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/daily-forecast-table.test.tsx
@@ -0,0 +1,26 @@
+import { afterEach, describe, expect, it } from 'vitest'
+import { cleanup, render, screen } from '@testing-library/react'
+import { DailyForecastTable } from './daily-forecast-table'
+import type { ModelSelectionForecastSummary } from '@/types/api'
+
+afterEach(cleanup)
+
+const forecast: ModelSelectionForecastSummary = {
+  points: [
+    { date: '2026-06-01', forecast: 10.5, lower_bound: 8, upper_bound: 12 },
+    { date: '2026-06-02', forecast: 14.2, lower_bound: null, upper_bound: null },
+  ],
+  total_demand: 24.7,
+  average_demand: 12.35,
+  horizon: 2,
+}
+
+describe('DailyForecastTable', () => {
+  it('renders one row per forecast point with the forecast value', () => {
+    render(<DailyForecastTable forecast={forecast} />)
+    const text = screen.getByTestId('daily-forecast-table').textContent ?? ''
+    expect(text).toContain('2026-06-01')
+    expect(text).toContain('10.50')
+    expect(text).toContain('14.20')
+  })
+})
diff --git a/frontend/src/components/champion-selector/decision/daily-forecast-table.tsx b/frontend/src/components/champion-selector/decision/daily-forecast-table.tsx
new file mode 100644
index 00000000..96404c8f
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/daily-forecast-table.tsx
@@ -0,0 +1,57 @@
+import {
+  Table,
+  TableBody,
+  TableCell,
+  TableHead,
+  TableHeader,
+  TableRow,
+} from '@/components/ui/table'
+import { Card, CardContent, CardHeader, CardTitle } from '@/components/ui/card'
+import type { ModelSelectionForecastSummary } from '@/types/api'
+
+interface DailyForecastTableProps {
+  forecast: ModelSelectionForecastSummary
+}
+
+function cell(value: unknown): string {
+  return typeof value === 'number' && Number.isFinite(value) ? value.toFixed(2) : '—'
+}
+
+/** Slice C — the per-day forecast table (date, forecast, lower, upper). */
+export function DailyForecastTable({ forecast }: DailyForecastTableProps) {
+  return (
+    <Card data-testid="daily-forecast-table">
+      <CardHeader>
+        <CardTitle>Daily forecast</CardTitle>
+      </CardHeader>
+      <CardContent>
+        <Table>
+          <TableHeader>
+            <TableRow>
+              <TableHead>Date</TableHead>
+              <TableHead className="text-right">Forecast</TableHead>
+              <TableHead className="text-right">Lower</TableHead>
+              <TableHead className="text-right">Upper</TableHead>
+            </TableRow>
+          </TableHeader>
+          <TableBody>
+            {forecast.points.map((point, index) => (
+              <TableRow key={String(point['date'] ?? index)}>
+                <TableCell>{String(point['date'] ?? '—')}</TableCell>
+                <TableCell className="text-right tabular-nums">
+                  {cell(point['forecast'])}
+                </TableCell>
+                <TableCell className="text-right tabular-nums">
+                  {cell(point['lower_bound'])}
+                </TableCell>
+                <TableCell className="text-right tabular-nums">
+                  {cell(point['upper_bound'])}
+                </TableCell>
+              </TableRow>
+            ))}
+          </TableBody>
+        </Table>
+      </CardContent>
+    </Card>
+  )
+}
diff --git a/frontend/src/components/champion-selector/decision/decision-section.tsx b/frontend/src/components/champion-selector/decision/decision-section.tsx
new file mode 100644
index 00000000..c1dbd95c
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/decision-section.tsx
@@ -0,0 +1,180 @@
+import { useMemo, useState } from 'react'
+import { Button } from '@/components/ui/button'
+import { Card, CardContent } from '@/components/ui/card'
+import { getErrorMessage } from '@/lib/api'
+import {
+  usePredictWinner,
+  usePromoteChampion,
+  useTrainSelected,
+  useTrainWinner,
+} from '@/hooks/use-model-selection'
+import type {
+  ModelCatalogResponse,
+  ModelSelectionRunResponse,
+  PredictWinnerResponse,
+  TrainWinnerResponse,
+} from '@/types/api'
+import { WinnerDecisionPanel } from './winner-decision-panel'
+import { TrainForecastActions } from './train-forecast-actions'
+import { ForecastSummaryCard } from './forecast-summary-card'
+import { ForecastChart } from './forecast-chart'
+import { DailyForecastTable } from './daily-forecast-table'
+import { BusinessInterpretationPanel } from './business-interpretation-panel'
+import { SafetyStockPanel } from './safety-stock-panel'
+import { PromoteChampionDialog } from './promote-champion-dialog'
+
+interface DecisionSectionProps {
+  selectionId: string
+  run: ModelSelectionRunResponse
+  catalog: ModelCatalogResponse | undefined
+}
+
+/**
+ * Slice C — the decision section rendered below a terminal winning run.
+ *
+ * Owns the train / predict / promote mutations (so the page keeps its hooks
+ * unconditional). Mount it with `key={selectionId}` so a fresh run resets the
+ * train/forecast/promote state.
+ */
+export function DecisionSection({ selectionId, run, catalog }: DecisionSectionProps) {
+  const winnerModelType = run.winner?.model_type ?? null
+
+  const [trainResult, setTrainResult] = useState<TrainWinnerResponse | null>(null)
+  const [predictResult, setPredictResult] = useState<PredictWinnerResponse | null>(null)
+  const [leadTimeDays, setLeadTimeDays] = useState(7)
+  const [serviceLevel, setServiceLevel] = useState(0.95)
+  const [promoteOpen, setPromoteOpen] = useState(false)
+  const [promoteError, setPromoteError] = useState<string | null>(null)
+  const [promotedAlias, setPromotedAlias] = useState<string | null>(null)
+
+  const trainWinner = useTrainWinner(selectionId)
+  const trainSelected = useTrainSelected(selectionId)
+  const predict = usePredictWinner(selectionId)
+  const promote = usePromoteChampion(selectionId)
+
+  // Every candidate the run offered (winner + runners-up + failed), de-duped.
+  const candidateModelTypes = useMemo(() => {
+    const seen = new Set<string>()
+    for (const entry of run.ranking) seen.add(entry.model_type)
+    if (winnerModelType) seen.add(winnerModelType)
+    return [...seen]
+  }, [run.ranking, winnerModelType])
+
+  // Capability of the model that WILL be (or was) trained — drives the blocked
+  // forecast state for a feature-aware winner (LOCKED #5).
+  const activeModelType = trainResult?.model_type ?? winnerModelType
+  const supportsAutoPredict = useMemo(() => {
+    const info = catalog?.models.find((m) => m.model_type === activeModelType)
+    return info?.supports_auto_predict ?? true
+  }, [catalog, activeModelType])
+
+  const trained = trainResult !== null || run.final_model !== null
+
+  if (winnerModelType === null) return null
+
+  function handleTrain(modelType: string, overrideReason: string | null) {
+    setPredictResult(null)
+    setPromotedAlias(null)
+    const onSuccess = (data: TrainWinnerResponse) => setTrainResult(data)
+    if (modelType === winnerModelType) {
+      trainWinner.mutate(undefined, { onSuccess })
+    } else {
+      trainSelected.mutate({ model_type: modelType, override_reason: overrideReason }, { onSuccess })
+    }
+  }
+
+  function handleForecast() {
+    predict.mutate(
+      { lead_time_days: leadTimeDays, service_level: serviceLevel },
+      { onSuccess: (data) => setPredictResult(data) },
+    )
+  }
+
+  function handlePromote(body: Parameters<typeof promote.mutate>[0]) {
+    setPromoteError(null)
+    promote.mutate(body, {
+      onSuccess: (data) => setPromotedAlias(data.alias_name),
+      onError: (err) => setPromoteError(getErrorMessage(err)),
+    })
+  }
+
+  const forecast = predictResult?.forecast ?? null
+  const decision = predictResult?.decision ?? null
+  const isOverride = trainResult?.is_override ?? false
+
+  return (
+    <div className="space-y-6" data-testid="decision-section">
+      <WinnerDecisionPanel
+        winnerModelType={winnerModelType}
+        candidateModelTypes={candidateModelTypes}
+        isTraining={trainWinner.isPending || trainSelected.isPending}
+        trainResult={trainResult}
+        onTrain={handleTrain}
+      />
+
+      <Card>
+        <CardContent className="flex flex-col gap-4 pt-6">
+          <TrainForecastActions
+            supportsAutoPredict={supportsAutoPredict}
+            trained={trained}
+            isPredicting={predict.isPending}
+            onForecast={handleForecast}
+          />
+          {predict.isError && (
+            <p className="text-sm text-destructive" data-testid="forecast-error">
+              {getErrorMessage(predict.error)}
+            </p>
+          )}
+        </CardContent>
+      </Card>
+
+      {forecast && (
+        <>
+          <ForecastSummaryCard forecast={forecast} />
+          <ForecastChart forecast={forecast} />
+          <DailyForecastTable forecast={forecast} />
+          <BusinessInterpretationPanel
+            businessSummary={run.business_summary}
+            decision={decision}
+          />
+          <SafetyStockPanel
+            decision={decision}
+            leadTimeDays={leadTimeDays}
+            serviceLevel={serviceLevel}
+            isRecomputing={predict.isPending}
+            onLeadTimeChange={setLeadTimeDays}
+            onServiceLevelChange={setServiceLevel}
+            onRecompute={handleForecast}
+          />
+        </>
+      )}
+
+      {trained && (
+        <Card>
+          <CardContent className="flex items-center justify-between gap-3 pt-6">
+            <p className="text-sm text-muted-foreground">
+              Promote the trained champion to a registry alias (approval-gated).
+            </p>
+            <Button
+              type="button"
+              onClick={() => setPromoteOpen(true)}
+              data-testid="open-promote-dialog"
+            >
+              Promote champion
+            </Button>
+          </CardContent>
+        </Card>
+      )}
+
+      <PromoteChampionDialog
+        open={promoteOpen}
+        onOpenChange={setPromoteOpen}
+        isOverride={isOverride}
+        isPromoting={promote.isPending}
+        promoteError={promoteError}
+        promotedAlias={promotedAlias}
+        onConfirm={handlePromote}
+      />
+    </div>
+  )
+}
diff --git a/frontend/src/components/champion-selector/decision/forecast-chart.test.tsx b/frontend/src/components/champion-selector/decision/forecast-chart.test.tsx
new file mode 100644
index 00000000..c28c6726
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/forecast-chart.test.tsx
@@ -0,0 +1,33 @@
+import { afterEach, beforeAll, describe, expect, it, vi } from 'vitest'
+import { cleanup, render, screen } from '@testing-library/react'
+import { ForecastChart } from './forecast-chart'
+import type { ModelSelectionForecastSummary } from '@/types/api'
+
+// Recharts' ResponsiveContainer needs ResizeObserver in jsdom.
+beforeAll(() => {
+  class ResizeObserverStub {
+    observe() {}
+    unobserve() {}
+    disconnect() {}
+  }
+  vi.stubGlobal('ResizeObserver', ResizeObserverStub)
+})
+
+afterEach(cleanup)
+
+const forecast: ModelSelectionForecastSummary = {
+  points: [
+    { date: '2026-06-01', forecast: 10, lower_bound: 8, upper_bound: 12 },
+    { date: '2026-06-02', forecast: 14, lower_bound: 11, upper_bound: 17 },
+  ],
+  total_demand: 24,
+  average_demand: 12,
+  horizon: 2,
+}
+
+describe('ForecastChart', () => {
+  it('renders the chart container from forecast points', () => {
+    render(<ForecastChart forecast={forecast} />)
+    expect(screen.getByTestId('forecast-chart')).toBeTruthy()
+  })
+})
diff --git a/frontend/src/components/champion-selector/decision/forecast-chart.tsx b/frontend/src/components/champion-selector/decision/forecast-chart.tsx
new file mode 100644
index 00000000..fccd54b8
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/forecast-chart.tsx
@@ -0,0 +1,43 @@
+import { TimeSeriesChart } from '@/components/charts/time-series-chart'
+import type { ModelSelectionForecastSummary } from '@/types/api'
+
+interface ForecastChartProps {
+  forecast: ModelSelectionForecastSummary
+}
+
+interface ChartRow {
+  date: string
+  forecast: number
+  lower?: number
+  upper?: number
+}
+
+/** Slice C — the horizon forecast curve (optional interval band). */
+export function ForecastChart({ forecast }: ForecastChartProps) {
+  const rows: ChartRow[] = forecast.points.map((point) => {
+    const lower = point['lower_bound']
+    const upper = point['upper_bound']
+    return {
+      date: String(point['date'] ?? ''),
+      forecast: Number(point['forecast'] ?? 0),
+      lower: typeof lower === 'number' ? lower : undefined,
+      upper: typeof upper === 'number' ? upper : undefined,
+    }
+  })
+  const hasInterval = rows.some((row) => row.lower !== undefined && row.upper !== undefined)
+
+  return (
+    <div data-testid="forecast-chart">
+      <TimeSeriesChart
+        title="Forecast"
+        description="Predicted demand over the forecast horizon."
+        data={rows}
+        predictedKey="forecast"
+        showActual={false}
+        lowerKey="lower"
+        upperKey="upper"
+        showInterval={hasInterval}
+      />
+    </div>
+  )
+}
diff --git a/frontend/src/components/champion-selector/decision/forecast-summary-card.test.tsx b/frontend/src/components/champion-selector/decision/forecast-summary-card.test.tsx
new file mode 100644
index 00000000..d9e57324
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/forecast-summary-card.test.tsx
@@ -0,0 +1,37 @@
+import { afterEach, describe, expect, it } from 'vitest'
+import { cleanup, render, screen } from '@testing-library/react'
+import { ForecastSummaryCard } from './forecast-summary-card'
+import type { ModelSelectionForecastSummary } from '@/types/api'
+
+afterEach(cleanup)
+
+const forecast: ModelSelectionForecastSummary = {
+  points: [],
+  total_demand: 140,
+  average_demand: 10,
+  horizon: 14,
+  peak_date: '2026-06-02',
+  peak_demand: 25,
+  low_date: '2026-06-03',
+  low_demand: 5,
+}
+
+describe('ForecastSummaryCard', () => {
+  it('renders total, peak, and low tiles', () => {
+    render(<ForecastSummaryCard forecast={forecast} />)
+    const text = screen.getByTestId('forecast-summary-card').textContent ?? ''
+    expect(text).toContain('140.0')
+    expect(text).toContain('25.0')
+    expect(text).toContain('2026-06-02')
+    expect(text).toContain('14d')
+  })
+
+  it('renders an em-dash for null peak/low', () => {
+    render(
+      <ForecastSummaryCard
+        forecast={{ ...forecast, peak_demand: null, low_demand: null }}
+      />,
+    )
+    expect(screen.getByTestId('forecast-summary-card').textContent).toContain('—')
+  })
+})
diff --git a/frontend/src/components/champion-selector/decision/forecast-summary-card.tsx b/frontend/src/components/champion-selector/decision/forecast-summary-card.tsx
new file mode 100644
index 00000000..dddab510
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/forecast-summary-card.tsx
@@ -0,0 +1,48 @@
+import { Card, CardContent, CardHeader, CardTitle } from '@/components/ui/card'
+import type { ModelSelectionForecastSummary } from '@/types/api'
+
+interface ForecastSummaryCardProps {
+  forecast: ModelSelectionForecastSummary
+}
+
+function Tile({ label, value, sub }: { label: string; value: string; sub?: string }) {
+  return (
+    <div className="rounded-md border bg-muted/30 p-3">
+      <p className="text-xs text-muted-foreground">{label}</p>
+      <p className="text-lg font-semibold tabular-nums">{value}</p>
+      {sub && <p className="text-xs text-muted-foreground">{sub}</p>}
+    </div>
+  )
+}
+
+function num(value: number | null | undefined): string {
+  return typeof value === 'number' && Number.isFinite(value) ? value.toFixed(1) : '—'
+}
+
+/** Slice C — total / average / peak / low / horizon KPI tiles (null-safe). */
+export function ForecastSummaryCard({ forecast }: ForecastSummaryCardProps) {
+  return (
+    <Card data-testid="forecast-summary-card">
+      <CardHeader>
+        <CardTitle>Forecast summary</CardTitle>
+      </CardHeader>
+      <CardContent>
+        <div className="grid grid-cols-2 gap-3 sm:grid-cols-3 lg:grid-cols-5">
+          <Tile label="Total demand" value={num(forecast.total_demand)} />
+          <Tile label="Average / day" value={num(forecast.average_demand)} />
+          <Tile
+            label="Peak day"
+            value={num(forecast.peak_demand)}
+            sub={forecast.peak_date ?? undefined}
+          />
+          <Tile
+            label="Low day"
+            value={num(forecast.low_demand)}
+            sub={forecast.low_date ?? undefined}
+          />
+          <Tile label="Horizon" value={`${forecast.horizon}d`} />
+        </div>
+      </CardContent>
+    </Card>
+  )
+}
diff --git a/frontend/src/components/champion-selector/decision/promote-champion-dialog.test.tsx b/frontend/src/components/champion-selector/decision/promote-champion-dialog.test.tsx
new file mode 100644
index 00000000..c7dbe718
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/promote-champion-dialog.test.tsx
@@ -0,0 +1,72 @@
+import { afterEach, describe, expect, it, vi } from 'vitest'
+import { cleanup, fireEvent, render, screen } from '@testing-library/react'
+import { PromoteChampionDialog } from './promote-champion-dialog'
+
+afterEach(cleanup)
+
+function renderDialog(overrides: Partial<Parameters<typeof PromoteChampionDialog>[0]> = {}) {
+  const props = {
+    open: true,
+    onOpenChange: vi.fn(),
+    isOverride: false,
+    isPromoting: false,
+    promoteError: null,
+    promotedAlias: null,
+    onConfirm: vi.fn(),
+    ...overrides,
+  }
+  render(<PromoteChampionDialog {...props} />)
+  return props
+}
+
+describe('PromoteChampionDialog', () => {
+  it('keeps confirm disabled until alias + approver are valid', () => {
+    renderDialog()
+    expect(screen.getByTestId('promote-confirm-action').hasAttribute('disabled')).toBe(true)
+    fireEvent.change(screen.getByTestId('promote-alias-input'), {
+      target: { value: 'champion-x' },
+    })
+    fireEvent.change(screen.getByTestId('promote-approver-input'), {
+      target: { value: 'gabor' },
+    })
+    expect(screen.getByTestId('promote-confirm-action').hasAttribute('disabled')).toBe(false)
+  })
+
+  it('flags an invalid alias name', () => {
+    renderDialog()
+    fireEvent.change(screen.getByTestId('promote-alias-input'), {
+      target: { value: 'Bad Alias' },
+    })
+    expect(screen.getByTestId('promote-alias-error')).toBeTruthy()
+  })
+
+  it('requires the ack checkbox for a non-recommended (override) model', () => {
+    renderDialog({ isOverride: true })
+    fireEvent.change(screen.getByTestId('promote-alias-input'), {
+      target: { value: 'champion-x' },
+    })
+    fireEvent.change(screen.getByTestId('promote-approver-input'), {
+      target: { value: 'gabor' },
+    })
+    // still disabled until the ack is checked
+    expect(screen.getByTestId('promote-confirm-action').hasAttribute('disabled')).toBe(true)
+    fireEvent.click(screen.getByTestId('promote-ack-checkbox'))
+    expect(screen.getByTestId('promote-confirm-action').hasAttribute('disabled')).toBe(false)
+  })
+
+  it('calls onConfirm with the promote body', () => {
+    const props = renderDialog()
+    fireEvent.change(screen.getByTestId('promote-alias-input'), {
+      target: { value: 'champion-x' },
+    })
+    fireEvent.change(screen.getByTestId('promote-approver-input'), {
+      target: { value: 'gabor' },
+    })
+    fireEvent.click(screen.getByTestId('promote-confirm-action'))
+    expect(props.onConfirm).toHaveBeenCalledWith({
+      alias_name: 'champion-x',
+      approved_by: 'gabor',
+      acknowledge_non_recommended: false,
+    })
+  })
+})
diff --git a/frontend/src/components/champion-selector/decision/promote-champion-dialog.tsx b/frontend/src/components/champion-selector/decision/promote-champion-dialog.tsx
new file mode 100644
index 00000000..79e7e486
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/promote-champion-dialog.tsx
@@ -0,0 +1,163 @@
+import { useState } from 'react'
+import { CheckCircle2, ShieldAlert } from 'lucide-react'
+import {
+  AlertDialog,
+  AlertDialogAction,
+  AlertDialogCancel,
+  AlertDialogContent,
+  AlertDialogDescription,
+  AlertDialogFooter,
+  AlertDialogHeader,
+  AlertDialogTitle,
+} from '@/components/ui/alert-dialog'
+import { Checkbox } from '@/components/ui/checkbox'
+import { Input } from '@/components/ui/input'
+import type { PromoteRequest } from '@/types/api'
+import { PROMOTE_AUDIT_NOTE } from './constants'
+
+const ALIAS_RE = /^[a-z0-9][a-z0-9\-_]*$/
+
+interface PromoteChampionDialogProps {
+  open: boolean
+  onOpenChange: (open: boolean) => void
+  /** True when a non-recommended model was trained (requires explicit ack). */
+  isOverride: boolean
+  defaultAliasName?: string
+  isPromoting: boolean
+  /** Error message from the last promote attempt (null on success/idle). */
+  promoteError: string | null
+  /** The alias name on a successful promotion (null until promoted). */
+  promotedAlias: string | null
+  onConfirm: (body: PromoteRequest) => void
+}
+
+/**
+ * Slice C — the approval-gated promote dialog. Requires an approver and a valid
+ * alias name; a non-recommended model additionally requires the ack checkbox.
+ * Mirrors `forecast-intelligence/promote-confirmation-dialog.tsx`, but calls the
+ * model_selection `promote` flow (compare and promote stay separate).
+ */
+export function PromoteChampionDialog({
+  open,
+  onOpenChange,
+  isOverride,
+  defaultAliasName = '',
+  isPromoting,
+  promoteError,
+  promotedAlias,
+  onConfirm,
+}: PromoteChampionDialogProps) {
+  const [aliasName, setAliasName] = useState(defaultAliasName)
+  const [approvedBy, setApprovedBy] = useState('')
+  const [ack, setAck] = useState(false)
+
+  const aliasValid = ALIAS_RE.test(aliasName.trim())
+  const canConfirm =
+    aliasValid &&
+    approvedBy.trim().length > 0 &&
+    (!isOverride || ack) &&
+    !isPromoting
+
+  function handleConfirm() {
+    if (!canConfirm) return
+    onConfirm({
+      alias_name: aliasName.trim(),
+      approved_by: approvedBy.trim(),
+      acknowledge_non_recommended: isOverride ? ack : false,
+    })
+  }
+
+  return (
+    <AlertDialog
+      open={open}
+      onOpenChange={(next) => {
+        if (!next) setAck(false)
+        onOpenChange(next)
+      }}
+    >
+      <AlertDialogContent data-testid="promote-champion-dialog">
+        <AlertDialogHeader>
+          <AlertDialogTitle>Promote champion to a registry alias</AlertDialogTitle>
+          <AlertDialogDescription>{PROMOTE_AUDIT_NOTE}</AlertDialogDescription>
+        </AlertDialogHeader>
+
+        <div className="space-y-3">
+          <div className="space-y-1">
+            <label htmlFor="promote-alias-name" className="text-sm font-medium">
+              Alias name
+            </label>
+            <Input
+              id="promote-alias-name"
+              value={aliasName}
+              onChange={(event) => setAliasName(event.target.value)}
+              placeholder="e.g. champion-store5-prod8"
+              autoComplete="off"
+              data-testid="promote-alias-input"
+            />
+            {aliasName.length > 0 && !aliasValid && (
+              <p className="text-xs text-destructive" data-testid="promote-alias-error">
+                Lowercase letters, digits, hyphens and underscores only (must start
+                with a letter or digit).
+              </p>
+            )}
+          </div>
+
+          <div className="space-y-1">
+            <label htmlFor="promote-approved-by" className="text-sm font-medium">
+              Approved by
+            </label>
+            <Input
+              id="promote-approved-by"
+              value={approvedBy}
+              onChange={(event) => setApprovedBy(event.target.value)}
+              placeholder="your name"
+              autoComplete="off"
+              data-testid="promote-approver-input"
+            />
+          </div>
+
+          {isOverride && (
+            <label className="flex items-start gap-2 text-xs" data-testid="promote-ack-row">
+              <Checkbox
+                checked={ack}
+                onCheckedChange={(state) => setAck(state === true)}
+                data-testid="promote-ack-checkbox"
+              />
+              <span className="flex items-start gap-1.5">
+                <ShieldAlert className="mt-0.5 h-3.5 w-3.5 shrink-0 text-warning" />
+                I understand I am promoting a non-recommended model.
+              </span>
+            </label>
+          )}
+
+          {promoteError && (
+            <p className="text-xs text-destructive" data-testid="promote-error">
+              {promoteError}
+            </p>
+          )}
+
+          {promotedAlias && (
+            <div
+              className="flex items-start gap-2 rounded-md border border-success/40 bg-success/10 p-2 text-xs"
+              data-testid="promote-success"
+            >
+              <CheckCircle2 className="mt-0.5 h-3.5 w-3.5 shrink-0 text-success" />
+              Promoted to alias <span className="font-mono">{promotedAlias}</span>.
+            </div>
+          )}
+        </div>
+
+        <AlertDialogFooter>
+          <AlertDialogCancel>Close</AlertDialogCancel>
+          <AlertDialogAction
+            onClick={handleConfirm}
+            disabled={!canConfirm}
+            data-testid="promote-confirm-action"
+          >
+            {isPromoting ? 'Promoting…' : 'Promote'}
+          </AlertDialogAction>
+        </AlertDialogFooter>
+      </AlertDialogContent>
+    </AlertDialog>
+  )
+}
diff --git a/frontend/src/components/champion-selector/decision/safety-stock-panel.test.tsx b/frontend/src/components/champion-selector/decision/safety-stock-panel.test.tsx
new file mode 100644
index 00000000..a5a27e9f
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/safety-stock-panel.test.tsx
@@ -0,0 +1,54 @@
+import { afterEach, describe, expect, it, vi } from 'vitest'
+import { cleanup, fireEvent, render, screen } from '@testing-library/react'
+import { SafetyStockPanel } from './safety-stock-panel'
+import type { ForecastDecision } from '@/types/api'
+
+afterEach(cleanup)
+
+const decision: ForecastDecision = {
+  method: 'heuristic',
+  lead_time_days: 7,
+  service_level: 0.95,
+  z_value: 1.6449,
+  sigma_daily_demand: 1.41,
+  expected_demand_over_lead_time: 70,
+  safety_stock: 6.13,
+  reorder_point: 76.13,
+  bias_risk_text: 'bias text',
+  caveats: ['heuristic'],
+}
+
+function renderPanel(overrides: Partial<Parameters<typeof SafetyStockPanel>[0]> = {}) {
+  const props = {
+    decision,
+    leadTimeDays: 7,
+    serviceLevel: 0.95,
+    isRecomputing: false,
+    onLeadTimeChange: vi.fn(),
+    onServiceLevelChange: vi.fn(),
+    onRecompute: vi.fn(),
+    ...overrides,
+  }
+  render(<SafetyStockPanel {...props} />)
+  return props
+}
+
+describe('SafetyStockPanel', () => {
+  it('renders the labeled heuristic header and stats', () => {
+    renderPanel()
+    const text = screen.getByTestId('safety-stock-panel').textContent ?? ''
+    expect(text).toContain('Safety stock (heuristic)')
+    expect(text).toContain('1.6449')
+    expect(text).toContain('6.1')
+  })
+
+  it('fires onLeadTimeChange and onRecompute', () => {
+    const props = renderPanel()
+    fireEvent.change(screen.getByTestId('safety-stock-lead-time'), {
+      target: { value: '14' },
+    })
+    expect(props.onLeadTimeChange).toHaveBeenCalledWith(14)
+    fireEvent.click(screen.getByTestId('safety-stock-recompute'))
+    expect(props.onRecompute).toHaveBeenCalledOnce()
+  })
+})
diff --git a/frontend/src/components/champion-selector/decision/safety-stock-panel.tsx b/frontend/src/components/champion-selector/decision/safety-stock-panel.tsx
new file mode 100644
index 00000000..11f1b43e
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/safety-stock-panel.tsx
@@ -0,0 +1,115 @@
+import { Loader2, RefreshCw } from 'lucide-react'
+import { Button } from '@/components/ui/button'
+import { Card, CardContent, CardDescription, CardHeader, CardTitle } from '@/components/ui/card'
+import { Input } from '@/components/ui/input'
+import {
+  Select,
+  SelectContent,
+  SelectItem,
+  SelectTrigger,
+  SelectValue,
+} from '@/components/ui/select'
+import type { ForecastDecision } from '@/types/api'
+import { SAFETY_STOCK_HEADER, SERVICE_LEVEL_OPTIONS } from './constants'
+
+interface SafetyStockPanelProps {
+  decision: ForecastDecision | null
+  leadTimeDays: number
+  serviceLevel: number
+  isRecomputing: boolean
+  onLeadTimeChange: (value: number) => void
+  onServiceLevelChange: (value: number) => void
+  onRecompute: () => void
+}
+
+function Stat({ label, value }: { label: string; value: string }) {
+  return (
+    <div className="rounded-md border bg-muted/30 p-3">
+      <p className="text-xs text-muted-foreground">{label}</p>
+      <p className="text-lg font-semibold tabular-nums">{value}</p>
+    </div>
+  )
+}
+
+/**
+ * Slice C — the CLEARLY-LABELED safety-stock heuristic. Lead time + service
+ * level inputs recompute the forecast decision. Never influences ranking.
+ */
+export function SafetyStockPanel({
+  decision,
+  leadTimeDays,
+  serviceLevel,
+  isRecomputing,
+  onLeadTimeChange,
+  onServiceLevelChange,
+  onRecompute,
+}: SafetyStockPanelProps) {
+  return (
+    <Card data-testid="safety-stock-panel">
+      <CardHeader>
+        <CardTitle>{SAFETY_STOCK_HEADER}</CardTitle>
+        <CardDescription>
+          A deterministic reorder heuristic (demand variability only, constant lead
+          time). Adjust the inputs and recompute.
+        </CardDescription>
+      </CardHeader>
+      <CardContent className="space-y-4">
+        <div className="flex flex-col gap-3 sm:flex-row sm:items-end">
+          <div className="space-y-1">
+            <span className="text-xs text-muted-foreground">Lead time (days)</span>
+            <Input
+              type="number"
+              min={1}
+              max={365}
+              value={String(leadTimeDays)}
+              onChange={(event) => onLeadTimeChange(Number(event.target.value) || 0)}
+              className="w-32"
+              data-testid="safety-stock-lead-time"
+            />
+          </div>
+          <div className="space-y-1">
+            <span className="text-xs text-muted-foreground">Service level</span>
+            <Select
+              value={String(serviceLevel)}
+              onValueChange={(value) => onServiceLevelChange(Number(value))}
+            >
+              <SelectTrigger className="w-32" data-testid="safety-stock-service-level">
+                <SelectValue />
+              </SelectTrigger>
+              <SelectContent>
+                {SERVICE_LEVEL_OPTIONS.map((level) => (
+                  <SelectItem key={level} value={String(level)}>
+                    {(level * 100).toFixed(level === 0.975 ? 1 : 0)}%
+                  </SelectItem>
+                ))}
+              </SelectContent>
+            </Select>
+          </div>
+          <Button
+            type="button"
+            variant="secondary"
+            onClick={onRecompute}
+            disabled={isRecomputing}
+            data-testid="safety-stock-recompute"
+          >
+            {isRecomputing ? (
+              <Loader2 className="mr-2 h-4 w-4 animate-spin" />
+            ) : (
+              <RefreshCw className="mr-2 h-4 w-4" />
+            )}
+            Recompute
+          </Button>
+        </div>
+
+        {decision && (
+          <div className="grid grid-cols-2 gap-3 sm:grid-cols-4">
+            <Stat label="z value" value={decision.z_value.toFixed(4)} />
+            <Stat label="σ daily" value={decision.sigma_daily_demand.toFixed(2)} />
+            <Stat label="Safety stock" value={decision.safety_stock.toFixed(1)} />
+            <Stat label="Reorder point" value={decision.reorder_point.toFixed(1)} />
+          </div>
+        )}
+      </CardContent>
+    </Card>
+  )
+}
diff --git a/frontend/src/components/champion-selector/decision/train-forecast-actions.test.tsx b/frontend/src/components/champion-selector/decision/train-forecast-actions.test.tsx
new file mode 100644
index 00000000..3ff27f99
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/train-forecast-actions.test.tsx
@@ -0,0 +1,48 @@
+import { afterEach, describe, expect, it, vi } from 'vitest'
+import { cleanup, fireEvent, render, screen } from '@testing-library/react'
+import { TrainForecastActions } from './train-forecast-actions'
+
+afterEach(cleanup)
+
+describe('TrainForecastActions', () => {
+  it('shows the blocked state for a feature-aware winner', () => {
+    render(
+      <TrainForecastActions
+        supportsAutoPredict={false}
+        trained
+        isPredicting={false}
+        onForecast={() => {}}
+      />,
+    )
+    expect(screen.getByTestId('forecast-blocked-state').textContent).toContain(
+      'What-If Planner',
+    )
+    expect(screen.queryByTestId('forecast-button')).toBeNull()
+  })
+
+  it('fires onForecast when the trained forecast button is clicked', () => {
+    const onForecast = vi.fn()
+    render(
+      <TrainForecastActions
+        supportsAutoPredict
+        trained
+        isPredicting={false}
+        onForecast={onForecast}
+      />,
+    )
+    fireEvent.click(screen.getByTestId('forecast-button'))
+    expect(onForecast).toHaveBeenCalledOnce()
+  })
+
+  it('disables the forecast button until a model is trained', () => {
+    render(
+      <TrainForecastActions
+        supportsAutoPredict
+        trained={false}
+        isPredicting={false}
+        onForecast={() => {}}
+      />,
+    )
+    expect(screen.getByTestId('forecast-button').hasAttribute('disabled')).toBe(true)
+  })
+})
diff --git a/frontend/src/components/champion-selector/decision/train-forecast-actions.tsx b/frontend/src/components/champion-selector/decision/train-forecast-actions.tsx
new file mode 100644
index 00000000..0ba12605
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/train-forecast-actions.tsx
@@ -0,0 +1,54 @@
+import { Loader2, LineChart, Ban } from 'lucide-react'
+import { Button } from '@/components/ui/button'
+import { FEATURE_AWARE_BLOCKED_COPY } from './constants'
+
+interface TrainForecastActionsProps {
+  /** From the Slice A catalog (`supports_auto_predict = not feature_aware`). */
+  supportsAutoPredict: boolean
+  /** True once a model bundle has been trained for the selection. */
+  trained: boolean
+  isPredicting: boolean
+  onForecast: () => void
+}
+
+/**
+ * Slice C — the Forecast action + the capability-limited blocked state.
+ *
+ * A feature-aware winner cannot auto-predict (LOCKED #5): instead of faking a
+ * forecast we surface the limitation and route the user to the What-If Planner.
+ */
+export function TrainForecastActions({
+  supportsAutoPredict,
+  trained,
+  isPredicting,
+  onForecast,
+}: TrainForecastActionsProps) {
+  if (!supportsAutoPredict) {
+    return (
+      <div
+        className="flex items-start gap-2 rounded-md border border-muted bg-muted/30 p-3 text-sm text-muted-foreground"
+        data-testid="forecast-blocked-state"
+      >
+        <Ban className="mt-0.5 h-4 w-4 shrink-0" />
+        <span>{FEATURE_AWARE_BLOCKED_COPY}</span>
+      </div>
+    )
+  }
+
+  return (
+    <Button
+      type="button"
+      variant="secondary"
+      onClick={onForecast}
+      disabled={!trained || isPredicting}
+      data-testid="forecast-button"
+    >
+      {isPredicting ? (
+        <Loader2 className="mr-2 h-4 w-4 animate-spin" />
+      ) : (
+        <LineChart className="mr-2 h-4 w-4" />
+      )}
+      {trained ? 'Generate forecast' : 'Train a model first'}
+    </Button>
+  )
+}
diff --git a/frontend/src/components/champion-selector/decision/winner-decision-panel.test.tsx b/frontend/src/components/champion-selector/decision/winner-decision-panel.test.tsx
new file mode 100644
index 00000000..5aca0b38
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/winner-decision-panel.test.tsx
@@ -0,0 +1,48 @@
+import { afterEach, describe, expect, it, vi } from 'vitest'
+import { cleanup, fireEvent, render, screen } from '@testing-library/react'
+import { WinnerDecisionPanel } from './winner-decision-panel'
+import type { TrainWinnerResponse } from '@/types/api'
+
+afterEach(cleanup)
+
+describe('WinnerDecisionPanel', () => {
+  it('trains the recommended winner without a confirm dialog', () => {
+    const onTrain = vi.fn()
+    render(
+      <WinnerDecisionPanel
+        winnerModelType="naive"
+        candidateModelTypes={['naive', 'seasonal_naive']}
+        isTraining={false}
+        trainResult={null}
+        onTrain={onTrain}
+      />,
+    )
+    expect(screen.getByTestId('decision-train-button').textContent).toContain(
+      'Train recommended',
+    )
+    fireEvent.click(screen.getByTestId('decision-train-button'))
+    expect(onTrain).toHaveBeenCalledWith('naive', null)
+  })
+
+  it('renders the override warning from a train result', () => {
+    const trainResult: TrainWinnerResponse = {
+      selection_id: 's',
+      model_type: 'seasonal_naive',
+      model_path: 'p',
+      is_override: true,
+      override_warning: 'You trained seasonal_naive instead of naive.',
+    }
+    render(
+      <WinnerDecisionPanel
+        winnerModelType="naive"
+        candidateModelTypes={['naive', 'seasonal_naive']}
+        isTraining={false}
+        trainResult={trainResult}
+        onTrain={() => {}}
+      />,
+    )
+    expect(screen.getByTestId('decision-override-warning').textContent).toContain(
+      'seasonal_naive',
+    )
+  })
+})
diff --git a/frontend/src/components/champion-selector/decision/winner-decision-panel.tsx b/frontend/src/components/champion-selector/decision/winner-decision-panel.tsx
new file mode 100644
index 00000000..5b0d58d5
--- /dev/null
+++ b/frontend/src/components/champion-selector/decision/winner-decision-panel.tsx
@@ -0,0 +1,158 @@
+import { useState } from 'react'
+import { Loader2, Trophy, TriangleAlert } from 'lucide-react'
+import {
+  AlertDialog,
+  AlertDialogAction,
+  AlertDialogCancel,
+  AlertDialogContent,
+  AlertDialogDescription,
+  AlertDialogFooter,
+  AlertDialogHeader,
+  AlertDialogTitle,
+} from '@/components/ui/alert-dialog'
+import { Button } from '@/components/ui/button'
+import { Card, CardContent, CardDescription, CardHeader, CardTitle } from '@/components/ui/card'
+import { Input } from '@/components/ui/input'
+import {
+  Select,
+  SelectContent,
+  SelectItem,
+  SelectTrigger,
+  SelectValue,
+} from '@/components/ui/select'
+import type { TrainWinnerResponse } from '@/types/api'
+
+interface WinnerDecisionPanelProps {
+  winnerModelType: string
+  /** Every candidate offered in the run (winner + runners-up + failed). */
+  candidateModelTypes: string[]
+  isTraining: boolean
+  trainResult: TrainWinnerResponse | null
+  /** Train the chosen model — the page routes winner vs. override. */
+  onTrain: (modelType: string, overrideReason: string | null) => void
+}
+
+/**
+ * Slice C — accept the recommended winner OR override to another candidate.
+ *
+ * Picking a non-winner opens a confirm dialog (explicit warning + an optional
+ * reason) before training. Presentational — the page owns the train mutations.
+ */
+export function WinnerDecisionPanel({
+  winnerModelType,
+  candidateModelTypes,
+  isTraining,
+  trainResult,
+  onTrain,
+}: WinnerDecisionPanelProps) {
+  const [selected, setSelected] = useState(winnerModelType)
+  const [overrideReason, setOverrideReason] = useState('')
+  const [confirmOpen, setConfirmOpen] = useState(false)
+
+  const isOverride = selected !== winnerModelType
+
+  function handleTrainClick() {
+    if (isOverride) {
+      setConfirmOpen(true)
+      return
+    }
+    onTrain(selected, null)
+  }
+
+  function handleConfirmOverride() {
+    onTrain(selected, overrideReason.trim() || null)
+    setConfirmOpen(false)
+  }
+
+  return (
+    <Card data-testid="winner-decision-panel">
+      <CardHeader>
+        <CardTitle>5 · Decide &amp; train</CardTitle>
+        <CardDescription>
+          Train the recommended champion, or override to another candidate. The
+          recommended model is <span className="font-medium">{winnerModelType}</span>.
+        </CardDescription>
+      </CardHeader>
+      <CardContent className="space-y-4">
+        <div className="flex flex-col gap-3 sm:flex-row sm:items-end">
+          <div className="space-y-1">
+            <span className="text-xs text-muted-foreground">Model to train</span>
+            <Select value={selected} onValueChange={setSelected}>
+              <SelectTrigger className="w-64" data-testid="decision-model-select">
+                <SelectValue />
+              </SelectTrigger>
+              <SelectContent>
+                {candidateModelTypes.map((mt) => (
+                  <SelectItem key={mt} value={mt}>
+                    {mt}
+                    {mt === winnerModelType ? ' (recommended)' : ''}
+                  </SelectItem>
+                ))}
+              </SelectContent>
+            </Select>
+          </div>
+          <Button
+            type="button"
+            onClick={handleTrainClick}
+            disabled={isTraining}
+            data-testid="decision-train-button"
+          >
+            {isTraining ? (
+              <Loader2 className="mr-2 h-4 w-4 animate-spin" />
+            ) : (
+              <Trophy className="mr-2 h-4 w-4" />
+            )}
+            {isOverride ? 'Train override' : 'Train recommended'}
+          </Button>
+        </div>
+
+        {trainResult?.override_warning && (
+          <div
+            className="flex items-start gap-2 rounded-md border border-warning/40 bg-warning/10 p-2 text-xs"
+            data-testid="decision-override-warning"
+          >
+            <TriangleAlert className="mt-0.5 h-3.5 w-3.5 shrink-0 text-warning" />
+            <span>{trainResult.override_warning}</span>
+          </div>
+        )}
+
+        {trainResult && !trainResult.override_warning && (
+          <p className="text-xs text-muted-foreground" data-testid="decision-trained-note">
+            Trained <span className="font-medium">{trainResult.model_type}</span>.
+          </p>
+        )}
+      </CardContent>
+
+      <AlertDialog open={confirmOpen} onOpenChange={setConfirmOpen}>
+        <AlertDialogContent data-testid="override-confirm-dialog">
+          <AlertDialogHeader>
+            <AlertDialogTitle>Train a non-recommended model?</AlertDialogTitle>
+            <AlertDialogDescription>
+              You picked <span className="font-medium">{selected}</span> instead of the
+              recommended <span className="font-medium">{winnerModelType}</span>. This is an
+              override and is recorded on the run.
+            </AlertDialogDescription>
+          </AlertDialogHeader>
+          <div className="space-y-1">
+            <span className="text-xs text-muted-foreground">Reason (optional)</span>
+            <Input
+              value={overrideReason}
+              onChange={(event) => setOverrideReason(event.target.value)}
+              placeholder="e.g. domain seasonality outweighs the WAPE lead"
+              data-testid="override-reason-input"
+            />
+          </div>
+          <AlertDialogFooter>
+            <AlertDialogCancel>Cancel</AlertDialogCancel>
+            <AlertDialogAction
+              onClick={handleConfirmOverride}
+              data-testid="override-confirm-action"
+            >
+              Train override
+            </AlertDialogAction>
+          </AlertDialogFooter>
+        </AlertDialogContent>
+      </AlertDialog>
+    </Card>
+  )
+}
diff --git a/frontend/src/components/champion-selector/results/cancel-run-dialog.test.tsx b/frontend/src/components/champion-selector/results/cancel-run-dialog.test.tsx
new file mode 100644
index 00000000..c5d53231
--- /dev/null
+++ b/frontend/src/components/champion-selector/results/cancel-run-dialog.test.tsx
@@ -0,0 +1,33 @@
+import { afterEach, beforeAll, describe, expect, it, vi } from 'vitest'
+import { cleanup, fireEvent, render, screen } from '@testing-library/react'
+import { CancelRunDialog } from './cancel-run-dialog'
+
+beforeAll(() => {
+  class ResizeObserverStub {
+    observe() {}
+    unobserve() {}
+    disconnect() {}
+  }
+  vi.stubGlobal('ResizeObserver', ResizeObserverStub)
+  if (!Element.prototype.hasPointerCapture) {
+    Element.prototype.hasPointerCapture = () => false
+  }
+})
+
+afterEach(cleanup)
+
+describe('CancelRunDialog', () => {
+  it('confirms cancellation via the AlertDialog', () => {
+    const onConfirm = vi.fn()
+    render(<CancelRunDialog onConfirm={onConfirm} />)
+    fireEvent.click(screen.getByTestId('cancel-run-trigger'))
+    fireEvent.click(screen.getByTestId('cancel-run-confirm'))
+    expect(onConfirm).toHaveBeenCalledTimes(1)
+  })
+
+  it('disables the trigger while cancelling', () => {
+    render(<CancelRunDialog onConfirm={() => {}} isCancelling />)
+    const trigger = screen.getByTestId('cancel-run-trigger') as HTMLButtonElement
+    expect(trigger.disabled).toBe(true)
+  })
+})
diff --git a/frontend/src/components/champion-selector/results/cancel-run-dialog.tsx b/frontend/src/components/champion-selector/results/cancel-run-dialog.tsx
new file mode 100644
index 00000000..d85c08ca
--- /dev/null
+++ b/frontend/src/components/champion-selector/results/cancel-run-dialog.tsx
@@ -0,0 +1,62 @@
+import { Loader2, X } from 'lucide-react'
+import {
+  AlertDialog,
+  AlertDialogAction,
+  AlertDialogCancel,
+  AlertDialogContent,
+  AlertDialogDescription,
+  AlertDialogFooter,
+  AlertDialogHeader,
+  AlertDialogTitle,
+  AlertDialogTrigger,
+} from '@/components/ui/alert-dialog'
+import { Button } from '@/components/ui/button'
+
+interface CancelRunDialogProps {
+  onConfirm: () => void
+  isCancelling?: boolean
+  disabled?: boolean
+}
+
+/**
+ * Cancel-run confirmation (Slice B). Mirrors the batch cancel dialog and reuses
+ * the honest pending-skip / running-yield copy.
+ */
+export function CancelRunDialog({ onConfirm, isCancelling, disabled }: CancelRunDialogProps) {
+  return (
+    <AlertDialog>
+      <AlertDialogTrigger asChild>
+        <Button
+          type="button"
+          variant="outline"
+          disabled={disabled || isCancelling}
+          data-testid="cancel-run-trigger"
+        >
+          {isCancelling ? (
+            <Loader2 className="mr-2 h-4 w-4 animate-spin" />
+          ) : (
+            <X className="mr-2 h-4 w-4" />
+          )}
+          Cancel run
+        </Button>
+      </AlertDialogTrigger>
+      <AlertDialogContent>
+        <AlertDialogHeader>
+          <AlertDialogTitle>Cancel this comparison?</AlertDialogTitle>
+          <AlertDialogDescription>
+            Candidates that haven&apos;t started will be skipped. A candidate
+            already mid-fit stops at the next safe point — sklearn / LightGBM
+            fits are uncancellable mid-call, so an in-flight fit may finish
+            first. Results from candidates that already completed are kept.
+          </AlertDialogDescription>
+        </AlertDialogHeader>
+        <AlertDialogFooter>
+          <AlertDialogCancel>Keep running</AlertDialogCancel>
+          <AlertDialogAction onClick={onConfirm} data-testid="cancel-run-confirm">
+            Cancel run
+          </AlertDialogAction>
+        </AlertDialogFooter>
+      </AlertDialogContent>
+    </AlertDialog>
+  )
+}
diff --git a/frontend/src/components/champion-selector/results/comparison-charts.test.tsx b/frontend/src/components/champion-selector/results/comparison-charts.test.tsx
new file mode 100644
index 00000000..d1ea60bf
--- /dev/null
+++ b/frontend/src/components/champion-selector/results/comparison-charts.test.tsx
@@ -0,0 +1,36 @@
+import { afterEach, beforeAll, describe, expect, it, vi } from 'vitest'
+import { cleanup, render, screen } from '@testing-library/react'
+import { ComparisonCharts } from './comparison-charts'
+import type { ModelSelectionChartData } from '@/types/api'
+
+// Recharts' ResponsiveContainer needs ResizeObserver in jsdom.
+beforeAll(() => {
+  class ResizeObserverStub {
+    observe() {}
+    unobserve() {}
+    disconnect() {}
+  }
+  vi.stubGlobal('ResizeObserver', ResizeObserverStub)
+})
+
+afterEach(cleanup)
+
+const chartData: ModelSelectionChartData = {
+  wape_by_model: { regression: 10, naive: 14 },
+  bias_by_model: { regression: -0.2, naive: 0.5 },
+  fold_stability: { regression: [10, 11] },
+  winner_actual_vs_predicted: [
+    { dates: ['2026-01-01', '2026-01-02'], actuals: [10, 12], predictions: [9.5, 12.5] },
+  ],
+}
+
+describe('ComparisonCharts', () => {
+  it('renders WAPE + bias bars from chart_data', () => {
+    render(<ComparisonCharts chartData={chartData} winnerModelType="regression" />)
+    expect(screen.getByTestId('comparison-charts')).toBeTruthy()
+    expect(screen.getByTestId('metric-bars-wape-by-model')).toBeTruthy()
+    expect(screen.getByTestId('metric-bars-bias-by-model')).toBeTruthy()
+    // Winner is starred in the bar list.
+    expect(screen.getAllByText('★ regression').length).toBeGreaterThan(0)
+  })
+})
diff --git a/frontend/src/components/champion-selector/results/comparison-charts.tsx b/frontend/src/components/champion-selector/results/comparison-charts.tsx
new file mode 100644
index 00000000..5e192a22
--- /dev/null
+++ b/frontend/src/components/champion-selector/results/comparison-charts.tsx
@@ -0,0 +1,105 @@
+import { Card, CardContent, CardDescription, CardHeader, CardTitle } from '@/components/ui/card'
+import { MultiSeriesChart } from '@/components/charts/multi-series-chart'
+import { BIAS_EXPLANATION } from '@/components/champion-selector/copy'
+import type { ModelSelectionChartData } from '@/types/api'
+
+interface ComparisonChartsProps {
+  chartData: ModelSelectionChartData
+  winnerModelType?: string
+}
+
+/** One labelled horizontal bar (CSS — deterministic, no chart lib needed). */
+function MetricBars({
+  title,
+  byModel,
+  winnerModelType,
+  signed = false,
+}: {
+  title: string
+  byModel: Record<string, number>
+  winnerModelType?: string
+  signed?: boolean
+}) {
+  const entries = Object.entries(byModel)
+  const max = Math.max(1, ...entries.map(([, v]) => Math.abs(v)))
+  return (
+    <div className="space-y-2" data-testid={`metric-bars-${title.toLowerCase().replace(/\s+/g, '-')}`}>
+      <p className="text-xs font-medium text-muted-foreground">{title}</p>
+      {entries.map(([model, value]) => (
+        <div key={model} className="flex items-center gap-2 text-xs">
+          <span className="w-28 shrink-0 truncate" title={model}>
+            {model === winnerModelType ? `★ ${model}` : model}
+          </span>
+          <div className="h-3 flex-1 rounded bg-muted">
+            <div
+              className={signed && value < 0 ? 'h-3 rounded bg-amber-500' : 'h-3 rounded bg-primary'}
+              style={{ width: `${(Math.abs(value) / max) * 100}%` }}
+            />
+          </div>
+          <span className="w-12 shrink-0 text-right tabular-nums">{value.toFixed(2)}</span>
+        </div>
+      ))}
+    </div>
+  )
+}
+
+/**
+ * Comparison charts (Slice B): WAPE-by-model + bias-by-model bars, and the
+ * winner's actual-vs-predicted overlay. Reads the backend `chart_data` payload.
+ */
+export function ComparisonCharts({ chartData, winnerModelType }: ComparisonChartsProps) {
+  // Build actual-vs-predicted rows for the winner from the fold chart points.
+  const avpRows: Record<string, number | string>[] = []
+  for (const fold of chartData.winner_actual_vs_predicted as Array<{
+    dates?: string[]
+    actuals?: number[]
+    predictions?: number[]
+  }>) {
+    const dates = fold.dates ?? []
+    const actuals = fold.actuals ?? []
+    const predictions = fold.predictions ?? []
+    for (let i = 0; i < dates.length; i++) {
+      avpRows.push({
+        date: dates[i] ?? String(i),
+        actual: actuals[i] ?? 0,
+        predicted: predictions[i] ?? 0,
+      })
+    }
+  }
+
+  return (
+    <Card data-testid="comparison-charts">
+      <CardHeader>
+        <CardTitle>Comparison</CardTitle>
+        <CardDescription>{BIAS_EXPLANATION}</CardDescription>
+      </CardHeader>
+      <CardContent className="space-y-6">
+        <div className="grid gap-6 md:grid-cols-2">
+          <MetricBars
+            title="WAPE by model"
+            byModel={chartData.wape_by_model}
+            winnerModelType={winnerModelType}
+          />
+          <MetricBars
+            title="Bias by model"
+            byModel={chartData.bias_by_model}
+            winnerModelType={winnerModelType}
+            signed
+          />
+        </div>
+        {avpRows.length > 0 && (
+          <MultiSeriesChart
+            title="Winner — actual vs predicted"
+            data={avpRows}
+            series={[
+              { key: 'actual', label: 'Actual' },
+              { key: 'predicted', label: 'Predicted' },
+            ]}
+            xAxisKey="date"
+            height={260}
+          />
+        )}
+      </CardContent>
+    </Card>
+  )
+}
diff --git a/frontend/src/components/champion-selector/results/constants.ts b/frontend/src/components/champion-selector/results/constants.ts
new file mode 100644
index 00000000..41aa3bb2
--- /dev/null
+++ b/frontend/src/components/champion-selector/results/constants.ts
@@ -0,0 +1,17 @@
+import type { ModelSelectionStatus } from '@/types/api'
+
+/**
+ * Terminal selection-run statuses (Slice B). Polling stops once a run reaches
+ * one of these. Kept in a `.ts` module so the
+ * `react-refresh/only-export-components` lint rule never trips.
+ */
+export const TERMINAL_SELECTION_STATES: ReadonlySet<ModelSelectionStatus> = new Set([
+  'completed',
+  'partial',
+  'failed',
+  'cancelled',
+])
+
+export function isTerminalSelectionStatus(status: ModelSelectionStatus): boolean {
+  return TERMINAL_SELECTION_STATES.has(status)
+}
diff --git a/frontend/src/components/champion-selector/results/model-detail-drawer.test.tsx b/frontend/src/components/champion-selector/results/model-detail-drawer.test.tsx
new file mode 100644
index 00000000..83d90d1b
--- /dev/null
+++ b/frontend/src/components/champion-selector/results/model-detail-drawer.test.tsx
@@ -0,0 +1,43 @@
+import { afterEach, beforeAll, describe, expect, it, vi } from 'vitest'
+import { cleanup, render, screen } from '@testing-library/react'
+import { ModelDetailDrawer } from './model-detail-drawer'
+import type { ModelRankEntry } from '@/types/api'
+
+// Radix Dialog (Sheet) needs these layout APIs in jsdom.
+beforeAll(() => {
+  class ResizeObserverStub {
+    observe() {}
+    unobserve() {}
+    disconnect() {}
+  }
+  vi.stubGlobal('ResizeObserver', ResizeObserverStub)
+  if (!Element.prototype.hasPointerCapture) {
+    Element.prototype.hasPointerCapture = () => false
+  }
+})
+
+afterEach(cleanup)
+
+const entry: ModelRankEntry = {
+  rank: 1,
+  model_type: 'regression',
+  params: { max_depth: 6 },
+  included: true,
+  exclusion_reason: null,
+  metrics: { wape: 10, smape: 8, mae: 4, rmse: 5, bias: 0.1 },
+}
+
+describe('ModelDetailDrawer', () => {
+  it('renders the candidate metrics + params when open', () => {
+    render(<ModelDetailDrawer entry={entry} open onOpenChange={() => {}} />)
+    const drawer = screen.getByTestId('model-detail-drawer')
+    expect(drawer.textContent).toContain('regression')
+    expect(drawer.textContent).toContain('WAPE')
+    expect(drawer.textContent).toContain('max_depth')
+  })
+
+  it('renders nothing meaningful when closed', () => {
+    render(<ModelDetailDrawer entry={entry} open={false} onOpenChange={() => {}} />)
+    expect(screen.queryByTestId('model-detail-drawer')).toBeNull()
+  })
+})
diff --git a/frontend/src/components/champion-selector/results/model-detail-drawer.tsx b/frontend/src/components/champion-selector/results/model-detail-drawer.tsx
new file mode 100644
index 00000000..f7ac0148
--- /dev/null
+++ b/frontend/src/components/champion-selector/results/model-detail-drawer.tsx
@@ -0,0 +1,79 @@
+import {
+  Sheet,
+  SheetContent,
+  SheetDescription,
+  SheetHeader,
+  SheetTitle,
+} from '@/components/ui/sheet'
+import { Badge } from '@/components/ui/badge'
+import type { ModelRankEntry } from '@/types/api'
+
+interface ModelDetailDrawerProps {
+  entry: ModelRankEntry | null
+  open: boolean
+  onOpenChange: (open: boolean) => void
+}
+
+function fmt(value: number | undefined): string {
+  if (typeof value !== 'number' || !Number.isFinite(value)) return '—'
+  return value.toFixed(3)
+}
+
+const METRIC_KEYS: { key: string; label: string }[] = [
+  { key: 'wape', label: 'WAPE' },
+  { key: 'smape', label: 'sMAPE' },
+  { key: 'mae', label: 'MAE' },
+  { key: 'rmse', label: 'RMSE' },
+  { key: 'bias', label: 'Bias' },
+]
+
+/**
+ * Per-model detail drawer (Slice B). Opens from a ranking-row click; shows one
+ * candidate's metrics, params, and exclusion reason (read-only).
+ */
+export function ModelDetailDrawer({ entry, open, onOpenChange }: ModelDetailDrawerProps) {
+  return (
+    <Sheet open={open} onOpenChange={onOpenChange}>
+      <SheetContent data-testid="model-detail-drawer">
+        {entry && (
+          <>
+            <SheetHeader>
+              <SheetTitle className="flex items-center gap-2">
+                {entry.model_type}
+                {!entry.included && (
+                  <Badge variant="outline">{entry.exclusion_reason ?? 'excluded'}</Badge>
+                )}
+              </SheetTitle>
+              <SheetDescription>
+                {entry.rank !== null ? `Ranked #${entry.rank}` : 'Not ranked'}
+              </SheetDescription>
+            </SheetHeader>
+            <div className="space-y-4 px-4 pb-4">
+              <div>
+                <p className="mb-1 text-xs font-medium text-muted-foreground">Metrics</p>
+                <table className="w-full text-sm">
+                  <tbody>
+                    {METRIC_KEYS.map((m) => (
+                      <tr key={m.key} className="border-t">
+                        <td className="py-1 text-muted-foreground">{m.label}</td>
+                        <td className="py-1 text-right tabular-nums">
+                          {fmt(entry.metrics?.[m.key])}
+                        </td>
+                      </tr>
+                    ))}
+                  </tbody>
+                </table>
+              </div>
+              <div>
+                <p className="mb-1 text-xs font-medium text-muted-foreground">Parameters</p>
+                <pre className="overflow-x-auto rounded-md bg-muted p-2 text-xs">
+                  {JSON.stringify(entry.params, null, 2)}
+                </pre>
+              </div>
+            </div>
+          </>
+        )}
+      </SheetContent>
+    </Sheet>
+  )
+}
diff --git a/frontend/src/components/champion-selector/results/ranking-table.test.tsx b/frontend/src/components/champion-selector/results/ranking-table.test.tsx
new file mode 100644
index 00000000..9943ff6b
--- /dev/null
+++ b/frontend/src/components/champion-selector/results/ranking-table.test.tsx
@@ -0,0 +1,50 @@
+import { afterEach, describe, expect, it, vi } from 'vitest'
+import { cleanup, fireEvent, render, screen } from '@testing-library/react'
+import { RankingTable } from './ranking-table'
+import type { ModelRankEntry } from '@/types/api'
+
+afterEach(cleanup)
+
+const ranking: ModelRankEntry[] = [
+  {
+    rank: 1,
+    model_type: 'regression',
+    params: {},
+    included: true,
+    exclusion_reason: null,
+    metrics: { wape: 10, smape: 8, mae: 4, bias: 0.1 },
+  },
+  {
+    rank: 2,
+    model_type: 'naive',
+    params: {},
+    included: true,
+    exclusion_reason: null,
+    metrics: { wape: 14, smape: 12, mae: 6, bias: 0.5 },
+  },
+  {
+    rank: null,
+    model_type: 'moving_average',
+    params: { window_size: 0 },
+    included: false,
+    exclusion_reason: 'failed',
+    metrics: null,
+  },
+]
+
+describe('RankingTable', () => {
+  it('renders a row per entry; excluded rows show their reason', () => {
+    render(<RankingTable ranking={ranking} onSelectModel={() => {}} />)
+    expect(screen.getByTestId('ranking-row-regression')).toBeTruthy()
+    expect(screen.getByTestId('ranking-row-naive')).toBeTruthy()
+    const excluded = screen.getByTestId('ranking-row-moving_average')
+    expect(excluded.textContent).toContain('failed')
+  })
+
+  it('calls onSelectModel with the clicked entry', () => {
+    const onSelect = vi.fn()
+    render(<RankingTable ranking={ranking} onSelectModel={onSelect} />)
+    fireEvent.click(screen.getByTestId('ranking-row-naive'))
+    expect(onSelect).toHaveBeenCalledWith(ranking[1])
+  })
+})
diff --git a/frontend/src/components/champion-selector/results/ranking-table.tsx b/frontend/src/components/champion-selector/results/ranking-table.tsx
new file mode 100644
index 00000000..a8c0515a
--- /dev/null
+++ b/frontend/src/components/champion-selector/results/ranking-table.tsx
@@ -0,0 +1,90 @@
+import { Trophy } from 'lucide-react'
+import { Card, CardContent, CardDescription, CardHeader, CardTitle } from '@/components/ui/card'
+import { Badge } from '@/components/ui/badge'
+import { cn } from '@/lib/utils'
+import { RANKING_TIE_BREAK } from '@/components/champion-selector/copy'
+import type { ModelRankEntry } from '@/types/api'
+
+interface RankingTableProps {
+  ranking: ModelRankEntry[]
+  onSelectModel: (entry: ModelRankEntry) => void
+}
+
+function fmt(value: number | undefined): string {
+  if (typeof value !== 'number' || !Number.isFinite(value)) return '—'
+  return value.toFixed(2)
+}
+
+/**
+ * Candidate ranking table (Slice B). Winner row highlighted; excluded
+ * (failed/cancelled/filtered) rows show their reason and stay visible. Clicking
+ * a row opens the model-detail drawer.
+ */
+export function RankingTable({ ranking, onSelectModel }: RankingTableProps) {
+  return (
+    <Card data-testid="ranking-table">
+      <CardHeader>
+        <CardTitle>Ranking</CardTitle>
+        <CardDescription>{RANKING_TIE_BREAK}</CardDescription>
+      </CardHeader>
+      <CardContent>
+        <table className="w-full text-sm">
+          <thead>
+            <tr className="text-left text-muted-foreground">
+              <th className="py-1.5">Rank</th>
+              <th className="py-1.5">Model</th>
+              <th className="py-1.5 text-right">WAPE</th>
+              <th className="py-1.5 text-right">sMAPE</th>
+              <th className="py-1.5 text-right">MAE</th>
+              <th className="py-1.5 text-right">Bias</th>
+            </tr>
+          </thead>
+          <tbody>
+            {ranking.map((entry) => (
+              <tr
+                key={`${entry.model_type}-${entry.rank ?? 'x'}`}
+                data-testid={`ranking-row-${entry.model_type}`}
+                onClick={() => onSelectModel(entry)}
+                className={cn(
+                  'cursor-pointer border-t hover:bg-accent/50',
+                  entry.rank === 1 && 'bg-primary/5 font-medium',
+                  !entry.included && 'text-muted-foreground',
+                )}
+              >
+                <td className="py-1.5">
+                  {entry.rank === 1 ? (
+                    <span className="inline-flex items-center gap-1">
+                      <Trophy className="h-3.5 w-3.5" />1
+                    </span>
+                  ) : (
+                    (entry.rank ?? '—')
+                  )}
+                </td>
+                <td className="py-1.5">
+                  {entry.model_type}
+                  {!entry.included && (
+                    <Badge variant="outline" className="ml-2">
+                      {entry.exclusion_reason ?? 'excluded'}
+                    </Badge>
+                  )}
+                </td>
+                <td className="py-1.5 text-right tabular-nums">
+                  {fmt(entry.metrics?.['wape'])}
+                </td>
+                <td className="py-1.5 text-right tabular-nums">
+                  {fmt(entry.metrics?.['smape'])}
+                </td>
+                <td className="py-1.5 text-right tabular-nums">
+                  {fmt(entry.metrics?.['mae'])}
+                </td>
+                <td className="py-1.5 text-right tabular-nums">
+                  {fmt(entry.metrics?.['bias'])}
+                </td>
+              </tr>
+            ))}
+          </tbody>
+        </table>
+      </CardContent>
+    </Card>
+  )
+}
diff --git a/frontend/src/components/champion-selector/results/run-progress-panel.test.tsx b/frontend/src/components/champion-selector/results/run-progress-panel.test.tsx
new file mode 100644
index 00000000..13c4ef54
--- /dev/null
+++ b/frontend/src/components/champion-selector/results/run-progress-panel.test.tsx
@@ -0,0 +1,57 @@
+import { afterEach, describe, expect, it } from 'vitest'
+import { cleanup, render, screen } from '@testing-library/react'
+import { RunProgressPanel } from './run-progress-panel'
+import type { CandidateProgress, SelectionProgress } from '@/types/api'
+
+afterEach(cleanup)
+
+const progress: SelectionProgress = {
+  total: 3,
+  pending: 1,
+  running: 1,
+  completed: 1,
+  failed: 0,
+  cancelled: 0,
+}
+
+function cand(model_type: string, status: CandidateProgress['status']): CandidateProgress {
+  return {
+    candidate_id: `id-${model_type}`,
+    ordinal: 0,
+    model_type,
+    status,
+    error: status === 'failed' ? 'boom' : null,
+    started_at: null,
+    completed_at: null,
+    duration_ms: status === 'completed' ? 1500 : null,
+  }
+}
+
+describe('RunProgressPanel', () => {
+  it('renders status badge, counts, and a per-candidate row', () => {
+    render(
+      <RunProgressPanel
+        status="running"
+        progress={progress}
+        candidates={[cand('naive', 'completed'), cand('regression', 'running')]}
+      />,
+    )
+    expect(screen.getByTestId('run-status-badge').textContent).toContain('running')
+    expect(screen.getByText('Total')).toBeTruthy()
+    expect(screen.getByTestId('candidate-row-naive')).toBeTruthy()
+    expect(screen.getByTestId('candidate-row-regression')).toBeTruthy()
+  })
+
+  it('keeps a failed candidate visible with its error', () => {
+    render(
+      <RunProgressPanel
+        status="partial"
+        progress={progress}
+        candidates={[cand('xgboost', 'failed')]}
+      />,
+    )
+    const row = screen.getByTestId('candidate-row-xgboost')
+    expect(row.textContent).toContain('failed')
+    expect(row.textContent).toContain('boom')
+  })
+})
diff --git a/frontend/src/components/champion-selector/results/run-progress-panel.tsx b/frontend/src/components/champion-selector/results/run-progress-panel.tsx
new file mode 100644
index 00000000..4c5699a3
--- /dev/null
+++ b/frontend/src/components/champion-selector/results/run-progress-panel.tsx
@@ -0,0 +1,87 @@
+import { Card, CardContent, CardHeader, CardTitle } from '@/components/ui/card'
+import { StatusBadge } from '@/components/common/status-badge'
+import { getStatusVariant } from '@/lib/status-utils'
+import type {
+  CandidateProgress,
+  ModelSelectionStatus,
+  SelectionProgress,
+} from '@/types/api'
+
+interface RunProgressPanelProps {
+  status: ModelSelectionStatus
+  progress: SelectionProgress | null
+  candidates: CandidateProgress[]
+}
+
+function Count({ label, value }: { label: string; value: number }) {
+  return (
+    <div className="rounded-md border bg-muted/30 px-3 py-2 text-center">
+      <p className="text-xs text-muted-foreground">{label}</p>
+      <p className="text-lg font-semibold tabular-nums">{value}</p>
+    </div>
+  )
+}
+
+/**
+ * Live async-run progress (Slice B): the run status, per-status counts, and a
+ * per-candidate table. Failed/cancelled candidates stay visible.
+ */
+export function RunProgressPanel({ status, progress, candidates }: RunProgressPanelProps) {
+  return (
+    <Card data-testid="run-progress-panel">
+      <CardHeader>
+        <div className="flex items-center justify-between gap-2">
+          <CardTitle className="text-lg">Comparison progress</CardTitle>
+          <StatusBadge variant={getStatusVariant(status)} data-testid="run-status-badge">
+            {status}
+          </StatusBadge>
+        </div>
+      </CardHeader>
+      <CardContent className="space-y-4">
+        {progress && (
+          <div className="grid grid-cols-3 gap-2 sm:grid-cols-6">
+            <Count label="Total" value={progress.total} />
+            <Count label="Pending" value={progress.pending} />
+            <Count label="Running" value={progress.running} />
+            <Count label="Completed" value={progress.completed} />
+            <Count label="Failed" value={progress.failed} />
+            <Count label="Cancelled" value={progress.cancelled} />
+          </div>
+        )}
+        {candidates.length > 0 && (
+          <table className="w-full text-sm">
+            <thead>
+              <tr className="text-left text-muted-foreground">
+                <th className="py-1.5">Model</th>
+                <th className="py-1.5">Status</th>
+                <th className="py-1.5 text-right">Duration</th>
+              </tr>
+            </thead>
+            <tbody>
+              {candidates.map((c) => (
+                <tr
+                  key={c.candidate_id}
+                  data-testid={`candidate-row-${c.model_type}`}
+                  className="border-t"
+                >
+                  <td className="py-1.5 font-medium">{c.model_type}</td>
+                  <td className="py-1.5">
+                    <StatusBadge variant={getStatusVariant(c.status)}>
+                      {c.status}
+                    </StatusBadge>
+                    {c.error && (
+                      <span className="ml-2 text-xs text-destructive">{c.error}</span>
+                    )}
+                  </td>
+                  <td className="py-1.5 text-right tabular-nums text-muted-foreground">
+                    {c.duration_ms === null ? '—' : `${(c.duration_ms / 1000).toFixed(1)}s`}
+                  </td>
+                </tr>
+              ))}
+            </tbody>
+          </table>
+        )}
+      </CardContent>
+    </Card>
+  )
+}
diff --git a/frontend/src/components/champion-selector/results/winner-card.test.tsx b/frontend/src/components/champion-selector/results/winner-card.test.tsx
new file mode 100644
index 00000000..54054253
--- /dev/null
+++ b/frontend/src/components/champion-selector/results/winner-card.test.tsx
@@ -0,0 +1,40 @@
+import { afterEach, describe, expect, it } from 'vitest'
+import { cleanup, render, screen } from '@testing-library/react'
+import { WinnerCard } from './winner-card'
+import type { WinnerSummary } from '@/types/api'
+
+afterEach(cleanup)
+
+const winner: WinnerSummary = {
+  model_type: 'regression',
+  params: {},
+  metrics: { wape: 10, smape: 8, mae: 4, bias: 0.1 },
+  rank: 1,
+}
+
+describe('WinnerCard', () => {
+  it('renders the winner, confidence, metrics, and bias copy', () => {
+    render(<WinnerCard winner={winner} confidence="high" reasons={['clear lead']} />)
+    expect(screen.getByTestId('winner-card').textContent).toContain('regression')
+    expect(screen.getByTestId('winner-confidence-badge').textContent).toContain('high')
+    expect(screen.getByText('clear lead')).toBeTruthy()
+    expect(screen.getByText(/Positive bias means the model under-forecasts/)).toBeTruthy()
+  })
+
+  it('renders a no-winner state when winner is null', () => {
+    render(<WinnerCard winner={null} confidence={null} reasons={[]} />)
+    expect(screen.getByText('No champion selected')).toBeTruthy()
+  })
+
+  it('surfaces the deterministic business_summary headline read-only', () => {
+    render(
+      <WinnerCard
+        winner={winner}
+        confidence="medium"
+        reasons={[]}
+        businessSummary={{ headline: 'regression wins by 28% WAPE' }}
+      />,
+    )
+    expect(screen.getByText('regression wins by 28% WAPE')).toBeTruthy()
+  })
+})
diff --git a/frontend/src/components/champion-selector/results/winner-card.tsx b/frontend/src/components/champion-selector/results/winner-card.tsx
new file mode 100644
index 00000000..c5fa0b8a
--- /dev/null
+++ b/frontend/src/components/champion-selector/results/winner-card.tsx
@@ -0,0 +1,100 @@
+import { Trophy } from 'lucide-react'
+import { Card, CardContent, CardDescription, CardHeader, CardTitle } from '@/components/ui/card'
+import { Badge } from '@/components/ui/badge'
+import { StatusBadge } from '@/components/common/status-badge'
+import { BIAS_EXPLANATION } from '@/components/champion-selector/copy'
+import type { ConfidenceLevel, WinnerSummary } from '@/types/api'
+
+interface WinnerCardProps {
+  winner: WinnerSummary | null
+  confidence: ConfidenceLevel | null
+  reasons: string[]
+  /** The deterministic backend `business_summary` (read-only; Slice C extends). */
+  businessSummary?: Record<string, unknown> | null
+}
+
+const CONFIDENCE_VARIANT: Record<ConfidenceLevel, 'success' | 'info' | 'warning'> = {
+  high: 'success',
+  medium: 'info',
+  low: 'warning',
+}
+
+function Metric({ label, value }: { label: string; value: number | undefined }) {
+  return (
+    <div className="rounded-md border bg-muted/30 p-3">
+      <p className="text-xs text-muted-foreground">{label}</p>
+      <p className="text-lg font-semibold tabular-nums">
+        {typeof value === 'number' && Number.isFinite(value) ? value.toFixed(2) : '—'}
+      </p>
+    </div>
+  )
+}
+
+/**
+ * Winner summary card (Slice B). Null-safe — renders a "no winner" state for a
+ * failed/cancelled run. Renders the deterministic `business_summary` headline
+ * READ-ONLY (Slice C adds the decision-layer interpretation on top).
+ */
+export function WinnerCard({ winner, confidence, reasons, businessSummary }: WinnerCardProps) {
+  if (winner === null) {
+    return (
+      <Card data-testid="winner-card">
+        <CardHeader>
+          <CardTitle>No champion selected</CardTitle>
+          <CardDescription>
+            No candidate produced a valid backtest. Review the failed candidates
+            below or adjust the selection.
+          </CardDescription>
+        </CardHeader>
+      </Card>
+    )
+  }
+
+  const headline =
+    typeof businessSummary?.['headline'] === 'string'
+      ? (businessSummary['headline'] as string)
+      : null
+
+  return (
+    <Card data-testid="winner-card">
+      <CardHeader>
+        <div className="flex flex-wrap items-center justify-between gap-2">
+          <CardTitle className="flex items-center gap-2">
+            <Trophy className="h-5 w-5" />
+            {winner.model_type}
+          </CardTitle>
+          {confidence && (
+            <StatusBadge
+              variant={CONFIDENCE_VARIANT[confidence]}
+              data-testid="winner-confidence-badge"
+            >
+              {confidence} confidence
+            </StatusBadge>
+          )}
+        </div>
+        {headline && <CardDescription>{headline}</CardDescription>}
+      </CardHeader>
+      <CardContent className="space-y-4">
+        <div className="grid grid-cols-2 gap-3 sm:grid-cols-4">
+          <Metric label="WAPE" value={winner.metrics['wape']} />
+          <Metric label="sMAPE" value={winner.metrics['smape']} />
+          <Metric label="MAE" value={winner.metrics['mae']} />
+          <Metric label="Bias" value={winner.metrics['bias']} />
+        </div>
+        {reasons.length > 0 && (
+          <div className="space-y-1">
+            {reasons.map((reason, i) => (
+              <div key={i} className="flex items-start gap-2">
+                <Badge variant="secondary" className="mt-0.5 shrink-0">
+                  why
+                </Badge>
+                <span className="text-sm text-muted-foreground">{reason}</span>
+              </div>
+            ))}
+          </div>
+        )}
+        <p className="text-xs text-muted-foreground">{BIAS_EXPLANATION}</p>
+      </CardContent>
+    </Card>
+  )
+}
diff --git a/frontend/src/components/champion-selector/run-request.test.ts b/frontend/src/components/champion-selector/run-request.test.ts
new file mode 100644
index 00000000..59f4ad0e
--- /dev/null
+++ b/frontend/src/components/champion-selector/run-request.test.ts
@@ -0,0 +1,63 @@
+import { describe, expect, it } from 'vitest'
+import { assembleRunRequest } from './run-request'
+import type { SplitConfig } from '@/types/api'
+
+const SPLIT: SplitConfig = {
+  strategy: 'expanding',
+  n_splits: 5,
+  min_train_size: 30,
+  gap: 0,
+  horizon: 7, // intentionally stale — must be overridden to forecastHorizon
+}
+
+describe('assembleRunRequest', () => {
+  it('pins auto_train_winner and auto_predict to false (Slice A invariant)', () => {
+    const req = assembleRunRequest({
+      storeId: 7,
+      productId: 12,
+      startDate: '2026-01-01',
+      endDate: '2026-05-31',
+      forecastHorizon: 14,
+      rankingMetric: 'wape',
+      splitConfig: SPLIT,
+      selectedModels: ['naive', 'regression'],
+    })
+    expect(req.auto_train_winner).toBe(false)
+    expect(req.auto_predict).toBe(false)
+  })
+
+  it('forces split_config.horizon === forecast_horizon', () => {
+    const req = assembleRunRequest({
+      storeId: 1,
+      productId: 2,
+      startDate: '2026-01-01',
+      endDate: '2026-03-31',
+      forecastHorizon: 21,
+      rankingMetric: 'wape',
+      splitConfig: SPLIT,
+      selectedModels: ['naive'],
+    })
+    expect(req.forecast_horizon).toBe(21)
+    expect(req.split_config.horizon).toBe(21)
+  })
+
+  it('maps selected model types into flat candidate configs and stays V1', () => {
+    const req = assembleRunRequest({
+      storeId: 1,
+      productId: 2,
+      startDate: '2026-01-01',
+      endDate: '2026-03-31',
+      forecastHorizon: 14,
+      rankingMetric: 'smape',
+      splitConfig: SPLIT,
+      selectedModels: ['naive', 'seasonal_naive'],
+    })
+    expect(req.candidate_models).toEqual([
+      { model_type: 'naive', params: {} },
+      { model_type: 'seasonal_naive', params: {} },
+    ])
+    expect(req.feature_frame_version).toBe(1)
+    expect(req.feature_groups).toBeNull()
+    expect(req.ranking_metric).toBe('smape')
+  })
+})
diff --git a/frontend/src/components/champion-selector/run-request.ts b/frontend/src/components/champion-selector/run-request.ts
new file mode 100644
index 00000000..253da365
--- /dev/null
+++ b/frontend/src/components/champion-selector/run-request.ts
@@ -0,0 +1,50 @@
+import type {
+  ModelSelectionRunRequest,
+  RankingMetric,
+  SplitConfig,
+} from '@/types/api'
+
+export interface AssembleRunRequestInput {
+  storeId: number
+  productId: number
+  startDate: string // YYYY-MM-DD
+  endDate: string // YYYY-MM-DD
+  forecastHorizon: number
+  rankingMetric: RankingMetric
+  splitConfig: SplitConfig
+  selectedModels: string[]
+}
+
+/**
+ * Assemble the typed `ModelSelectionRunRequest` from the Champion Selector
+ * form state. Pure + side-effect-free so it can be unit-tested.
+ *
+ * Slice A pins `auto_train_winner` and `auto_predict` to `false`: the async run
+ * path (Slice B) treats both as NO-OPS, and Slice C owns explicit
+ * train/predict. `split_config.horizon` is forced equal to `forecast_horizon`
+ * (the backend `ModelSelectionRunRequest` validator requires it). The request
+ * is assembled but NOT sent in Slice A — the "Run comparison" CTA is disabled.
+ */
+export function assembleRunRequest(
+  input: AssembleRunRequestInput,
+): ModelSelectionRunRequest {
+  return {
+    store_id: input.storeId,
+    product_id: input.productId,
+    selection_window: {
+      start_date: input.startDate,
+      end_date: input.endDate,
+    },
+    forecast_horizon: input.forecastHorizon,
+    ranking_metric: input.rankingMetric,
+    split_config: { ...input.splitConfig, horizon: input.forecastHorizon },
+    candidate_models: input.selectedModels.map((model_type) => ({
+      model_type,
+      params: {},
+    })),
+    feature_frame_version: 1,
+    feature_groups: null,
+    auto_train_winner: false,
+    auto_predict: false,
+  }
+}
diff --git a/frontend/src/components/champion-selector/searchable-entity-select.test.tsx b/frontend/src/components/champion-selector/searchable-entity-select.test.tsx
new file mode 100644
index 00000000..99b476a7
--- /dev/null
+++ b/frontend/src/components/champion-selector/searchable-entity-select.test.tsx
@@ -0,0 +1,78 @@
+import { afterEach, beforeAll, describe, expect, it, vi } from 'vitest'
+import { cleanup, fireEvent, render, screen } from '@testing-library/react'
+import { SearchableEntitySelect, type SearchableEntityItem } from './searchable-entity-select'
+
+// Radix Popover positions its content with Popper, which needs ResizeObserver
+// + a couple of layout APIs jsdom lacks. Polyfill them locally (the repo has no
+// vitest setup file) so the popover can open in the test environment.
+beforeAll(() => {
+  class ResizeObserverStub {
+    observe() {}
+    unobserve() {}
+    disconnect() {}
+  }
+  vi.stubGlobal('ResizeObserver', ResizeObserverStub)
+  if (!Element.prototype.hasPointerCapture) {
+    Element.prototype.hasPointerCapture = () => false
+  }
+  if (!Element.prototype.scrollIntoView) {
+    Element.prototype.scrollIntoView = () => {}
+  }
+})
+
+afterEach(cleanup)
+
+const ITEMS: SearchableEntityItem[] = [
+  { id: 7, primary: 'S001 · Downtown', secondary: 'North' },
+  { id: 12, primary: 'S002 · Airport', secondary: 'West' },
+  { id: 99, primary: 'S003 · Suburb', secondary: 'East' },
+]
+
+describe('SearchableEntitySelect', () => {
+  it('shows the placeholder when nothing is selected', () => {
+    render(
+      <SearchableEntitySelect
+        items={ITEMS}
+        value={null}
+        onChange={() => {}}
+        placeholder="Pick a store…"
+      />,
+    )
+    expect(screen.getByText('Pick a store…')).toBeTruthy()
+  })
+
+  it('filters the list client-side and selects an option on click', () => {
+    const onChange = vi.fn()
+    render(
+      <SearchableEntitySelect items={ITEMS} value={null} onChange={onChange} />,
+    )
+    fireEvent.click(screen.getByTestId('searchable-entity-select'))
+
+    // All three options visible before filtering.
+    expect(screen.getByTestId('searchable-entity-select-option-7')).toBeTruthy()
+    expect(screen.getByTestId('searchable-entity-select-option-12')).toBeTruthy()
+    expect(screen.getByTestId('searchable-entity-select-option-99')).toBeTruthy()
+
+    // Filter narrows to the Airport row (matches the primary text).
+    fireEvent.change(screen.getByTestId('searchable-entity-select-filter'), {
+      target: { value: 'airport' },
+    })
+    expect(screen.queryByTestId('searchable-entity-select-option-7')).toBeNull()
+    expect(screen.getByTestId('searchable-entity-select-option-12')).toBeTruthy()
+
+    fireEvent.click(screen.getByTestId('searchable-entity-select-option-12'))
+    expect(onChange).toHaveBeenCalledWith(12)
+  })
+
+  it('filters on the secondary descriptor too', () => {
+    render(
+      <SearchableEntitySelect items={ITEMS} value={null} onChange={() => {}} />,
+    )
+    fireEvent.click(screen.getByTestId('searchable-entity-select'))
+    fireEvent.change(screen.getByTestId('searchable-entity-select-filter'), {
+      target: { value: 'east' },
+    })
+    expect(screen.getByTestId('searchable-entity-select-option-99')).toBeTruthy()
+    expect(screen.queryByTestId('searchable-entity-select-option-7')).toBeNull()
+  })
+})
diff --git a/frontend/src/components/champion-selector/searchable-entity-select.tsx b/frontend/src/components/champion-selector/searchable-entity-select.tsx
new file mode 100644
index 00000000..f4dcf51b
--- /dev/null
+++ b/frontend/src/components/champion-selector/searchable-entity-select.tsx
@@ -0,0 +1,144 @@
+import { useState } from 'react'
+import { Check, ChevronsUpDown, Search } from 'lucide-react'
+import { cn } from '@/lib/utils'
+import { Button } from '@/components/ui/button'
+import { Input } from '@/components/ui/input'
+import {
+  Popover,
+  PopoverContent,
+  PopoverTrigger,
+} from '@/components/ui/popover'
+
+export interface SearchableEntityItem {
+  id: number
+  primary: string
+  secondary?: string
+}
+
+interface SearchableEntitySelectProps {
+  items: SearchableEntityItem[]
+  value: number | null
+  onChange: (id: number) => void
+  placeholder?: string
+  loading?: boolean
+  emptyLabel?: string
+  /** Forwarded to the trigger button + filter input for scoped test queries. */
+  testId?: string
+}
+
+/**
+ * A combobox built from existing primitives (Popover + Input + a filtered
+ * `<button>` list) — the repo ships no `cmdk`/`command` primitive, and Slice A
+ * adds no new dependency (LOCKED #6). The list is filtered CLIENT-SIDE over the
+ * already-fetched (<= 100) rows, matching both the primary and secondary text.
+ */
+export function SearchableEntitySelect({
+  items,
+  value,
+  onChange,
+  placeholder = 'Select…',
+  loading = false,
+  emptyLabel = 'No matches',
+  testId = 'searchable-entity-select',
+}: SearchableEntitySelectProps) {
+  const [open, setOpen] = useState(false)
+  const [filter, setFilter] = useState('')
+
+  const selected = items.find((item) => item.id === value) ?? null
+  const needle = filter.trim().toLowerCase()
+  const filtered = needle
+    ? items.filter(
+        (item) =>
+          item.primary.toLowerCase().includes(needle) ||
+          (item.secondary?.toLowerCase().includes(needle) ?? false),
+      )
+    : items
+
+  return (
+    <Popover open={open} onOpenChange={setOpen}>
+      <PopoverTrigger asChild>
+        <Button
+          type="button"
+          variant="outline"
+          role="combobox"
+          aria-expanded={open}
+          disabled={loading}
+          data-testid={testId}
+          className="w-full justify-between font-normal"
+        >
+          <span className="flex min-w-0 flex-col items-start text-left">
+            {selected ? (
+              <>
+                <span className="truncate">{selected.primary}</span>
+                {selected.secondary && (
+                  <span className="truncate text-xs text-muted-foreground">
+                    {selected.secondary}
+                  </span>
+                )}
+              </>
+            ) : (
+              <span className="text-muted-foreground">
+                {loading ? 'Loading…' : placeholder}
+              </span>
+            )}
+          </span>
+          <ChevronsUpDown className="ml-2 h-4 w-4 shrink-0 opacity-50" />
+        </Button>
+      </PopoverTrigger>
+      <PopoverContent className="w-[var(--radix-popover-trigger-width)] p-0" align="start">
+        <div className="flex items-center gap-2 border-b px-3 py-2">
+          <Search className="h-4 w-4 shrink-0 text-muted-foreground" />
+          <Input
+            autoFocus
+            value={filter}
+            onChange={(event) => setFilter(event.target.value)}
+            placeholder="Filter…"
+            data-testid={`${testId}-filter`}
+            className="h-8 border-0 px-0 shadow-none focus-visible:ring-0"
+          />
+        </div>
+        <div className="max-h-64 overflow-y-auto p-1" role="listbox">
+          {filtered.length === 0 ? (
+            <p className="px-3 py-6 text-center text-sm text-muted-foreground">
+              {emptyLabel}
+            </p>
+          ) : (
+            filtered.map((item) => (
+              <button
+                key={item.id}
+                type="button"
+                role="option"
+                aria-selected={item.id === value}
+                data-testid={`${testId}-option-${item.id}`}
+                onClick={() => {
+                  onChange(item.id)
+                  setFilter('')
+                  setOpen(false)
+                }}
+                className={cn(
+                  'flex w-full items-center gap-2 rounded-sm px-2 py-1.5 text-left text-sm hover:bg-accent hover:text-accent-foreground',
+                  item.id === value && 'bg-accent/50',
+                )}
+              >
+                <Check
+                  className={cn(
+                    'h-4 w-4 shrink-0',
+                    item.id === value ? 'opacity-100' : 'opacity-0',
+                  )}
+                />
+                <span className="flex min-w-0 flex-col">
+                  <span className="truncate">{item.primary}</span>
+                  {item.secondary && (
+                    <span className="truncate text-xs text-muted-foreground">
+                      {item.secondary}
+                    </span>
+                  )}
+                </span>
+              </button>
+            ))
+          )}
+        </div>
+      </PopoverContent>
+    </Popover>
+  )
+}
diff --git a/frontend/src/components/champion-selector/split-config.ts b/frontend/src/components/champion-selector/split-config.ts
new file mode 100644
index 00000000..ecc98f35
--- /dev/null
+++ b/frontend/src/components/champion-selector/split-config.ts
@@ -0,0 +1,24 @@
+import type { SplitConfig } from '@/types/api'
+
+/**
+ * Inline-validate a `SplitConfig` against the backend SplitConfig bounds
+ * (`app/features/backtesting/schemas.py`). Kept in a `.ts` module (not the
+ * form `.tsx`) so the `react-refresh/only-export-components` lint rule stays
+ * happy. Returns a list of human-facing error strings (empty = valid).
+ */
+export function splitConfigErrors(config: SplitConfig): string[] {
+  const errors: string[] = []
+  if (config.n_splits < 2 || config.n_splits > 20) {
+    errors.push('Splits must be between 2 and 20.')
+  }
+  if (config.min_train_size < 7) {
+    errors.push('Minimum train size must be at least 7 days.')
+  }
+  if (config.gap < 0 || config.gap > 30) {
+    errors.push('Gap must be between 0 and 30 days.')
+  }
+  if (config.gap >= config.horizon) {
+    errors.push('Gap must be smaller than the horizon.')
+  }
+  return errors
+}
diff --git a/frontend/src/components/demo/RunHistoryStrip.tsx b/frontend/src/components/demo/RunHistoryStrip.tsx
index 5605879c..fce287ba 100644
--- a/frontend/src/components/demo/RunHistoryStrip.tsx
+++ b/frontend/src/components/demo/RunHistoryStrip.tsx
@@ -63,26 +63,35 @@ export function RunHistoryStrip({ onReplay, summary, scenario }: RunHistoryStrip
   const [items, setItems] = useState<RunHistoryItem[]>(() => loadHistory())
   const [lastSummary, setLastSummary] = useState<DemoSummary | null>(null)
 
-  useEffect(() => {
-    if (!summary || summary === lastSummary) return
-    // Persist exactly once per pipeline_complete summary (R18).
-    const entry: RunHistoryItem = {
-      id: crypto.randomUUID(),
-      runId: summary.winningRunId,
-      timestamp: new Date().toISOString(),
-      scenario,
-      status: summary.overallStatus,
-      wallClockS: summary.wallClockS,
-    }
-    const next = [entry, ...items].slice(0, HISTORY_CAP)
-    setItems(next)
-    saveHistory(next)
+  // Append exactly once per pipeline_complete summary (R18). Done DURING render
+  // (the React "storing information from previous renders" pattern) rather than
+  // in an effect — calling setState synchronously inside an effect body causes
+  // cascading renders and is flagged by react-hooks/set-state-in-effect.
+  if (summary && summary !== lastSummary) {
     setLastSummary(summary)
-  }, [summary, lastSummary, items, scenario])
+    setItems((prev) =>
+      [
+        {
+          id: crypto.randomUUID(),
+          runId: summary.winningRunId,
+          timestamp: new Date().toISOString(),
+          scenario,
+          status: summary.overallStatus,
+          wallClockS: summary.wallClockS,
+        },
+        ...prev,
+      ].slice(0, HISTORY_CAP),
+    )
+  }
+
+  // Persist the history to localStorage whenever it changes — syncing React
+  // state to an external system is the sanctioned use of an effect.
+  useEffect(() => {
+    saveHistory(items)
+  }, [items])
 
   const clear = useCallback(() => {
     setItems([])
-    saveHistory([])
   }, [])
 
   if (items.length === 0) return null
diff --git a/frontend/src/hooks/index.ts b/frontend/src/hooks/index.ts
index 1c47074d..eebde40d 100644
--- a/frontend/src/hooks/index.ts
+++ b/frontend/src/hooks/index.ts
@@ -7,6 +7,7 @@ export * from './use-inventory'
 export * from './use-lifecycle-curve'
 export * from './use-runs'
 export * from './use-jobs'
+export * from './use-model-selection'
 export * from './use-ops'
 export * from './use-scenarios'
 export * from './use-rag-sources'
diff --git a/frontend/src/hooks/use-model-selection.test.ts b/frontend/src/hooks/use-model-selection.test.ts
new file mode 100644
index 00000000..5074351b
--- /dev/null
+++ b/frontend/src/hooks/use-model-selection.test.ts
@@ -0,0 +1,364 @@
+/**
+ * Unit tests for the model-selection query hooks (Champion Selector, Slice A).
+ *
+ * Stubs `fetch` to assert the catalog + availability GET URLs and the
+ * availability `enabled` gating. No real backend is exercised.
+ */
+import { QueryClient, QueryClientProvider } from '@tanstack/react-query'
+import { act, renderHook, waitFor } from '@testing-library/react'
+import { afterEach, describe, expect, it, vi } from 'vitest'
+import { createElement, type ReactNode } from 'react'
+
+import {
+  useCancelSelectionRun,
+  useModelCatalog,
+  usePairAvailability,
+  usePredictWinner,
+  usePromoteChampion,
+  useSelectionRun,
+  useSubmitSelectionRun,
+  useTrainSelected,
+  useTrainWinner,
+} from './use-model-selection'
+import type {
+  ModelCatalogResponse,
+  ModelSelectionRunRequest,
+  PairAvailability,
+  SubmitRunResponse,
+} from '@/types/api'
+
+function makeWrapper(client: QueryClient) {
+  return function Wrapper({ children }: { children: ReactNode }) {
+    return createElement(QueryClientProvider, { client }, children)
+  }
+}
+
+function makeClient() {
+  return new QueryClient({ defaultOptions: { queries: { retry: false } } })
+}
+
+const CATALOG: ModelCatalogResponse = {
+  models: [
+    {
+      model_type: 'naive',
+      label: 'Naive',
+      family: 'baseline',
+      feature_aware: false,
+      requires_extra: false,
+      default_params: {},
+      supports_auto_predict: true,
+      description: 'Repeats the last observed value.',
+    },
+  ],
+  default_candidate_model_types: ['naive', 'seasonal_naive', 'moving_average'],
+}
+
+const AVAILABILITY: PairAvailability = {
+  store_id: 7,
+  product_id: 12,
+  first_sales_date: '2026-01-01',
+  last_sales_date: '2026-05-31',
+  observed_days: 150,
+  expected_calendar_days: 151,
+  coverage_ratio: 0.99,
+  missing_days: 1,
+  zero_sale_days: 4,
+  promotion_days: 3,
+  average_daily_demand: 9.2,
+  status: 'ready',
+  recommended_split_config: {
+    strategy: 'expanding',
+    n_splits: 5,
+    min_train_size: 30,
+    gap: 0,
+    horizon: 14,
+  },
+  warnings: [],
+}
+
+afterEach(() => {
+  vi.unstubAllGlobals()
+})
+
+describe('useModelCatalog', () => {
+  it('GETs /model-selection/models and returns the parsed catalog', async () => {
+    const fetchMock = vi.fn().mockResolvedValue(
+      new Response(JSON.stringify(CATALOG), {
+        status: 200,
+        headers: { 'content-type': 'application/json' },
+      }),
+    )
+    vi.stubGlobal('fetch', fetchMock)
+
+    const { result } = renderHook(() => useModelCatalog(), {
+      wrapper: makeWrapper(makeClient()),
+    })
+
+    await waitFor(() => expect(result.current.isSuccess).toBe(true))
+    expect(fetchMock).toHaveBeenCalledTimes(1)
+    expect(fetchMock.mock.calls[0]![0]).toContain('/model-selection/models')
+    expect(result.current.data?.models[0]?.model_type).toBe('naive')
+  })
+})
+
+describe('usePairAvailability', () => {
+  it('GETs /model-selection/availability with the three query params', async () => {
+    const fetchMock = vi.fn().mockResolvedValue(
+      new Response(JSON.stringify(AVAILABILITY), {
+        status: 200,
+        headers: { 'content-type': 'application/json' },
+      }),
+    )
+    vi.stubGlobal('fetch', fetchMock)
+
+    const { result } = renderHook(
+      () => usePairAvailability({ storeId: 7, productId: 12, forecastHorizon: 14 }),
+      { wrapper: makeWrapper(makeClient()) },
+    )
+
+    await waitFor(() => expect(result.current.isSuccess).toBe(true))
+    const url = String(fetchMock.mock.calls[0]![0])
+    expect(url).toContain('/model-selection/availability')
+    expect(url).toContain('store_id=7')
+    expect(url).toContain('product_id=12')
+    expect(url).toContain('forecast_horizon=14')
+    expect(result.current.data?.status).toBe('ready')
+  })
+
+  it('does NOT fetch while the pair is incomplete (enabled gating)', async () => {
+    const fetchMock = vi.fn()
+    vi.stubGlobal('fetch', fetchMock)
+
+    renderHook(
+      () => usePairAvailability({ storeId: null, productId: 12, forecastHorizon: 14 }),
+      { wrapper: makeWrapper(makeClient()) },
+    )
+
+    // Give TanStack a tick; the disabled query must never call fetch.
+    await new Promise((resolve) => setTimeout(resolve, 20))
+    expect(fetchMock).not.toHaveBeenCalled()
+  })
+})
+
+// --------------------------------------------------------------------- Slice B
+
+const SUBMIT_RESPONSE: SubmitRunResponse = {
+  selection_id: 'sel_b',
+  store_id: 7,
+  product_id: 12,
+  status: 'running',
+  selection_window: { start_date: '2026-01-01', end_date: '2026-05-31' },
+  forecast_horizon: 14,
+  ranking_metric: 'wape',
+  availability: null,
+  ranking: [],
+  winner: null,
+  recommendation_confidence: null,
+  confidence_reasons: [],
+  chart_data: null,
+  final_model: null,
+  forecast: null,
+  business_summary: null,
+  error_message: null,
+  created_at: '2026-06-01T12:00:00Z',
+  started_at: '2026-06-01T12:00:00Z',
+  completed_at: null,
+  progress: { total: 1, pending: 1, running: 0, completed: 0, failed: 0, cancelled: 0 },
+  candidate_progress: [
+    {
+      candidate_id: 'c0',
+      ordinal: 0,
+      model_type: 'naive',
+      status: 'pending',
+      error: null,
+      started_at: null,
+      completed_at: null,
+      duration_ms: null,
+    },
+  ],
+  monitor_url: '/model-selection/sel_b',
+  cancel_url: '/model-selection/sel_b',
+}
+
+const RUN_REQUEST: ModelSelectionRunRequest = {
+  store_id: 7,
+  product_id: 12,
+  selection_window: { start_date: '2026-01-01', end_date: '2026-05-31' },
+  forecast_horizon: 14,
+  ranking_metric: 'wape',
+  split_config: {
+    strategy: 'expanding',
+    n_splits: 5,
+    min_train_size: 30,
+    gap: 0,
+    horizon: 14,
+  },
+  candidate_models: [{ model_type: 'naive', params: {} }],
+  feature_frame_version: 1,
+  feature_groups: null,
+  auto_train_winner: false,
+  auto_predict: false,
+}
+
+describe('useSubmitSelectionRun', () => {
+  it('POSTs to /model-selection/runs and seeds the poll cache', async () => {
+    const fetchMock = vi.fn().mockResolvedValue(
+      new Response(JSON.stringify(SUBMIT_RESPONSE), {
+        status: 202,
+        headers: { 'content-type': 'application/json' },
+      }),
+    )
+    vi.stubGlobal('fetch', fetchMock)
+    const client = makeClient()
+    const { result } = renderHook(() => useSubmitSelectionRun(), {
+      wrapper: makeWrapper(client),
+    })
+    await act(async () => {
+      result.current.mutate(RUN_REQUEST)
+    })
+    await waitFor(() => expect(result.current.isSuccess).toBe(true))
+    const call = fetchMock.mock.calls[0]!
+    expect(String(call[0])).toContain('/model-selection/runs')
+    expect((call[1] as RequestInit).method).toBe('POST')
+    // The poll cache is seeded so useSelectionRun starts warm.
+    expect(
+      client.getQueryData(['model-selection', 'run', 'sel_b']),
+    ).toEqual(SUBMIT_RESPONSE)
+  })
+})
+
+describe('useSelectionRun', () => {
+  it('GETs /model-selection/{id} when given a selection id', async () => {
+    const fetchMock = vi.fn().mockResolvedValue(
+      new Response(JSON.stringify({ ...SUBMIT_RESPONSE, status: 'completed' }), {
+        status: 200,
+        headers: { 'content-type': 'application/json' },
+      }),
+    )
+    vi.stubGlobal('fetch', fetchMock)
+    const { result } = renderHook(() => useSelectionRun('sel_b'), {
+      wrapper: makeWrapper(makeClient()),
+    })
+    await waitFor(() => expect(result.current.isSuccess).toBe(true))
+    expect(String(fetchMock.mock.calls[0]![0])).toContain('/model-selection/sel_b')
+    expect(result.current.data?.status).toBe('completed')
+  })
+
+  it('does NOT fetch without a selection id (enabled gating)', async () => {
+    const fetchMock = vi.fn()
+    vi.stubGlobal('fetch', fetchMock)
+    renderHook(() => useSelectionRun(null), { wrapper: makeWrapper(makeClient()) })
+    await new Promise((resolve) => setTimeout(resolve, 20))
+    expect(fetchMock).not.toHaveBeenCalled()
+  })
+})
+
+describe('useCancelSelectionRun', () => {
+  it('DELETEs /model-selection/{id}', async () => {
+    const cancelled = { ...SUBMIT_RESPONSE, status: 'cancelled' as const }
+    const fetchMock = vi.fn().mockResolvedValue(
+      new Response(JSON.stringify(cancelled), {
+        status: 200,
+        headers: { 'content-type': 'application/json' },
+      }),
+    )
+    vi.stubGlobal('fetch', fetchMock)
+    const { result } = renderHook(() => useCancelSelectionRun(), {
+      wrapper: makeWrapper(makeClient()),
+    })
+    await act(async () => {
+      result.current.mutate('sel_b')
+    })
+    await waitFor(() => expect(result.current.isSuccess).toBe(true))
+    const call = fetchMock.mock.calls[0]!
+    expect(String(call[0])).toContain('/model-selection/sel_b')
+    expect((call[1] as RequestInit).method).toBe('DELETE')
+  })
+})
+
+// --------------------------------------------------------------- Slice C hooks
+
+function jsonResponse(body: unknown) {
+  return new Response(JSON.stringify(body), {
+    status: 200,
+    headers: { 'content-type': 'application/json' },
+  })
+}
+
+describe('useTrainWinner', () => {
+  it('POSTs /train-winner (no body) and invalidates the run query', async () => {
+    const fetchMock = vi.fn().mockResolvedValue(
+      jsonResponse({ selection_id: 'sel_c', model_type: 'naive', model_path: 'p', is_override: false, override_warning: null }),
+    )
+    vi.stubGlobal('fetch', fetchMock)
+    const { result } = renderHook(() => useTrainWinner('sel_c'), {
+      wrapper: makeWrapper(makeClient()),
+    })
+    await act(async () => {
+      result.current.mutate()
+    })
+    await waitFor(() => expect(result.current.isSuccess).toBe(true))
+    const call = fetchMock.mock.calls[0]!
+    expect(String(call[0])).toContain('/model-selection/sel_c/train-winner')
+    expect((call[1] as RequestInit).method).toBe('POST')
+  })
+})
+
+describe('useTrainSelected', () => {
+  it('POSTs /train-selected with the override body', async () => {
+    const fetchMock = vi.fn().mockResolvedValue(
+      jsonResponse({ selection_id: 'sel_c', model_type: 'seasonal_naive', model_path: 'p', is_override: true, override_warning: 'w' }),
+    )
+    vi.stubGlobal('fetch', fetchMock)
+    const { result } = renderHook(() => useTrainSelected('sel_c'), {
+      wrapper: makeWrapper(makeClient()),
+    })
+    await act(async () => {
+      result.current.mutate({ model_type: 'seasonal_naive', override_reason: 'domain' })
+    })
+    await waitFor(() => expect(result.current.isSuccess).toBe(true))
+    const call = fetchMock.mock.calls[0]!
+    expect(String(call[0])).toContain('/model-selection/sel_c/train-selected')
+    expect((call[1] as RequestInit).method).toBe('POST')
+    expect(String((call[1] as RequestInit).body)).toContain('seasonal_naive')
+  })
+})
+
+describe('usePredictWinner', () => {
+  it('POSTs /predict with the decision params body', async () => {
+    const fetchMock = vi.fn().mockResolvedValue(
+      jsonResponse({ selection_id: 'sel_c', forecast: { points: [], total_demand: 0, average_demand: 0, horizon: 14 }, decision: null }),
+    )
+    vi.stubGlobal('fetch', fetchMock)
+    const { result } = renderHook(() => usePredictWinner('sel_c'), {
+      wrapper: makeWrapper(makeClient()),
+    })
+    await act(async () => {
+      result.current.mutate({ lead_time_days: 7, service_level: 0.95 })
+    })
+    await waitFor(() => expect(result.current.isSuccess).toBe(true))
+    const call = fetchMock.mock.calls[0]!
+    expect(String(call[0])).toContain('/model-selection/sel_c/predict')
+    expect((call[1] as RequestInit).method).toBe('POST')
+  })
+})
+
+describe('usePromoteChampion', () => {
+  it('POSTs /promote with the promote body', async () => {
+    const fetchMock = vi.fn().mockResolvedValue(
+      jsonResponse({ selection_id: 'sel_c', alias_name: 'champion-x', run_id: 'r', run_status: 'success', model_type: 'naive', is_override: false, promoted_at: '2026-06-01T00:00:00Z' }),
+    )
+    vi.stubGlobal('fetch', fetchMock)
+    const { result } = renderHook(() => usePromoteChampion('sel_c'), {
+      wrapper: makeWrapper(makeClient()),
+    })
+    await act(async () => {
+      result.current.mutate({ alias_name: 'champion-x', approved_by: 'gabor' })
+    })
+    await waitFor(() => expect(result.current.isSuccess).toBe(true))
+    const call = fetchMock.mock.calls[0]!
+    expect(String(call[0])).toContain('/model-selection/sel_c/promote')
+    expect((call[1] as RequestInit).method).toBe('POST')
+    expect(String((call[1] as RequestInit).body)).toContain('champion-x')
+  })
+})
diff --git a/frontend/src/hooks/use-model-selection.ts b/frontend/src/hooks/use-model-selection.ts
new file mode 100644
index 00000000..bc861a1b
--- /dev/null
+++ b/frontend/src/hooks/use-model-selection.ts
@@ -0,0 +1,190 @@
+import { useMutation, useQuery, useQueryClient } from '@tanstack/react-query'
+import { api } from '@/lib/api'
+import { isTerminalSelectionStatus } from '@/components/champion-selector/results/constants'
+import type {
+  ForecastDecisionParams,
+  ModelCatalogResponse,
+  ModelSelectionRunRequest,
+  ModelSelectionRunResponse,
+  PairAvailability,
+  PredictWinnerResponse,
+  PromoteRequest,
+  PromoteResponse,
+  SubmitRunResponse,
+  TrainSelectedRequest,
+  TrainWinnerResponse,
+} from '@/types/api'
+
+/**
+ * Model-selection query hooks (Champion Selector).
+ *
+ * Slice A: catalog + availability GETs. Slice B: async submit / poll / cancel.
+ * Slice C: train (winner / override) / predict (decision) / promote.
+ */
+
+/**
+ * Fetch the backend-owned candidate-model capability catalog.
+ *
+ * The catalog is static, so it is cached aggressively (no refetch churn).
+ */
+export function useModelCatalog() {
+  return useQuery({
+    queryKey: ['model-selection', 'models'],
+    queryFn: () => api<ModelCatalogResponse>('/model-selection/models'),
+    staleTime: 1000 * 60 * 60, // 1h — the catalog rarely changes within a session
+  })
+}
+
+interface UsePairAvailabilityParams {
+  storeId: number | null
+  productId: number | null
+  forecastHorizon: number
+  enabled?: boolean
+}
+
+/**
+ * Assess data availability for a (store, product) pair at a given horizon.
+ *
+ * Gated like `useStore`: only fires once a real pair is chosen. `storeId` /
+ * `productId` are nullable so the page can pass its raw selection state without
+ * coercing un-selected values to a bogus `0`/`1`.
+ */
+export function usePairAvailability({
+  storeId,
+  productId,
+  forecastHorizon,
+  enabled = true,
+}: UsePairAvailabilityParams) {
+  return useQuery({
+    queryKey: ['model-selection', 'availability', storeId, productId, forecastHorizon],
+    queryFn: () =>
+      api<PairAvailability>('/model-selection/availability', {
+        params: {
+          store_id: storeId,
+          product_id: productId,
+          forecast_horizon: forecastHorizon,
+        },
+      }),
+    enabled: enabled && !!storeId && storeId > 0 && !!productId && productId > 0,
+  })
+}
+
+/**
+ * Submit an async selection run (Slice B). `POST /model-selection/runs` returns
+ * 202 immediately; we seed the poll cache so `useSelectionRun` starts warm.
+ */
+export function useSubmitSelectionRun() {
+  const queryClient = useQueryClient()
+  return useMutation({
+    mutationFn: (request: ModelSelectionRunRequest) =>
+      api<SubmitRunResponse>('/model-selection/runs', {
+        method: 'POST',
+        body: request,
+      }),
+    onSuccess: (data) => {
+      queryClient.setQueryData(['model-selection', 'run', data.selection_id], data)
+    },
+  })
+}
+
+/**
+ * Poll one selection run. Refetches every 2s while pending/running, then stops
+ * once the run reaches a terminal status. Gated on a real selection id.
+ */
+export function useSelectionRun(selectionId: string | null, enabled = true) {
+  return useQuery({
+    queryKey: ['model-selection', 'run', selectionId],
+    queryFn: () =>
+      api<ModelSelectionRunResponse>(`/model-selection/${selectionId}`),
+    enabled: enabled && !!selectionId,
+    refetchInterval: (query) => {
+      const status = query.state.data?.status
+      return status && isTerminalSelectionStatus(status) ? false : 2000
+    },
+  })
+}
+
+/**
+ * Cancel an in-flight selection run (Slice B). `DELETE /model-selection/{id}` —
+ * 200 settled / 404 / 409 terminal / 504 drain timeout. Seeds + invalidates the
+ * poll query on success.
+ */
+export function useCancelSelectionRun() {
+  const queryClient = useQueryClient()
+  return useMutation({
+    mutationFn: (selectionId: string) =>
+      api<ModelSelectionRunResponse>(`/model-selection/${selectionId}`, {
+        method: 'DELETE',
+      }),
+    onSuccess: (data) => {
+      queryClient.setQueryData(['model-selection', 'run', data.selection_id], data)
+      void queryClient.invalidateQueries({
+        queryKey: ['model-selection', 'run', data.selection_id],
+      })
+    },
+  })
+}
+
+/**
+ * Invalidate the polled run query so a terminal run re-fetches the new
+ * `final_model_path` / `forecast` / promotion after a Slice C mutation.
+ */
+function invalidateRun(
+  queryClient: ReturnType<typeof useQueryClient>,
+  selectionId: string,
+) {
+  void queryClient.invalidateQueries({
+    queryKey: ['model-selection', 'run', selectionId],
+  })
+}
+
+/** Train the ranked winner (`POST /{id}/train-winner`, no body). */
+export function useTrainWinner(selectionId: string) {
+  const queryClient = useQueryClient()
+  return useMutation({
+    mutationFn: () =>
+      api<TrainWinnerResponse>(`/model-selection/${selectionId}/train-winner`, {
+        method: 'POST',
+      }),
+    onSuccess: () => invalidateRun(queryClient, selectionId),
+  })
+}
+
+/** Train a user-chosen candidate (`POST /{id}/train-selected`, override). */
+export function useTrainSelected(selectionId: string) {
+  const queryClient = useQueryClient()
+  return useMutation({
+    mutationFn: (body: TrainSelectedRequest) =>
+      api<TrainWinnerResponse>(`/model-selection/${selectionId}/train-selected`, {
+        method: 'POST',
+        body,
+      }),
+    onSuccess: () => invalidateRun(queryClient, selectionId),
+  })
+}
+
+/** Forecast with the trained model + decision (`POST /{id}/predict`). */
+export function usePredictWinner(selectionId: string) {
+  const queryClient = useQueryClient()
+  return useMutation({
+    mutationFn: (body: ForecastDecisionParams) =>
+      api<PredictWinnerResponse>(`/model-selection/${selectionId}/predict`, {
+        method: 'POST',
+        body,
+      }),
+    onSuccess: () => invalidateRun(queryClient, selectionId),
+  })
+}
+
+/** Promote the trained champion to a registry alias (`POST /{id}/promote`). */
+export function usePromoteChampion(selectionId: string) {
+  const queryClient = useQueryClient()
+  return useMutation({
+    mutationFn: (body: PromoteRequest) =>
+      api<PromoteResponse>(`/model-selection/${selectionId}/promote`, {
+        method: 'POST',
+        body,
+      }),
+    onSuccess: () => invalidateRun(queryClient, selectionId),
+  })
+}
diff --git a/frontend/src/lib/approval-report.test.ts b/frontend/src/lib/approval-report.test.ts
new file mode 100644
index 00000000..f94f04d9
--- /dev/null
+++ b/frontend/src/lib/approval-report.test.ts
@@ -0,0 +1,67 @@
+import { describe, it, expect } from 'vitest'
+import { formatApprovalReport } from './approval-report'
+import type { ApprovalResponse } from '@/types/api'
+
+describe('formatApprovalReport', () => {
+  it('reports a successful execution', () => {
+    const res: ApprovalResponse = {
+      action_id: 'a1',
+      approved: true,
+      status: 'executed',
+      result: { alias_name: 'champion' },
+    }
+    const msg = formatApprovalReport('create_alias', res)
+    expect(msg).toContain('✅')
+    expect(msg).toContain('create_alias')
+    expect(msg).toContain('executed successfully')
+  })
+
+  it('reports an approved-but-failed execution with the error cause', () => {
+    // The backend marks a failed execution `rejected` with the cause in result.error.
+    const res: ApprovalResponse = {
+      action_id: 'a2',
+      approved: true,
+      status: 'rejected',
+      result: { error: 'Run not found: 3c5d', error_type: 'ValueError' },
+    }
+    const msg = formatApprovalReport('create_alias', res)
+    expect(msg).toContain('❌')
+    expect(msg).toContain('could not be executed')
+    expect(msg).toContain('Run not found: 3c5d')
+  })
+
+  it('reports an operator rejection (no execution)', () => {
+    const res: ApprovalResponse = {
+      action_id: 'a3',
+      approved: false,
+      status: 'rejected',
+      result: null,
+    }
+    const msg = formatApprovalReport('archive_run', res)
+    expect(msg).toContain('🚫')
+    expect(msg).toContain('Rejected')
+    expect(msg).toContain('No action was taken')
+  })
+
+  it('reports an expired approval', () => {
+    const res: ApprovalResponse = {
+      action_id: 'a4',
+      approved: true,
+      status: 'expired',
+      result: null,
+    }
+    const msg = formatApprovalReport('save_scenario', res)
+    expect(msg).toContain('⏰')
+    expect(msg).toContain('expired')
+  })
+
+  it('does not throw on a non-object result', () => {
+    const res: ApprovalResponse = {
+      action_id: 'a5',
+      approved: true,
+      status: 'executed',
+      result: 'ok',
+    }
+    expect(() => formatApprovalReport('create_alias', res)).not.toThrow()
+  })
+})
diff --git a/frontend/src/lib/approval-report.ts b/frontend/src/lib/approval-report.ts
new file mode 100644
index 00000000..f041157e
--- /dev/null
+++ b/frontend/src/lib/approval-report.ts
@@ -0,0 +1,44 @@
+import type { ApprovalResponse } from '@/types/api'
+
+/**
+ * Build a human-readable chat report for an approved/rejected agent action.
+ *
+ * The backend's `POST /approve` returns an {@link ApprovalResponse} for every
+ * outcome, but the chat UI previously discarded it — so a click produced no
+ * visible result ("nothing returned"). This formats a one-line report for ALL
+ * outcomes so the operator always sees what happened:
+ *
+ * - `executed`                      → the action ran successfully.
+ * - approved but `rejected` + error → the action was approved but execution
+ *   failed (the backend marks a failed execution `rejected` and puts the cause
+ *   in `result.error`).
+ * - `rejected` (not approved)       → the operator rejected the action.
+ * - `expired`                       → the approval window lapsed before it ran.
+ *
+ * @param actionLabel - The gated action name (e.g. `create_alias`).
+ * @param res - The approval response from the backend.
+ * @returns A markdown-ish one-line report for the chat transcript.
+ */
+export function formatApprovalReport(actionLabel: string, res: ApprovalResponse): string {
+  const result =
+    res.result && typeof res.result === 'object'
+      ? (res.result as Record<string, unknown>)
+      : undefined
+  const errorDetail =
+    result && 'error' in result ? String(result.error) : undefined
+
+  if (res.status === 'executed') {
+    return `✅ Approved — \`${actionLabel}\` executed successfully.`
+  }
+  if (res.approved && errorDetail) {
+    return `❌ Approved, but \`${actionLabel}\` could not be executed: ${errorDetail}`
+  }
+  if (!res.approved) {
+    return `🚫 Rejected \`${actionLabel}\`. No action was taken.`
+  }
+  if (res.status === 'expired') {
+    return `⏰ The \`${actionLabel}\` approval expired before it could run.`
+  }
+  // Defensive fallback: approved, not executed, no error detail.
+  return `\`${actionLabel}\` finished with status: ${res.status}.`
+}
diff --git a/frontend/src/lib/constants.ts b/frontend/src/lib/constants.ts
index 6a6de39f..95cb28b8 100644
--- a/frontend/src/lib/constants.ts
+++ b/frontend/src/lib/constants.ts
@@ -25,6 +25,7 @@ export const ROUTES = {
     DEMAND: '/visualize/demand',
     PLANNER: '/visualize/planner',
     BATCH: '/visualize/batch',
+    CHAMPION: '/visualize/champion',
   },
   KNOWLEDGE: '/knowledge',
   CHAT: '/chat',
@@ -55,6 +56,7 @@ export const NAV_ITEMS = [
       { label: 'Forecast', href: ROUTES.VISUALIZE.FORECAST },
       { label: 'Backtest Results', href: ROUTES.VISUALIZE.BACKTEST },
       { label: 'Batch Runner', href: ROUTES.VISUALIZE.BATCH },
+      { label: 'Champion Selector', href: ROUTES.VISUALIZE.CHAMPION },
     ],
   },
   { label: 'Knowledge', href: ROUTES.KNOWLEDGE },
diff --git a/frontend/src/pages/chat.tsx b/frontend/src/pages/chat.tsx
index cc22a9d5..6bbaaeb6 100644
--- a/frontend/src/pages/chat.tsx
+++ b/frontend/src/pages/chat.tsx
@@ -16,8 +16,15 @@ import {
   SelectValue,
 } from '@/components/ui/select'
 import { api } from '@/lib/api'
+import { formatApprovalReport } from '@/lib/approval-report'
 import { WS_URL, ROUTES } from '@/lib/constants'
-import type { ChatMessage as ChatMessageType, AgentStreamEvent, AgentType, AgentSession } from '@/types/api'
+import type {
+  ChatMessage as ChatMessageType,
+  AgentStreamEvent,
+  AgentType,
+  AgentSession,
+  ApprovalResponse,
+} from '@/types/api'
 
 export default function ChatPage() {
   const [sessionId, setSessionId] = useState<string | null>(null)
@@ -142,38 +149,42 @@ export default function ChatPage() {
     send({ session_id: sessionId, message: content })
   }
 
-  const handleApprove = async () => {
-    if (!sessionId || !pendingAction?.actionId) return
-    setIsApproving(true)
-    try {
-      await api(`/agents/sessions/${sessionId}/approve`, {
-        method: 'POST',
-        body: { action_id: pendingAction.actionId, approved: true },
-      })
-      setPendingAction(null)
-    } catch (error) {
-      console.error('Failed to approve:', error)
-    } finally {
-      setIsApproving(false)
-    }
+  const appendAssistantMessage = (content: string) => {
+    setMessages((prev) => [
+      ...prev,
+      { role: 'assistant', content, timestamp: new Date().toISOString() },
+    ])
   }
 
-  const handleReject = async () => {
+  // Approve or reject a pending action, then ALWAYS surface the execution
+  // report — for every outcome (executed / failed / rejected / expired). The
+  // handlers previously discarded the /approve response, so a click left the
+  // user with no feedback ("nothing returned").
+  const decideAction = async (approved: boolean) => {
     if (!sessionId || !pendingAction?.actionId) return
+    const actionLabel = pendingAction.action
     setIsApproving(true)
     try {
-      await api(`/agents/sessions/${sessionId}/approve`, {
+      const res = await api<ApprovalResponse>(`/agents/sessions/${sessionId}/approve`, {
         method: 'POST',
-        body: { action_id: pendingAction.actionId, approved: false },
+        body: { action_id: pendingAction.actionId, approved },
       })
       setPendingAction(null)
+      appendAssistantMessage(formatApprovalReport(actionLabel, res))
     } catch (error) {
-      console.error('Failed to reject:', error)
+      console.error(approved ? 'Failed to approve:' : 'Failed to reject:', error)
+      setPendingAction(null)
+      const verb = approved ? 'approve' : 'reject'
+      const detail = error instanceof Error ? error.message : 'request failed'
+      appendAssistantMessage(`Error: could not ${verb} \`${actionLabel}\` — ${detail}`)
     } finally {
       setIsApproving(false)
     }
   }
 
+  const handleApprove = () => decideAction(true)
+  const handleReject = () => decideAction(false)
+
   const handleNewSession = () => {
     setSessionId(null)
     setMessages([])
diff --git a/frontend/src/pages/visualize/champion.test.tsx b/frontend/src/pages/visualize/champion.test.tsx
new file mode 100644
index 00000000..2ae297ca
--- /dev/null
+++ b/frontend/src/pages/visualize/champion.test.tsx
@@ -0,0 +1,122 @@
+import { afterEach, beforeAll, describe, expect, it, vi } from 'vitest'
+import { cleanup, render, screen, waitFor } from '@testing-library/react'
+import type { ModelCatalogResponse } from '@/types/api'
+
+// Radix primitives need a couple of layout APIs jsdom lacks.
+beforeAll(() => {
+  class ResizeObserverStub {
+    observe() {}
+    unobserve() {}
+    disconnect() {}
+  }
+  vi.stubGlobal('ResizeObserver', ResizeObserverStub)
+  if (!Element.prototype.hasPointerCapture) {
+    Element.prototype.hasPointerCapture = () => false
+  }
+  if (!Element.prototype.scrollIntoView) {
+    Element.prototype.scrollIntoView = () => {}
+  }
+})
+
+const CATALOG: ModelCatalogResponse = {
+  models: [
+    {
+      model_type: 'naive',
+      label: 'Naive',
+      family: 'baseline',
+      feature_aware: false,
+      requires_extra: false,
+      default_params: {},
+      supports_auto_predict: true,
+      description: 'Repeats the last observed value.',
+    },
+    {
+      model_type: 'regression',
+      label: 'Gradient Boosting Regression',
+      family: 'tree',
+      feature_aware: true,
+      requires_extra: false,
+      default_params: {},
+      supports_auto_predict: false,
+      description: 'Histogram gradient boosting.',
+    },
+  ],
+  default_candidate_model_types: ['naive', 'regression'],
+}
+
+vi.mock('@/hooks/use-stores', () => ({
+  useStores: () => ({
+    data: { stores: [{ id: 7, code: 'S001', name: 'Downtown', region: 'North', store_type: 'flagship' }] },
+    isLoading: false,
+  }),
+}))
+vi.mock('@/hooks/use-products', () => ({
+  useProducts: () => ({
+    data: { products: [{ id: 12, sku: 'SKU1', name: 'Widget', category: 'tools' }] },
+    isLoading: false,
+  }),
+}))
+vi.mock('@/hooks/use-model-selection', () => ({
+  useModelCatalog: () => ({
+    data: CATALOG,
+    isLoading: false,
+    isError: false,
+    error: null,
+    refetch: () => {},
+  }),
+  usePairAvailability: () => ({
+    data: undefined,
+    isLoading: false,
+    isError: false,
+  }),
+  // Slice B — inert async hooks (no run in progress for the shell test).
+  useSubmitSelectionRun: () => ({ mutate: vi.fn(), isPending: false }),
+  useCancelSelectionRun: () => ({ mutate: vi.fn(), isPending: false }),
+  useSelectionRun: () => ({ data: undefined, isLoading: false, isError: false }),
+}))
+
+import ChampionSelectorPage from './champion'
+
+afterEach(cleanup)
+
+describe('ChampionSelectorPage', () => {
+  it('renders the selection shell', () => {
+    render(<ChampionSelectorPage />)
+    expect(screen.getByText('Champion Selector')).toBeTruthy()
+    expect(screen.getByText('1 · Pick a store & product')).toBeTruthy()
+    expect(screen.getByText('2 · Data availability')).toBeTruthy()
+    expect(screen.getByText('3 · Candidate models')).toBeTruthy()
+    expect(screen.getByText('4 · Backtest settings')).toBeTruthy()
+  })
+
+  it('drives candidate cards from the backend catalog', () => {
+    render(<ChampionSelectorPage />)
+    expect(screen.getByTestId('candidate-model-naive')).toBeTruthy()
+    expect(screen.getByTestId('candidate-model-regression')).toBeTruthy()
+  })
+
+  it('pre-selects the catalog default candidate models', async () => {
+    render(<ChampionSelectorPage />)
+    // The seeding effect selects the default two models.
+    await waitFor(() =>
+      expect(screen.getByText('2 of 10 selected')).toBeTruthy(),
+    )
+  })
+
+  it('renders the availability empty state until a pair is chosen', () => {
+    render(<ChampionSelectorPage />)
+    expect(screen.getByText('Pick a store and product')).toBeTruthy()
+  })
+
+  it('keeps the Run comparison CTA disabled and issues no POST', () => {
+    const fetchMock = vi.fn()
+    vi.stubGlobal('fetch', fetchMock)
+    render(<ChampionSelectorPage />)
+    const cta = screen.getByTestId('run-comparison-cta') as HTMLButtonElement
+    expect(cta.disabled).toBe(true)
+    // The page itself issues no network calls (the hooks are mocked); in
+    // particular it never POSTs to /model-selection/run.
+    expect(fetchMock).not.toHaveBeenCalled()
+    vi.unstubAllGlobals()
+  })
+})
diff --git a/frontend/src/pages/visualize/champion.tsx b/frontend/src/pages/visualize/champion.tsx
new file mode 100644
index 00000000..30b624c8
--- /dev/null
+++ b/frontend/src/pages/visualize/champion.tsx
@@ -0,0 +1,387 @@
+import { useMemo, useState } from 'react'
+import { format } from 'date-fns'
+import { DateRange } from 'react-day-picker'
+import { Loader2, Trophy } from 'lucide-react'
+import { useStores } from '@/hooks/use-stores'
+import { useProducts } from '@/hooks/use-products'
+import {
+  useCancelSelectionRun,
+  useModelCatalog,
+  usePairAvailability,
+  useSelectionRun,
+  useSubmitSelectionRun,
+} from '@/hooks/use-model-selection'
+import { DateRangePicker } from '@/components/common/date-range-picker'
+import { ErrorDisplay } from '@/components/common/error-display'
+import { AvailabilityPanel } from '@/components/champion-selector/availability-panel'
+import { BacktestSettingsForm } from '@/components/champion-selector/backtest-settings-form'
+import { splitConfigErrors } from '@/components/champion-selector/split-config'
+import { CandidateModelPicker } from '@/components/champion-selector/candidate-model-picker'
+import { SearchableEntitySelect } from '@/components/champion-selector/searchable-entity-select'
+import { assembleRunRequest } from '@/components/champion-selector/run-request'
+import { RunProgressPanel } from '@/components/champion-selector/results/run-progress-panel'
+import { RankingTable } from '@/components/champion-selector/results/ranking-table'
+import { WinnerCard } from '@/components/champion-selector/results/winner-card'
+import { ComparisonCharts } from '@/components/champion-selector/results/comparison-charts'
+import { ModelDetailDrawer } from '@/components/champion-selector/results/model-detail-drawer'
+import { CancelRunDialog } from '@/components/champion-selector/results/cancel-run-dialog'
+import { DecisionSection } from '@/components/champion-selector/decision/decision-section'
+import { isTerminalSelectionStatus } from '@/components/champion-selector/results/constants'
+import { Button } from '@/components/ui/button'
+import { Card, CardContent, CardDescription, CardHeader, CardTitle } from '@/components/ui/card'
+import { Input } from '@/components/ui/input'
+import { getErrorMessage } from '@/lib/api'
+import type {
+  ModelRankEntry,
+  ModelSelectionRunRequest,
+  SplitConfig,
+} from '@/types/api'
+
+const DEFAULT_HORIZON = 14
+
+const DEFAULT_SPLIT: SplitConfig = {
+  strategy: 'expanding',
+  n_splits: 5,
+  min_train_size: 30,
+  gap: 0,
+  horizon: DEFAULT_HORIZON,
+}
+
+/**
+ * Forecast Champion Selector — Slice A.
+ *
+ * Configuration + availability triage only. It assembles a typed
+ * `ModelSelectionRunRequest` in component state and surfaces a DISABLED
+ * "Run comparison" CTA — the comparison RUN itself (and all results/training)
+ * lands in Slices B/C. This page calls only the two read GETs (catalog +
+ * availability); it never POSTs.
+ */
+export default function ChampionSelectorPage() {
+  const [storeId, setStoreId] = useState<number | null>(null)
+  const [productId, setProductId] = useState<number | null>(null)
+  const [dateRange, setDateRange] = useState<DateRange | undefined>()
+  const [forecastHorizon, setForecastHorizon] = useState(DEFAULT_HORIZON)
+  const [splitConfig, setSplitConfig] = useState<SplitConfig>(DEFAULT_SPLIT)
+  const [rankingMetric, setRankingMetric] = useState<
+    ModelSelectionRunRequest['ranking_metric']
+  >('wape')
+  // `null` means "the user hasn't edited the selection yet" — fall back to the
+  // catalog's default candidate set (derived below, no effect needed).
+  const [editedModels, setEditedModels] = useState<string[] | null>(null)
+
+  // Slice B — the in-flight/terminal async run + the detail-drawer selection.
+  const [selectionId, setSelectionId] = useState<string | null>(null)
+  const [submitError, setSubmitError] = useState<string | null>(null)
+  const [drawerEntry, setDrawerEntry] = useState<ModelRankEntry | null>(null)
+  const [drawerOpen, setDrawerOpen] = useState(false)
+
+  // /dimensions/{stores,products} both cap page_size at 100 (client-filtered).
+  const storesQuery = useStores({ page: 1, pageSize: 100 })
+  const productsQuery = useProducts({ page: 1, pageSize: 100 })
+  const catalogQuery = useModelCatalog()
+
+  const validPair = !!storeId && !!productId
+  const availabilityQuery = usePairAvailability({
+    storeId,
+    productId,
+    forecastHorizon,
+    enabled: validPair,
+  })
+
+  // Pre-select the backend default candidate set until the user edits it —
+  // derived during render rather than seeded via an effect.
+  const selectedModels =
+    editedModels ?? catalogQuery.data?.default_candidate_model_types ?? []
+
+  // split_config.horizon must equal forecast_horizon (the backend validator).
+  // Force it during render so no effect is needed to keep them in sync.
+  const effectiveSplit: SplitConfig = useMemo(
+    () => ({ ...splitConfig, horizon: forecastHorizon }),
+    [splitConfig, forecastHorizon],
+  )
+
+  const storeItems = useMemo(
+    () =>
+      (storesQuery.data?.stores ?? []).map((store) => ({
+        id: store.id,
+        primary: `${store.code} · ${store.name}`,
+        secondary: [store.region, store.store_type].filter(Boolean).join(' · '),
+      })),
+    [storesQuery.data],
+  )
+  const productItems = useMemo(
+    () =>
+      (productsQuery.data?.products ?? []).map((product) => ({
+        id: product.id,
+        primary: `${product.sku} · ${product.name}`,
+        secondary: product.category ?? undefined,
+      })),
+    [productsQuery.data],
+  )
+
+  const formReady =
+    validPair &&
+    !!dateRange?.from &&
+    !!dateRange?.to &&
+    forecastHorizon >= 1 &&
+    forecastHorizon <= 90 &&
+    selectedModels.length >= 1 &&
+    splitConfigErrors(effectiveSplit).length === 0
+
+  // The assembled request — `auto_train_winner`/`auto_predict` pinned false by
+  // `assembleRunRequest` (no-ops in the async path; Slice C owns train/predict).
+  const runRequest: ModelSelectionRunRequest | null =
+    formReady && dateRange?.from && dateRange?.to
+      ? assembleRunRequest({
+          storeId: storeId!,
+          productId: productId!,
+          startDate: format(dateRange.from, 'yyyy-MM-dd'),
+          endDate: format(dateRange.to, 'yyyy-MM-dd'),
+          forecastHorizon,
+          rankingMetric,
+          splitConfig: effectiveSplit,
+          selectedModels,
+        })
+      : null
+
+  // Slice B — async submit → poll → cancel.
+  const submitRun = useSubmitSelectionRun()
+  const cancelRun = useCancelSelectionRun()
+  const runQuery = useSelectionRun(selectionId)
+  const run = runQuery.data
+  const isRunning = !!run && !isTerminalSelectionStatus(run.status)
+  const isTerminal = !!run && isTerminalSelectionStatus(run.status)
+
+  function handleRunComparison() {
+    if (!runRequest) return
+    setSubmitError(null)
+    submitRun.mutate(runRequest, {
+      onSuccess: (data) => setSelectionId(data.selection_id),
+      onError: (err) => setSubmitError(getErrorMessage(err)),
+    })
+  }
+
+  function handleSelectModel(entry: ModelRankEntry) {
+    setDrawerEntry(entry)
+    setDrawerOpen(true)
+  }
+
+  return (
+    <div className="space-y-6">
+      <div>
+        <h1 className="flex items-center gap-2 text-3xl font-bold">
+          <Trophy className="h-7 w-7" />
+          Champion Selector
+        </h1>
+        <p className="mt-1 text-sm text-muted-foreground">
+          Configure a store, product, time period, horizon and candidate models,
+          and check whether the pair has enough history to model. Running the
+          comparison arrives in a later update.
+        </p>
+      </div>
+
+      {/* Selection */}
+      <Card>
+        <CardHeader>
+          <CardTitle>1 · Pick a store &amp; product</CardTitle>
+          <CardDescription>
+            Search by code/SKU or name. The availability check runs automatically
+            once a valid pair and horizon are chosen.
+          </CardDescription>
+        </CardHeader>
+        <CardContent className="space-y-4">
+          <div className="grid grid-cols-1 gap-4 lg:grid-cols-2">
+            <div className="space-y-1">
+              <span className="text-xs text-muted-foreground">Store</span>
+              <SearchableEntitySelect
+                items={storeItems}
+                value={storeId}
+                onChange={setStoreId}
+                loading={storesQuery.isLoading}
+                placeholder="Pick a store…"
+                testId="champion-store-select"
+              />
+            </div>
+            <div className="space-y-1">
+              <span className="text-xs text-muted-foreground">Product</span>
+              <SearchableEntitySelect
+                items={productItems}
+                value={productId}
+                onChange={setProductId}
+                loading={productsQuery.isLoading}
+                placeholder="Pick a product…"
+                testId="champion-product-select"
+              />
+            </div>
+            <div className="space-y-1">
+              <span className="text-xs text-muted-foreground">Time period</span>
+              <DateRangePicker value={dateRange} onChange={setDateRange} />
+            </div>
+            <div className="space-y-1">
+              <span className="text-xs text-muted-foreground">
+                Forecast horizon (days)
+              </span>
+              <Input
+                type="number"
+                min={1}
+                max={90}
+                value={String(forecastHorizon)}
+                data-testid="champion-horizon"
+                onChange={(event) =>
+                  setForecastHorizon(Number(event.target.value) || 0)
+                }
+              />
+            </div>
+          </div>
+        </CardContent>
+      </Card>
+
+      {/* Availability */}
+      <Card>
+        <CardHeader>
+          <CardTitle>2 · Data availability</CardTitle>
+          <CardDescription>
+            Whether this pair has enough observed history for a reliable
+            comparison, plus the recommended split.
+          </CardDescription>
+        </CardHeader>
+        <CardContent>
+          <AvailabilityPanel
+            availability={availabilityQuery.data}
+            isLoading={validPair && availabilityQuery.isLoading}
+            isError={availabilityQuery.isError}
+          />
+        </CardContent>
+      </Card>
+
+      {/* Candidate models */}
+      <Card>
+        <CardHeader>
+          <CardTitle>3 · Candidate models</CardTitle>
+          <CardDescription>
+            Pick the models to compare (up to 10). The default five are
+            pre-selected; opt-in extras are flagged.
+          </CardDescription>
+        </CardHeader>
+        <CardContent>
+          {catalogQuery.isError ? (
+            <ErrorDisplay
+              error={catalogQuery.error}
+              title="Could not load the model catalog"
+              onRetry={() => catalogQuery.refetch()}
+            />
+          ) : (
+            <CandidateModelPicker
+              catalog={catalogQuery.data}
+              selected={selectedModels}
+              onChange={setEditedModels}
+              isLoading={catalogQuery.isLoading}
+            />
+          )}
+        </CardContent>
+      </Card>
+
+      {/* Backtest settings */}
+      <Card>
+        <CardHeader>
+          <CardTitle>4 · Backtest settings</CardTitle>
+          <CardDescription>
+            The ranking metric and cross-validation split. Start with the
+            recommended split or fine-tune under Advanced.
+          </CardDescription>
+        </CardHeader>
+        <CardContent>
+          <BacktestSettingsForm
+            value={effectiveSplit}
+            rankingMetric={rankingMetric}
+            forecastHorizon={forecastHorizon}
+            onChange={setSplitConfig}
+            onRankingMetricChange={setRankingMetric}
+            recommended={availabilityQuery.data?.recommended_split_config}
+          />
+        </CardContent>
+      </Card>
+
+      {/* Run CTA (Slice B — submit the async comparison) */}
+      <Card>
+        <CardContent className="flex flex-col gap-3 pt-6 sm:flex-row sm:items-center sm:justify-between">
+          <div className="text-sm text-muted-foreground">
+            {formReady
+              ? `Ready to compare ${selectedModels.length} model${
+                  selectedModels.length === 1 ? '' : 's'
+                }.`
+              : 'Pick a store, product, time period, horizon and at least one model to continue.'}
+            {submitError && (
+              <span className="ml-2 text-destructive">{submitError}</span>
+            )}
+          </div>
+          <div className="flex items-center gap-2">
+            {isRunning && (
+              <CancelRunDialog
+                onConfirm={() => selectionId && cancelRun.mutate(selectionId)}
+                isCancelling={cancelRun.isPending}
+              />
+            )}
+            <Button
+              type="button"
+              disabled={!formReady || submitRun.isPending || isRunning}
+              data-testid="run-comparison-cta"
+              onClick={handleRunComparison}
+            >
+              {submitRun.isPending || isRunning ? (
+                <Loader2 className="mr-2 h-4 w-4 animate-spin" />
+              ) : (
+                <Trophy className="mr-2 h-4 w-4" />
+              )}
+              {isRunning ? 'Running…' : 'Run comparison'}
+            </Button>
+          </div>
+        </CardContent>
+      </Card>
+
+      {/* Live progress + results (Slice B) */}
+      {run && (
+        <RunProgressPanel
+          status={run.status}
+          progress={run.progress ?? null}
+          candidates={run.candidate_progress ?? []}
+        />
+      )}
+
+      {isTerminal && run && (
+        <>
+          <WinnerCard
+            winner={run.winner}
+            confidence={run.recommendation_confidence}
+            reasons={run.confidence_reasons}
+            businessSummary={run.business_summary}
+          />
+          {run.chart_data && (
+            <ComparisonCharts
+              chartData={run.chart_data}
+              winnerModelType={run.winner?.model_type}
+            />
+          )}
+          {run.ranking.length > 0 && (
+            <RankingTable ranking={run.ranking} onSelectModel={handleSelectModel} />
+          )}
+          <ModelDetailDrawer
+            entry={drawerEntry}
+            open={drawerOpen}
+            onOpenChange={setDrawerOpen}
+          />
+          {/* Slice C — decide → train → forecast → interpret → promote. Keyed by
+              selectionId so a fresh run resets the decision state. */}
+          {selectionId && run.winner && (
+            <DecisionSection
+              key={selectionId}
+              selectionId={selectionId}
+              run={run}
+              catalog={catalogQuery.data}
+            />
+          )}
+        </>
+      )}
+    </div>
+  )
+}
diff --git a/frontend/src/types/api.ts b/frontend/src/types/api.ts
index 3c62f684..88a204e1 100644
--- a/frontend/src/types/api.ts
+++ b/frontend/src/types/api.ts
@@ -624,6 +624,15 @@ export interface ChatMessage {
   timestamp: string
 }
 
+/** Response from POST /agents/sessions/{id}/approve (mirrors backend ApprovalResponse). */
+export interface ApprovalResponse {
+  action_id: string
+  approved: boolean
+  /** Execution result on success, or `{ error, error_type }` when execution failed. */
+  result?: unknown
+  status: 'executed' | 'rejected' | 'expired'
+}
+
 export interface ToolCall {
   tool_name: string
   arguments: Record<string, unknown>
@@ -1179,3 +1188,267 @@ export interface ForecastExplanation {
   as_of_date: string // ISO date
   generated_at: string // ISO datetime
 }
+
+// =============================================================================
+// Model Selection (Champion Selector) — backend slice app/features/model_selection
+// =============================================================================
+//
+// The FULL workflow contract is declared here so Slices B/C add BEHAVIOR, not
+// type definitions. Slice A CONSUMES only `ModelCatalogResponse`,
+// `PairAvailability`, and `SplitConfig` (read-only). Everything tagged
+// DECLARED-FOR-LATER is wired by Slice B (async run + results) and Slice C
+// (train / predict / business summary / override / promotion).
+
+export type ModelSelectionStatus =
+  | 'pending'
+  | 'running'
+  | 'completed'
+  | 'partial'
+  | 'failed'
+  | 'cancelled' // Slice B — async cancel terminal state
+export type CandidateStatus =
+  | 'pending'
+  | 'running'
+  | 'completed'
+  | 'failed'
+  | 'cancelled'
+export type RankingMetric = 'wape' | 'smape' | 'mae' | 'bias'
+export type AvailabilityStatus = 'ready' | 'limited' | 'unusable'
+// `ConfidenceLevel` ('high' | 'medium' | 'low') is reused from the
+// Explainability section above — the backend uses the same enum.
+
+// Backtest split config — mirrors `app/features/backtesting/schemas.py`
+// `SplitConfig` EXACTLY (bounds enforced client-side so the assembled run
+// request is always valid for Slice B).
+export type SplitStrategy = 'expanding' | 'sliding'
+export interface SplitConfig {
+  strategy: SplitStrategy // def 'expanding'
+  n_splits: number // 2..20, def 5
+  min_train_size: number // >= 7, def 30
+  gap: number // 0..30, def 0
+  horizon: number // 1..90, def 14; must be > gap; kept === forecast_horizon
+}
+
+// --- CONSUMED in Slice A ---------------------------------------------------
+
+export interface CandidateModelInfo {
+  model_type: string
+  label: string
+  family: ModelFamily
+  feature_aware: boolean
+  /** lightgbm/xgboost — opt-in extra may be absent at runtime. */
+  requires_extra: boolean
+  default_params: Record<string, unknown>
+  /** false for feature-aware models (the predict path rejects them). */
+  supports_auto_predict: boolean
+  description: string
+}
+
+export interface ModelCatalogResponse {
+  models: CandidateModelInfo[]
+  default_candidate_model_types: string[]
+}
+
+export interface PairAvailability {
+  store_id: number
+  product_id: number
+  first_sales_date: string | null
+  last_sales_date: string | null
+  observed_days: number
+  expected_calendar_days: number
+  coverage_ratio: number
+  missing_days: number
+  zero_sale_days: number
+  promotion_days: number | null
+  average_daily_demand: number
+  status: AvailabilityStatus
+  recommended_split_config: SplitConfig
+  warnings: string[]
+}
+
+// --- DECLARED-FOR-LATER (Slices B/C wire behavior on these) ----------------
+
+export interface SelectionWindow {
+  start_date: string // ISO date (inclusive)
+  end_date: string // ISO date (inclusive)
+}
+
+export interface CandidateModelConfig {
+  model_type: string
+  params: Record<string, unknown>
+}
+
+export interface RankingPolicy {
+  minimum_sample_size: number
+  high_confidence_rel_improvement: number
+  max_acceptable_abs_bias: number
+}
+
+export interface ModelSelectionRunRequest {
+  store_id: number
+  product_id: number
+  selection_window: SelectionWindow
+  forecast_horizon: number
+  ranking_metric: RankingMetric
+  split_config: SplitConfig
+  candidate_models: CandidateModelConfig[]
+  feature_frame_version: number // 1 | 2 (Slice A always 1)
+  feature_groups: string[] | null // only valid when feature_frame_version === 2
+  ranking_policy?: RankingPolicy
+  // Slice A sets BOTH false. The async run path (Slice B `POST /runs`) treats
+  // them as NO-OPS, and Slice C owns explicit train/predict — so these two
+  // fields stay false throughout the UI flow and are never surfaced as toggles.
+  auto_train_winner: boolean
+  auto_predict: boolean
+}
+
+export interface ModelRankEntry {
+  rank: number | null
+  model_type: string
+  params: Record<string, unknown>
+  included: boolean
+  exclusion_reason: string | null
+  metrics: Record<string, number> | null
+}
+
+export interface WinnerSummary {
+  model_type: string
+  params: Record<string, unknown>
+  metrics: Record<string, number>
+  rank: number
+}
+
+export interface ModelSelectionChartData {
+  wape_by_model: Record<string, number>
+  bias_by_model: Record<string, number>
+  fold_stability: Record<string, number[]>
+  winner_actual_vs_predicted: unknown[]
+}
+
+export interface ModelSelectionForecastSummary {
+  points: Record<string, unknown>[]
+  total_demand: number
+  average_demand: number
+  horizon: number
+  // Slice C — additive peak/low day (null on legacy snapshots).
+  peak_date?: string | null
+  peak_demand?: number | null
+  low_date?: string | null
+  low_demand?: number | null
+}
+
+// Slice B — live async progress on a selection run.
+export interface CandidateProgress {
+  candidate_id: string
+  ordinal: number
+  model_type: string
+  status: CandidateStatus
+  error: string | null
+  started_at: string | null
+  completed_at: string | null
+  duration_ms: number | null
+}
+
+export interface SelectionProgress {
+  total: number
+  pending: number
+  running: number
+  completed: number
+  failed: number
+  cancelled: number
+}
+
+export interface ModelSelectionRunResponse {
+  selection_id: string
+  store_id: number
+  product_id: number
+  status: ModelSelectionStatus
+  selection_window: SelectionWindow
+  forecast_horizon: number
+  ranking_metric: string
+  availability: PairAvailability | null
+  ranking: ModelRankEntry[]
+  winner: WinnerSummary | null
+  recommendation_confidence: ConfidenceLevel | null
+  confidence_reasons: string[]
+  chart_data: ModelSelectionChartData | null
+  final_model: Record<string, unknown> | null
+  forecast: ModelSelectionForecastSummary | null
+  business_summary: Record<string, unknown> | null
+  error_message: string | null
+  created_at: string // ISO datetime
+  // Slice B — additive async fields (null/empty on a legacy sync `/run` row).
+  started_at?: string | null
+  completed_at: string | null
+  progress?: SelectionProgress | null
+  candidate_progress?: CandidateProgress[]
+}
+
+// Slice B — 202 response from `POST /model-selection/runs` (additive superset).
+export interface SubmitRunResponse extends ModelSelectionRunResponse {
+  monitor_url: string
+  cancel_url: string
+}
+
+// Slice C — forecast decision, override, and promotion contracts.
+
+/** `POST /model-selection/{id}/train-selected` body (override). */
+export interface TrainSelectedRequest {
+  model_type: string
+  override_reason?: string | null
+}
+
+/** Optional `POST /model-selection/{id}/predict` body. */
+export interface ForecastDecisionParams {
+  lead_time_days: number
+  service_level: number
+}
+
+/** Deterministic, labeled inventory-decision heuristic (never feeds ranking). */
+export interface ForecastDecision {
+  method: 'heuristic'
+  lead_time_days: number
+  service_level: number
+  z_value: number
+  sigma_daily_demand: number
+  expected_demand_over_lead_time: number
+  safety_stock: number
+  reorder_point: number
+  bias_risk_text: string
+  caveats: string[]
+}
+
+/** `POST /model-selection/{id}/train-winner` and `/train-selected` response. */
+export interface TrainWinnerResponse {
+  selection_id: string
+  model_type: string
+  model_path: string
+  is_override: boolean
+  override_warning: string | null
+}
+
+/** `POST /model-selection/{id}/predict` response (forecast + decision). */
+export interface PredictWinnerResponse {
+  selection_id: string
+  forecast: ModelSelectionForecastSummary
+  decision: ForecastDecision | null
+}
+
+/** `POST /model-selection/{id}/promote` body (approval-gated). */
+export interface PromoteRequest {
+  alias_name: string
+  approved_by: string
+  acknowledge_non_recommended?: boolean
+  description?: string | null
+}
+
+/** `POST /model-selection/{id}/promote` response. */
+export interface PromoteResponse {
+  selection_id: string
+  alias_name: string
+  run_id: string
+  run_status: string
+  model_type: string
+  is_override: boolean
+  promoted_at: string // ISO datetime
+}
diff --git a/tests/test_e2e_demo.py b/tests/test_e2e_demo.py
index 31d263d4..ac3a5278 100644
--- a/tests/test_e2e_demo.py
+++ b/tests/test_e2e_demo.py
@@ -504,23 +504,31 @@ def test_run_demo_showcase_rich_full_epic(
         f"status={scenario_step['status']!r} detail={scenario_step['detail']!r}"
     )
 
-    # Any OTHER failed step must be an environment-dependent knowledge-phase step
-    # (embedding provider unreachable / misconfigured key) -- those skip
-    # gracefully when the provider is absent (RUNBOOKS 20-22), but a real 401
-    # surfaces as a fail locally. Not the #324 cascade.
-    ENV_DEPENDENT_KNOWLEDGE_STEPS = {"rag_index_subset", "rag_retrieve_probe"}
+    # ---- PR1 (PRP-42, #329) — knowledge phase must never hard-fail -----------
+    # The embedding-provider knowledge steps now SKIP gracefully whether the
+    # provider is truly unreachable OR rejects an invalid/placeholder key (the
+    # 401/403 -> EMBEDDING_AUTH classification, RUNBOOKS 20-22). They may pass
+    # (provider reachable + corpus matches), skip (unreachable / bad key), or
+    # warn (retrieve indexed but found no hits) -- but they must NOT fail.
+    KNOWLEDGE_STEPS = {"rag_index_subset", "rag_retrieve_probe"}
+    for name in KNOWLEDGE_STEPS:
+        step = by_name.get(name)
+        if step is not None:
+            assert step["status"] in {"pass", "skip", "warn"}, (
+                f"{name} must skip/warn gracefully on an unreachable/invalid "
+                f"embedding key (#329), got status={step['status']!r} "
+                f"detail={step['detail']!r}"
+            )
+
+    # No step may hard-fail on showcase_rich now: #324 is fixed and the
+    # knowledge phase skips instead of 401/502-failing. Any fail is a regression.
     failed = [s for s in result["steps"] if s["status"] == "fail"]
-    for step in failed:
-        assert step["step_name"] in ENV_DEPENDENT_KNOWLEDGE_STEPS, (
-            f"unexpected showcase_rich failure (not #324, not env-dependent): "
-            f"{step['step_name']!r} detail={step['detail']!r}"
-        )
-    # With no env-dependent failures, the per-step statuses and the overall
-    # status must agree -- the whole pipeline reports pass.
-    if not failed:
-        assert result["overall_status"] == "pass", (
-            f"no failed steps but overall_status={result['overall_status']!r}"
-        )
+    assert not failed, "unexpected showcase_rich failure(s): " + ", ".join(
+        f"{s['step_name']!r} (detail={s['detail']!r})" for s in failed
+    )
+    assert result["overall_status"] == "pass", (
+        f"no failed steps but overall_status={result['overall_status']!r}"
+    )
 
 
 @pytest.mark.integration