355 changed files with 2591 additions and 34713 deletions
--- a/.cliff.toml
+++ b/.cliff.toml
@ -1,33 +0,0 @@
-[changelog]
-header = "# Changelog\n"
-body = """
-{% if version %}\
-## [{{ version | trim_start_matches(pat="v") }}] - {{ timestamp | date(format="%Y-%m-%d") }}
-{% else %}\
-## [Unreleased]
-{% endif %}\
-{% for group, commits in commits | group_by(attribute="group") %}
-### {{ group | upper_first }}
-{% for commit in commits %}
- {{ commit.message | upper_first }}\
-{% endfor %}
-{% endfor %}\n
-"""
-footer = ""
-trim = true
-
-[git]
-conventional_commits = true
-filter_unconventional = true
-commit_parsers = [
-  { message = "^feat", group = "Features" },
-  { message = "^fix", group = "Bug Fixes" },
-  { message = "^refactor", group = "Refactor" },
-  { message = "^perf", group = "Performance" },
-  { message = "^docs", group = "Documentation" },
-  { message = "^test", group = "Testing" },
-  { message = "^ci", group = "CI/CD" },
-  { message = "^chore", group = "Miscellaneous" },
-]
-filter_commits = false
-tag_pattern = "v[0-9].*"
--- a/.forgejo/workflows/ci.yml
+++ b/.forgejo/workflows/ci.yml
@ -1,30 +0,0 @@
-name: CI
-
-on:
-  push:
-    branches: [main]
-  pull_request:
-    branches: [main]
-
-jobs:
-  test:
-    runs-on: ubuntu-latest
-    steps:
-      - uses: actions/checkout@v4
-
-      - uses: actions/setup-python@v5
-        with:
-          python-version: "3.11"
-          cache: pip
-
-      - name: Install dependencies
-        run: pip install -e ".[dev]"
-
-      - name: Lint (ruff)
-        run: ruff check circuitforge_core/
-
-      - name: Type check (mypy)
-        run: mypy circuitforge_core/ --ignore-missing-imports
-
-      - name: Test
-        run: pytest tests/ -v --tb=short
--- a/.forgejo/workflows/mirror.yml
+++ b/.forgejo/workflows/mirror.yml
@ -1,31 +0,0 @@
-name: Mirror
-
-on:
-  push:
-    branches: [main]
-    tags:
-      - "v*"
-
-jobs:
-  mirror:
-    runs-on: ubuntu-latest
-    steps:
-      - uses: actions/checkout@v4
-        with:
-          fetch-depth: 0
-
-      - name: Mirror to GitHub
-        continue-on-error: true
-        env:
-          GITHUB_MIRROR_TOKEN: ${{ secrets.GITHUB_MIRROR_TOKEN }}
-        run: |
-          git remote add github "https://x-access-token:${GITHUB_MIRROR_TOKEN}@github.com/CircuitForgeLLC/circuitforge-core.git"
-          git push github --mirror
-
-      - name: Mirror to Codeberg
-        continue-on-error: true
-        env:
-          CODEBERG_MIRROR_TOKEN: ${{ secrets.CODEBERG_MIRROR_TOKEN }}
-        run: |
-          git remote add codeberg "https://CircuitForge:${CODEBERG_MIRROR_TOKEN}@codeberg.org/CircuitForge/circuitforge-core.git"
-          git push codeberg --mirror
--- a/.forgejo/workflows/release-pypi.yml
+++ b/.forgejo/workflows/release-pypi.yml
@ -1,66 +0,0 @@
-name: Release — PyPI + Forgejo Packages
-
-# circuitforge-core is MIT — published to both public PyPI and the Circuit-Forge
-# Forgejo Packages index so cf-orch can resolve it from a single --extra-index-url.
-#
-# Required secrets:
-#   PYPI_API_TOKEN      — public PyPI upload token
-#   FORGEJO_PYPI_TOKEN  — Forgejo token with package:write scope
-
-on:
-  push:
-    tags:
-      - "v*"
-
-jobs:
-  release:
-    runs-on: ubuntu-latest
-    steps:
-      - uses: actions/checkout@v4
-        with:
-          fetch-depth: 0
-
-      - uses: actions/setup-python@v5
-        with:
-          python-version: "3.11"
-
-      - name: Build
-        run: |
-          pip install build twine
-          python -m build
-
-      - name: Publish to public PyPI
-        uses: pypa/gh-action-pypi-publish@release/v1
-        with:
-          password: ${{ secrets.PYPI_API_TOKEN }}
-
-      - name: Publish to Forgejo Packages
-        env:
-          TWINE_USERNAME: pypi-token
-          TWINE_PASSWORD: ${{ secrets.FORGEJO_PYPI_TOKEN }}
-          TWINE_REPOSITORY_URL: https://git.opensourcesolarpunk.com/api/packages/Circuit-Forge/pypi
-        run: twine upload dist/*
-
-      - name: Create Forgejo release
-        env:
-          FORGEJO_TOKEN: ${{ secrets.FORGEJO_PYPI_TOKEN }}
-        run: |
-          TAG="${GITHUB_REF_NAME}"
-          EXISTING=$(curl -sf \
-            -H "Authorization: token ${FORGEJO_TOKEN}" \
-            "https://git.opensourcesolarpunk.com/api/v1/repos/Circuit-Forge/circuitforge-core/releases/tags/${TAG}" \
-            2>/dev/null \
-            | python3 -c "import sys,json; print(json.load(sys.stdin).get('id',''))" 2>/dev/null || true)
-          if [ -z "${EXISTING}" ]; then
-            python3 -c "
-          import json
-          print(json.dumps({'tag_name':'${TAG}','name':'${TAG}','draft':False,'prerelease':False}))
-          " | curl -sf -X POST \
-                -H "Authorization: token ${FORGEJO_TOKEN}" \
-                -H "Content-Type: application/json" \
-                "https://git.opensourcesolarpunk.com/api/v1/repos/Circuit-Forge/circuitforge-core/releases" \
-                -d @-
-            echo "Release created for ${TAG}"
-          else
-            echo "Release for ${TAG} already exists (id=${EXISTING}), skipping."
-          fi
--- a/.gitignore
+++ b/.gitignore
@ -5,14 +5,6 @@ __pycache__/
 dist/
 .pytest_cache/
 .superpowers/
-.coverage
-build/
-"<MagicMock*"
-
-# packages/display (Vue/npm)
-node_modules/
-*.tsbuildinfo

 # cf-orch private profiles (commit on personal/heimdall branch only)
 circuitforge_core/resources/profiles/private/
-.worktrees/
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@ -1,381 +0,0 @@
-# Changelog
-
-All notable changes to `circuitforge-core` are documented here.
-Format follows [Keep a Changelog](https://keepachangelog.com/en/1.0.0/).
-Versions follow [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
-
---
-
-## [0.22.0] — 2026-07-10
-
-### Added
-
-**`circuitforge_core.signal_bus`** — generic SSE event publisher for real-time signal streams (MIT, closes #58)
-
- `SignalBus` — publish/subscribe bus for real-time events over Server-Sent Events. One instance per service; `publish()` is thread-safe (safe to call from sync producer threads such as OpenCV, Meshtastic, or PyPubSub callbacks) via `loop.call_soon_threadsafe()`. `subscribe(request)` returns a FastAPI `StreamingResponse` — each subscriber gets an independent bounded `asyncio.Queue` (default 100 events) with oldest-drop-on-overflow, plus a 15s keepalive comment to keep proxies from closing idle connections.
- `SignalEvent` — frozen dataclass (`source`, `kind`, `payload`, auto-populated ISO-8601 UTC `timestamp`) with `to_sse()` wire-format serialization.
- New `signal-bus` extra (`fastapi>=0.110`).
-
-**`circuitforge_core.video.app`** — `POST /caption/upload` endpoint
-
-Accepts a multipart video file upload, writes it to a temp file, captions it via the configured backend, then deletes the temp file. Lets callers without filesystem access to the video-service node (e.g. a product on one host posting to cf-video on another over an SSH tunnel) caption a video without a shared mount. `video-service` extra now also pulls in `python-multipart`, required by FastAPI's `UploadFile` parsing.
-
-### Docs
-
- `mkdocs.yml` — new blue-grey/cyan palette, wired to a central `docs/stylesheets/theme.css` for consistent theme-aware styling across the site (light and dark mode).
-
-**`circuitforge_core.hardware.model_vram_estimate`** — model-to-hardware VRAM fit check (closes #64)
-
-Answers "can this hardware run model X at quantization level Y?" — the missing capability noted against `cf_core.hardware`, which detects available VRAM but had no way to cross-reference model requirements. Queries the HuggingFace Hub API for parameter count (`safetensors.total`) and architecture (`config.json`: `num_hidden_layers`, `hidden_size`, `num_attention_heads`, `num_key_value_heads`), then applies the standard formula: `vram_gb = params * bytes_per_param(quant) + kv_cache_gb(ctx_len, arch) + overhead_gb`. Reference algorithm from [LLMcalc](https://github.com/Raskoll2/LLMcalc) (unlicensed upstream — algorithm reference only, no code copied, no dependency added).
-
- `model_vram_estimate(hf_model_id, quant_level, *, ctx_len=4096, available_vram_mb=None, overhead_gb=0.6, timeout=10.0) -> VramEstimate`
- Supports common quant levels: `fp32`, `fp16`/`bf16`, `int8`/`q8`/`q8_0`, `q6_k`, `q5_k_m`/`q5_0`, `int4`/`q4`/`q4_k_m`/`q4_0`, `q3_k_m`, `q2_k`.
- KV cache sizing accounts for GQA (`num_key_value_heads`); falls back to 0 GB when the model's `config.json` lacks standard architecture fields, rather than failing the whole estimate — weights dominate VRAM use regardless.
- Raises `ModelVramLookupError` on HF Hub API failures or missing safetensors metadata; raises `ValueError` for unrecognized quant levels.
- Application points noted in the ticket: Avocet preflight (verify a checkpoint fits before benchmarking), cf-orch worker assignment (match model to GPU by VRAM fit), Peregrine/Kiwi onboarding wizard ("your GPU has X GB — here are models that will run well").
-
-**`circuitforge_core.retry`** — standard retry/backoff wrapper over `backon` (closes #65)
-
-Standardizes retry/backoff behavior for cf-core modules and products that make external calls, replacing ad-hoc per-product retry loops. Wraps [backon](https://github.com/Llucs/backon) (MIT, zero stdlib dependencies) rather than reimplementing retry logic — chosen over `tenacity`/`backoff` per the eval in #65 for its native async support, built-in circuit breaker/hedging primitives, and a process-wide enable/disable toggle that's ideal for tests.
-
- `on_exception(exception, *, max_tries=3, max_time=30.0, **backon_kwargs)` — decorator with CF's standard defaults (full-jitter exponential backoff); extra kwargs forward to `backon.on_exception` (e.g. `sleep=` for tests, `on_backoff=` for logging hooks).
- `retry(target, *args, exception=Exception, max_tries=3, max_time=30.0, **kwargs)` — call an already-defined callable with the same retry behavior, for use without decorator syntax.
- `disable_retries()` / `enable_retries()` — re-exported `backon` context managers for scoping retry-disable to a test or block.
- `disable_retries_globally()` / `enable_retries_globally()` — re-exported `backon.disable()`/`enable()` process-wide toggles, for a test-suite-level fixture.
- New core dependency: `backon>=4.0`.
- Scope note: only the standalone wrapper module ships in this PR. Wiring it into `llm`, `affiliates`, `reranker`, and `activitypub` (the call sites identified in #65) is left as follow-up work per module, rather than retrofitting `LLMRouter`'s existing fallback-chain error handling in the same change.
-
-**`circuitforge_core.task_bridge`** — shared data contract for pushing tasks into an external scheduler (closes #66)
-
-Kiwi is the pilot consumer, pushing pantry expiry-alert tasks into Ashley Venn's Focus Flow scheduler (AGPL-3.0, external project). To keep AGPL and BSL code from ever sharing a process or artifact, the task data contract lives here in cf-core (MIT); each product implements its own exporter/receiver. Design spec: `circuitforge-plans/shared/superpowers/specs/2026-07-05-focus-flow-task-bridge-design.md`.
-
- `models.py` — `ExternalTask` frozen dataclass: `schema_version`, `source_product`, `external_id`, `title`, `notes`, `due_at` (ISO 8601 UTC), `kind` (always `"flexible"` in v1 — external sources can never inject urgency into another product's UX), `status` (`"active"` / `"cancelled"`). Validates required fields and `kind`/`status` values in `__post_init__`.
- `client.py` — `push_tasks(endpoint, token, tasks)`: thin `httpx` wrapper POSTing a batch as `{"tasks": [...]}` with a bearer token. Raises `TaskBridgeError` on transport failure or non-2xx response. No transport server, no auth/token generation — that lives on the receiving side.
- New `task-bridge` extra (`httpx>=0.27`).
- 19 tests: schema/validation/serialization (no network) plus a contract test against a real local `http.server` instance standing in for Focus Flow's importer, verifying the client emits a conformant payload.
-
-**`circuitforge_core.tasks.dispatch_task` / `get_task_status`** — generic caller/args task dispatch (closes #67)
-
-Pagepiper (and potentially other products copying its pattern) imported `dispatch_task(caller, args) -> task_id` / `get_task_status(task_id) -> dict` from `circuitforge_core.tasks`, expecting a `"product/task_name"` + kwargs-dict interface — neither function existed anywhere, so every call silently hit an `except Exception` fallback to local `BackgroundTasks`, with no visible error. This is a different API shape from the existing VRAM-budgeted `TaskScheduler` (keyed by `task_id`/`job_id`/`params` against a specific SQLite `background_tasks` table), so it's a new module rather than a `TaskScheduler` wrapper.
-
- `register_task_runner(caller, fn)` — register a runnable under a name (e.g. `"pagepiper/ingest_pdf"`) once at product startup.
- `dispatch_task(caller, args)` — runs the registered runnable as `fn(**args)` on a background thread, returns a `task_id` immediately. Raises `LookupError` if `caller` isn't registered — products with an `except Exception: ...` fallback (like pagepiper's `_dispatch_ingest`) keep working unchanged.
- `get_task_status(task_id)` — returns `{"status": "queued"|"running"|"complete"|"error", "progress": int|None, "error": str|None}`. Raises `KeyError` for an unknown `task_id`.
- `reset_dispatch_registry()` — test teardown only.
- **Scope note:** this is the free-tier, in-process, single-node implementation — no cross-node distribution. Routing through the `circuitforge-orch` coordinator (BSL, separate package) would need a new generic task-dispatch endpoint on that coordinator, which doesn't exist today (`circuitforge_orch.client.CFOrchClient` only exposes model/service allocation, not a generic caller/args job queue); that's out of scope for this cf-core-only PR and tracked as follow-up. Consuming products (pagepiper) additionally need to call `register_task_runner()` at startup to benefit — not done here, since that's product-side work in a separate repo.
- 10 tests: unregistered lookup, task_id uniqueness, args passed as kwargs, success/error status transitions, unregister, unknown task_id, status snapshot immutability.
-
---
-
-## [0.20.0] — 2026-05-05
-
-### Fixed / Enhanced
-
-**`circuitforge_core.llm.LLMRouter`** — Pagepiper-driven improvements (closes #59, #60)
-
- **#59 — dict init** (`LLMRouter(config_path: Path | dict)`): `__init__` now accepts an inline config dict in addition to a `Path`. Ingest scripts that construct Ollama URLs from product-specific env vars (e.g. `PAGEPIPER_OLLAMA_URL`) can pass the dict directly without writing a temp file. Passing a dict previously raised `AttributeError: 'dict' object has no attribute 'exists'`. Tests: `test_init_accepts_inline_dict`, `test_init_dict_is_used_directly`.
-
- **#60 — Ollama preflight** (`_check_ollama_model_pulled()`): Before the first `embed()` call on an Ollama backend, `GET /api/tags` is checked to verify the configured embedding model is pulled. If it is not, a `RuntimeError` with an actionable `ollama pull <model>` hint is raised immediately — replacing the opaque `All LLM backends exhausted for embed()` error. Results are cached per base URL for the router's lifetime (one HTTP call, not one per `embed()` invocation). Non-Ollama backends (vLLM, etc.) don't expose `/api/tags` — a non-200 response causes the check to be silently skipped. Tests: `test_embed_raises_actionable_error_when_model_not_pulled`, `test_embed_proceeds_when_model_is_pulled`, `test_embed_skips_preflight_when_tags_endpoint_unavailable`, `test_ollama_tags_cache_is_hit_only_once`.
-
---
-
-## [0.17.0] — 2026-04-27
-
-### Added
-
-**`circuitforge_core.reranker`** — shared reranker module for RAG pipelines across the orchard (MIT, closes #54)
-
-Five adapters covering local and cloud paths:
-
- `adapters/bge.py` — `BGETextReranker`: FlagEmbedding cross-encoder (`BAAI/bge-reranker-*`). Batches all pairs in a single `compute_score()` call via `rerank_batch()`. Thread-safe with internal lock. Free tier.
- `adapters/qwen3.py` — `Qwen3TextReranker`: generative reranker using `AutoModelForCausalLM`. Scores by reading yes/no token logits at the last input position after pre-filling the assistant `<think>\n\n</think>` block — one forward pass per batch, no generation loop. Left-pads for consistent last-token position across batch. Free / Paid tier.
- `adapters/cross_encoder.py` — `CrossEncoderTextReranker`: sentence-transformers `CrossEncoder`. Broader model coverage: `mxbai-rerank-*`, `ms-marco-MiniLM-*`, `jina-reranker-*`. Free tier.
- `adapters/cohere.py` — `CohereTextReranker`: Cohere Rerank API (BYOK cloud path). Reads `COHERE_API_KEY` from env or explicit `api_key=` arg. Restores original candidate order from Cohere's score-sorted response. Paid / BYOK.
- `adapters/remote.py` — `RemoteTextReranker`: HTTP delegate to a cf-reranker service endpoint. `from_cf_orch()` classmethod allocates via cf-orch on demand. `release()` method returns the lease.
- `adapters/mock.py` — `MockTextReranker`: Jaccard-similarity scorer, no model required. Used in tests and `CF_RERANKER_MOCK=1` mode.
-
-`app.py` — `cf-reranker` FastAPI service (port 8011). Managed by cf-orch as a process-type service. Exposes `GET /health` and `POST /rerank`. Defaults to `Qwen3-Reranker-0.6B`.
-
-**Auto cf-orch routing:** `make_reranker()` checks `CF_ORCH_URL` at construction time. When set (cloud deployments), it automatically allocates a `cf-reranker` service via cf-orch and returns a `RemoteTextReranker` — no code changes needed in Kiwi, Peregrine, or Snipe. Local dev (no `CF_ORCH_URL`) falls back to local BGE inference.
-
-**Public API:**
- `rerank(query, candidates, top_n)` — process-level singleton, mock-safe
- `make_reranker(model_id, backend, mock)` — explicit instance
- `reset_reranker()` — test teardown only
- `RerankResult(candidate, score, rank)` — frozen dataclass result type
-
-**`pyproject.toml` extras:** `reranker-bge`, `reranker-qwen3`, `reranker-cross-encoder`, `reranker-cohere`, `reranker-service`
-
-54 tests across all adapters.
-
---
-
-## [0.14.0] — 2026-04-20
-
-### Added
-
-**`circuitforge_core.activitypub`** — ActivityPub actor management, object construction, HTTP Signature signing, delivery, and Lemmy integration (MIT, closes #51)
-
- `actor.py` — `CFActor` frozen dataclass; `generate_rsa_keypair(bits)`; `make_actor()`; `load_actor_from_key_file()`. `to_ap_dict()` produces an ActivityPub Application/Person object and never includes the private key.
- `objects.py` — `make_note()`, `make_offer()`, `make_request()` (CF namespace extension), `make_create()`. All return plain dicts; IDs minted with UUID4. `make_request` uses `https://circuitforge.tech/ns/activitystreams` context extension for the non-AS2 Request type.
- `signing.py` — `sign_headers()` (draft-cavage-http-signatures-08, rsa-sha256; signs `(request-target)`, `host`, `date`, `digest`, `content-type`). `verify_signature()` re-computes Digest from actual body after signature verification to catch body-swap attacks.
- `delivery.py` — `deliver_activity(activity, inbox_url, actor)` — synchronous `requests.post` with signed headers and `Content-Type: application/activity+json`.
- `lemmy.py` — `LemmyConfig` frozen dataclass; `LemmyClient` with `login()`, `resolve_community()` (bare name or `!community@instance` address), `post_to_community()`. Uses Lemmy v0.19+ REST API (JWT auth). `LemmyAuthError` / `LemmyCommunityNotFound` exceptions.
- `inbox.py` — `make_inbox_router(handlers, verify_key_fetcher, path)` — FastAPI APIRouter stub; dispatches by activity type; optional HTTP Signature verification via async `verify_key_fetcher` callback. FastAPI imported at module level with `_FASTAPI_AVAILABLE` guard (avoids annotation-resolution bug with lazy string annotations).
- 105 tests across all six files.
-
-**Key design notes:**
- `inbox` not re-exported from `__init__` — requires fastapi, imported explicitly by products that need it
- Signing Digest + re-verifying digest against body on verify — prevents body-swap attacks even when signature is valid
- `from __future__ import annotations` intentionally omitted in `inbox.py` — FastAPI resolves `Request` annotation against module globals at route registration time
-
---
-
-## [0.13.0] — 2026-04-20
-
-### Added
-
-**`circuitforge_core.preferences.currency`** — per-user currency code preference + formatting utility (MIT, closes #52)
-
- `PREF_CURRENCY_CODE = "currency.code"` — shared store key; all products read from the same path
- `get_currency_code(user_id, store)` — priority fallback: store → `CURRENCY_DEFAULT` env var → `"USD"`
- `set_currency_code(currency_code, user_id, store)` — persists ISO 4217 code, uppercased
- `format_currency(amount, currency_code, locale="en_US")` — uses `babel.numbers.format_currency` when available; falls back to a built-in 30-currency symbol table (no hard babel dependency)
- Symbol table covers: USD, CAD, AUD, NZD, GBP, EUR, CHF, SEK/NOK/DKK, JPY, CNY, KRW, INR, BRL, MXN, ZAR, SGD, HKD, THB, PLN, CZK, HUF, RUB, TRY, ILS, AED, SAR, CLP, COP, ARS, VND, IDR, MYR, PHP
- JPY/KRW/HUF/CLP/COP/VND/IDR format with 0 decimal places per ISO 4217 minor-unit convention
- Exported from `circuitforge_core.preferences` as `currency` submodule
- 30 tests (preference store, env var fallback, format dispatch, symbol table, edge cases)
-
---
-
-## [0.12.0] — 2026-04-20
-
-### Added
-
-**`circuitforge_core.job_quality`** — deterministic trust scorer for job listings (MIT, closes #48)
-
-Pure signal processing module. No LLM calls, no network calls, no file I/O. Fully auditable and independently unit-testable per signal.
-
- `models.py` — `JobListing`, `JobEnrichment`, `SignalResult`, `JobQualityScore` (Pydantic)
- `signals.py` — 12 signal functions with weights: `listing_age` (0.25), `repost_detected` (0.25), `no_salary_transparency` (0.20), `always_open_pattern` (0.20), `staffing_agency` (0.15), `requirement_overload` (0.12), `layoff_news` (0.12), `jd_vagueness` (0.10), `ats_blackhole` (0.10), `high_applicant_count` (0.08), `poor_response_history` (0.08), `weekend_posted` (0.04)
- `scorer.py` — `score_job(listing, enrichment=None) -> JobQualityScore`; trust_score = 1 − clamp(sum(triggered weights), 0, 1); confidence = fraction of signals with available evidence
- Salary transparency enforcement for CO, CA, NY, WA, IL, MA; ATS blackhole detection (Lever, Greenhouse, Workday, iCIMS, Taleo)
- `ALL_SIGNALS` registry for iteration and extension
- 83 tests across models, signals (all 12 individually), and scorer — 100% pass
-
---
-
-## [0.11.0] — 2026-04-20
-
-### Added
-
-**`circuitforge_core.audio`** — shared PCM and audio signal utilities (MIT, numpy-only, closes #50)
-
-Pure signal processing module. No model weights, no HuggingFace, no torch dependency.
-
- `convert.py` — `pcm_to_float32`, `float32_to_pcm`, `bytes_to_float32` (int16 ↔ float32 with correct int16 asymmetry handling)
- `gate.py` — `is_silent`, `rms` (RMS energy gate; default 0.005 threshold extracted from cf-voice)
- `resample.py` — `resample` (scipy `resample_poly` when available; numpy linear interpolation fallback)
- `buffer.py` — `ChunkAccumulator` (window-based chunk collector with `flush`, `reset`, bounds enforcement)
- Replaces hand-rolled equivalents in cf-voice `stt.py` + `context.py`. Also consumed by Sparrow and Linnet.
-
-**`circuitforge_core.musicgen` tests** — 21 tests covering mock backend, factory, and FastAPI app endpoints (closes #49). Module was already implemented; tests were the missing deliverable.
-
-### Fixed
-
-**SQLCipher PRAGMA injection** (closes #45) — `db/base.py` now uses `PRAGMA key=?` parameterized form instead of f-string interpolation. Regression tests added (skipped gracefully when `pysqlcipher3` is not installed).
-
-**`circuitforge_core.text.app`** — early validation on empty `--model` argument: raises `ValueError` with a clear message before reaching the HuggingFace loader. Prevents the cryptic `HFValidationError` surfaced by cf-orch #46 when no model candidates were provided.
-
---
-
-## [0.10.0] — 2026-04-12
-
-### Added
-
-**`circuitforge_core.community`** — shared community signal module (BSL 1.1, closes #44)
-
-Provides the PostgreSQL-backed infrastructure for the cross-product community fine-tuning signal pipeline. Products write signals; the training pipeline reads them.
-
- `CommunityDB` — psycopg2 connection pool with `run_migrations()`. Picks up all `.sql` files from `circuitforge_core/community/migrations/` in filename order. Safe to call on every startup (idempotent `CREATE TABLE IF NOT EXISTS`).
- `CommunityPost` — frozen dataclass capturing a user-authored community post with a snapshot of the originating product item (`element_snapshot` as a tuple of key-value pairs for immutability).
- `SharedStore` — base class for product-specific community stores. Provides typed `pg_read()` and `pg_write()` helpers that products subclass without re-implementing connection management.
- Migration 001: `community_posts` schema (id, product, item_id, pseudonym, title, body, element_snapshot JSONB, created_at).
- Migration 002: `community_reactions` stub (post_id FK, pseudonym, reaction_type, created_at).
- `psycopg2-binary` added to `[community]` optional extras in `pyproject.toml`.
- All community classes exported from `circuitforge_core.community`.
-
---
-
-## [0.9.0] — 2026-04-10
-
-### Added
-
-**`circuitforge_core.text`** — OpenAI-compatible `/v1/chat/completions` endpoint and pipeline crystallization engine.
-
-**`circuitforge_core.pipeline`** — multimodal pipeline with staged output crystallization. Products queue draft outputs for human review before committing.
-
-**`circuitforge_core.stt`** — speech-to-text module. `FasterWhisperBackend` for local transcription via `faster-whisper`. Managed FastAPI app mountable in any product.
-
-**`circuitforge_core.tts`** — text-to-speech module. `ChatterboxTurbo` backend for local synthesis. Managed FastAPI app.
-
-**Accessibility preferences** — `preferences` module extended with structured accessibility fields (motion reduction, high contrast, font size, focus highlight) under `accessibility.*` key path.
-
-**LLM output corrections router** — `make_corrections_router()` for collecting LLM output corrections in any product. Stores corrections in product SQLite for future fine-tuning.
-
---
-
-## [0.8.0] — 2026-04-08
-
-### Added
-
-**`circuitforge_core.vision`** — cf-vision managed service shim. Routes vision inference requests to a local cf-vision worker (moondream2 / SigLIP). Closes #43.
-
-**`circuitforge_core.api.feedback`** — `make_feedback_router()` shared Forgejo issue-filing router. Products mount it under `/api/feedback`; requires `FORGEJO_API_TOKEN`. Closes #30.
-
-**License validation** — `CF_LICENSE_KEY` validation via Heimdall REST API. Products call `validate_license(key, product)` to gate premium features. Closes #26.
-
---
-
-## [0.7.0] — 2026-04-04
-
-### Added
-
-**`circuitforge_core.affiliates`** — affiliate link wrapping module (closes #21)
- `wrap_url(url, retailer, user_id, get_preference)` — resolution order: opt-out → BYOK → CF env var → plain URL
- `AffiliateProgram` frozen dataclass + `register_program()` / `get_program()` registry
- Built-in programs: eBay Partner Network (`EBAY_AFFILIATE_CAMPAIGN_ID`), Amazon Associates (`AMAZON_ASSOCIATES_TAG`)
- `get_disclosure_text(retailer)` — per-retailer tooltip copy + `BANNER_COPY` first-encounter constants
- `get_preference` callable injection for opt-out + BYOK without hard-wiring a storage backend
-
-**`circuitforge_core.preferences`** — preference persistence helpers (closes #22 self-hosted path)
- `LocalFileStore` — YAML-backed single-user preference store (`~/.config/circuitforge/preferences.yaml`)
- `get_user_preference(user_id, path, default, store)` + `set_user_preference(user_id, path, value, store)`
- `PreferenceStore` protocol — Heimdall cloud backend to follow once Heimdall#5 lands
- Dot-path utilities `get_path` / `set_path` (immutable nested dict read/write)
-
---
-
-## [0.5.0] — 2026-04-02
-
-### Added
-
-**`circuitforge_core.manage` — cross-platform product manager** (closes #6)
-
-Replaces bash-only `manage.sh` across all products. Works on Linux, macOS, and Windows natively — no WSL2 or Docker required.
-
- **`ManageConfig`**: reads `manage.toml` from the product root (TOML via stdlib `tomllib`). Falls back to directory name when no config file is present — Docker-only products need zero configuration.
- **Docker mode** (`DockerManager`): wraps `docker compose` (v2 plugin) or `docker-compose` (v1). Auto-detected when Docker is available and a compose file exists. Commands: `start`, `stop`, `restart`, `status`, `logs`, `build`.
- **Native mode** (`NativeManager`): PID-file process management with `platformdirs`-based paths (`AppData` on Windows, `~/.local/share` on Linux/macOS). Cross-platform kill (SIGTERM→SIGKILL on Unix, `taskkill /F` on Windows). Log tailing via polling — no `tail -f`, works everywhere.
- **CLI** (`typer`): `start`, `stop`, `restart`, `status`, `logs`, `build`, `open`, `install-shims`. `--mode auto|docker|native` override.
- **`install-shims`**: writes `manage.sh` (bash, +x) and `manage.ps1` (PowerShell) into the product directory, plus `manage.toml.example`.
- **Entry points**: `python -m circuitforge_core.manage` and `cf-manage` console script.
- **`pyproject.toml`**: `[manage]` optional extras group (`platformdirs`, `typer`).
-
---
-
-## [0.4.0] — 2026-04-02
-
-### Added
-
-**Agent watchdog — coordinator-restart reconnect** (closes #15)
- `NodeStore`: SQLite persistence for known agent nodes (`~/.local/share/circuitforge/cf-orch-nodes.db`); `upsert` on every registration, `prune_stale` removes nodes unseen for 30+ days
- `AgentSupervisor.restore_from_store()`: reloads all previously-known nodes on coordinator startup; nodes start `offline=False` and come online within one heartbeat cycle (~10 s) without touching the agent processes
- `AgentSupervisor.register()` now persists to `NodeStore` on every call
- Agent CLI: one-shot registration replaced with a persistent 30 s reconnect loop (daemon thread); coordinator restart → remote nodes (Navi, Strahl, etc.) reappear automatically with no manual intervention
-
-**Ollama adopt-if-running + configurable health path** (closes #16)
- `ProcessSpec.adopt` (`bool`, default `False`): when `True`, `ServiceManager.start()` probes the health endpoint first and claims the already-running process rather than spawning a new one — designed for system daemons like Ollama
- `ProcessSpec.health_path` (`str`, default `"/health"`): configurable health probe path; Ollama uses `/api/tags`
- `ServiceManager._probe_health()`: shared urllib health check used by both `start()` and `is_running()` for adopt services
- Agent `/services/{service}/start` response includes `adopted: true` when the service was claimed rather than started; coordinator sets instance state to `running` immediately (skips probe loop wait)
- `ServiceInstance.health_path` field; `upsert_instance(health_path=)` kwarg
- Coordinator probe loop uses `inst.health_path` instead of hardcoded `/health`
- `_get_health_path()` helper looks up the ProcessSpec health path from the profile registry
- All GPU profiles (2/4/6/8/16/24 GB + cpu-16/32 GB): `ollama` service now has a `managed:` block with `adopt: true`, `health_path: /api/tags`, port 11434
-
---
-
-## [0.3.0] — 2026-04-02
-
-### Added
-
-**Hardware module** (`circuitforge_core.hardware`) — closes #5
- `detect_hardware()`: probes nvidia-smi / rocm-smi / Apple system_profiler / CPU fallback → `HardwareSpec`
- `select_tier(vram_mb)`: maps physical VRAM to a named `VramTier` (CPU / 2 / 4 / 6 / 8 / 16 / 24 GB)
- `generate_profile(spec)`: converts a `HardwareSpec` + service URLs → `LLMConfig` (llm.yaml-compatible)
- `HardwareSpec`, `LLMBackendConfig`, `LLMConfig` dataclasses
-
-**cf-docuvision service** (`circuitforge_core.resources.docuvision`) — closes #8
- FastAPI HTTP service wrapping ByteDance/Dolphin-v2 (Qwen2.5-VL backbone, ~8 GB VRAM)
- `POST /extract`: accepts `image_b64` or `image_path` + `hint` (auto / table / text / form) → `ExtractResponse`
- Lazy model loading — model stays unloaded until first request
- JSON-structured output with 21 element types; plain-text fallback when model returns unstructured output
- `ProcessSpec` managed blocks wired into all four GPU profiles (6 / 8 / 16 / 24 GB)
- `--gpu-id` flag respected via `CUDA_VISIBLE_DEVICES`
-
-**Documents module** (`circuitforge_core.documents`) — closes #7
- `ingest(image_bytes, hint) → StructuredDocument` — single call for all consumers
- Primary path: cf-docuvision HTTP service; automatic fallback to `LLMRouter` vision; graceful empty doc on total failure
- `StructuredDocument`, `Element`, `ParsedTable` frozen dataclasses with `.headings` / `.paragraphs` convenience properties
- `CF_DOCUVISION_URL` env var for service URL override
- `DocuvisionClient`: reusable HTTP client for cf-docuvision with `is_healthy()` probe
-
-**Coordinator probe loop tests** — closes #13
- 4 async tests for `_run_instance_probe_loop`: healthy transition, timeout eviction, state cleanup, no-URL guard
-
---
-
-## [0.2.0] — 2026-04-02
-
-### Added
-
-**Orchestrator — auto service lifecycle**
- `ServiceRegistry`: in-memory allocation tracker with state machine (`starting → running → idle → stopped`)
- `NodeSelector`: warm-first GPU scoring — prefers nodes already running the requested model, falls back to highest free VRAM
- `/api/services/{service}/allocate` coordinator endpoint: auto-selects best node, starts the llm_server process via agent, returns URL
- `CFOrchClient`: sync + async context managers for coordinator allocation/release
- Idle sweep in `AgentSupervisor`: stops instances that have been idle longer than `idle_stop_after_s` (default 600 s for vllm slot)
- Background health probe loop: coordinator polls all `starting` instances every 5 s via `GET /health`; promotes to `running` on 200, marks `stopped` after 300 s timeout (closes #10)
- Services table in coordinator dashboard HTML
- `idle_stop_after_s` field in service profiles
-
-**LLM Router**
- cf-orch allocation support in `LLMRouter` backends
- VRAM lease acquisition/release wired through scheduler batch workers
-
-**Scheduler**
- cf-orch VRAM lease per batch worker — prevents over-subscription
- `join()` on batch worker threads during shutdown
-
-**HF inference server** (`llm_server.py`)
- Generic HuggingFace `transformers` inference server replacing Ouro/vllm-Docker-specific code
- `ProcessSpec` wiring in agent `service_manager.py`
- Handles transformers 5.x `BatchEncoding` return type from `apply_chat_template`
- Uses `dtype=` kwarg (replaces deprecated `torch_dtype=`)
-
-### Fixed
-
- VRAM pre-flight threshold tightened: coordinator and `NodeSelector` now require full `service_max_mb` free (was `max_mb // 2`), preventing instances from starting on GPUs with insufficient headroom (closes #11 / related)
- `ServiceInstance` now seeded correctly on first `/allocate` call
- TTL sweep, immutability, and service-scoped release correctness in allocation path
- Coordinator logger added for allocation path visibility
-
-### Changed
-
- Removed Ouro/vllm-Docker specifics from llm_server — now a generic HF inference endpoint
-
---
-
-## [0.1.0] — 2026-03-01
-
-### Added
-
- Package scaffold (`circuitforge_core`)
- DB base connection and migration runner
- Generalised tier system with BYOK (bring your own key) and local-vision unlocks
- LLM router extracted from Peregrine (fallback chain, vision-aware, BYOK support)
- Config module and vision router stub
- cf-orch orchestrator: coordinator (port 7700) + agent (port 7701)
- Agent registration + VRAM lease wiring
- Coordinator dashboard (HTML)
--- a/Dockerfile.orch
+++ b/Dockerfile.orch
@ -1,53 +0,0 @@
-# cf-orch coordinator image
-# Includes the coordinator + agent; designed for paid+ multi-node deployments.
-#
-# Usage (coordinator node):
-#   docker run -d \
-#     -p 7700:7700 \
-#     -e HEIMDALL_URL=https://license.circuitforge.tech \
-#     -e HEIMDALL_MIN_TIER=paid \
-#     -e CF_ORCH_AUTH_SECRET=<secret> \
-#     ghcr.io/circuit-forge/cf-orch:latest coordinator
-#
-# Usage (GPU agent node — connects back to coordinator):
-#   docker run -d \
-#     --gpus all \
-#     -e CF_COORDINATOR_URL=http://<coordinator-ip>:7700 \
-#     ghcr.io/circuit-forge/cf-orch:latest agent
-#
-# Environment variables
-# ─────────────────────
-# CF_ORCH_PORT          Coordinator listen port (default: 7700)
-# HEIMDALL_URL          Enable license auth (omit for LAN-only / self-hosted)
-# HEIMDALL_MIN_TIER     Minimum tier required (default: paid)
-# CF_ORCH_AUTH_SECRET   Shared secret with Heimdall /licenses/verify
-# CF_COORDINATOR_URL    Agent mode: coordinator URL to register with
-# CF_AGENT_GPU_IDS      Comma-separated GPU indices for agent (default: 0)
-
-FROM python:3.12-slim
-
-LABEL org.opencontainers.image.source="https://git.opensourcesolarpunk.com/Circuit-Forge/circuitforge-core"
-LABEL org.opencontainers.image.description="cf-orch coordinator and agent for CircuitForge multi-node GPU orchestration"
-LABEL org.opencontainers.image.licenses="BSL-1.1"
-
-WORKDIR /app
-
-# System deps — httpx needs curl for connection reuse; avoid full dev toolchain
-RUN apt-get update && apt-get install -y --no-install-recommends \
-    curl \
-    && rm -rf /var/lib/apt/lists/*
-
-# Install cf-core with the resources extra (coordinator + agent deps)
-COPY pyproject.toml README.md ./
-COPY circuitforge_core/ ./circuitforge_core/
-
-RUN pip install --no-cache-dir ".[resources,manage]"
-
-ENV CF_ORCH_PORT=7700
-EXPOSE 7700
-
-COPY docker/orch-entrypoint.sh /entrypoint.sh
-RUN chmod +x /entrypoint.sh
-
-ENTRYPOINT ["/entrypoint.sh"]
-CMD ["coordinator"]
--- a/21
+++ b/21
@ -1,21 +0,0 @@
-MIT License
-
-Copyright (c) 2026 CircuitForge LLC
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in all
-copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
-SOFTWARE.
--- a/README.md
+++ b/README.md
@ -1,212 +1,23 @@
-<p align="center">
-  <img src="docs/cf-logo.png" alt="CircuitForge logo" width="120" />
-</p>
+# circuitforge-core

-<h1 align="center">circuitforge-core</h1>
+Shared scaffold for CircuitForge products.

-<p align="center">Shared Python scaffold for privacy-first, self-hosted AI tools</p>
+## Modules

-<p align="center">
-  <a href="LICENSE"><img src="https://img.shields.io/badge/license-MIT-green.svg" alt="MIT License" /></a>
-  <img src="https://img.shields.io/badge/version-0.21.0-blue.svg" alt="v0.21.0" />
-  <img src="https://img.shields.io/badge/python-3.11%2B-blue.svg" alt="Python 3.11+" />
-  <a href="https://git.opensourcesolarpunk.com/Circuit-Forge/circuitforge-core"><img src="https://img.shields.io/badge/repo-Forgejo-orange.svg" alt="Forgejo" /></a>
-</p>
-
---
-
-## Why circuitforge-core?
-
- **Local inference first.** The LLM router defaults to Ollama on localhost. Cloud APIs are a configurable fallback, not the default path. No telemetry, no round-trips you didn't ask for.
- **VRAM-aware scheduling.** The task scheduler and resource coordinator track GPU memory across concurrent services, allocate slots before loading models, and evict backends gracefully when VRAM is scarce.
- **Consistent tier system across products.** One `tiers` module handles Free / Paid / Premium / Ultra tiers, BYOK (bring your own key) unlocks, and local-vision capability gates — the same way in every product.
- **Uniform developer experience.** DB migrations, config validation, document ingestion, process management, and preference storage all share a single, tested implementation. Products extend, not reimplement.
-
---
+- `circuitforge_core.db` — SQLite connection factory and migration runner
+- `circuitforge_core.llm` — LLM router with fallback chain
+- `circuitforge_core.tiers` — Tier system with BYOK and local vision unlocks
+- `circuitforge_core.config` — Env validation and .env loader
+- `circuitforge_core.vision` — Vision router stub (v0.2+)
+- `circuitforge_core.wizard` — First-run wizard base class stub
+- `circuitforge_core.pipeline` — Staging queue stub (v0.2+)

 ## Install

 ```bash
-# From PyPI
-pip install circuitforge-core
-
-# Editable install from source (recommended for product development)
-pip install -e /path/to/circuitforge-core
-
-# With optional extras
-pip install circuitforge-core[pdf]                  # PDF/DOCX/OCR document ingestion
-pip install circuitforge-core[vector]               # SQLite-vec vector store
-pip install circuitforge-core[text-transformers]    # Local transformer inference (cf-text)
-pip install circuitforge-core[stt-faster-whisper]   # Speech-to-text via Faster Whisper
-pip install circuitforge-core[tts-chatterbox]       # Text-to-speech via Chatterbox
-pip install circuitforge-core[reranker-qwen3]       # Reranking via Qwen3
-pip install circuitforge-core[video-service]        # Video captioning service (Marlin-2B)
-pip install circuitforge-core[mqtt]                 # MQTT broker client
-pip install circuitforge-core[signal-bus]           # SSE event publisher for real-time signal streams
-pip install circuitforge-core[meshtastic-service]   # Meshtastic mesh radio + MQTT + FastAPI
-pip install circuitforge-core[memory]               # Knowledge graph via mnemo sidecar
-pip install circuitforge-core[task-bridge]          # Push tasks into an external scheduler (e.g. Focus Flow)
-pip install circuitforge-core[community]            # PostgreSQL-backed community store
-pip install circuitforge-core[manage]               # cf-manage CLI (Typer)
-pip install circuitforge-core[dev]                  # All dev dependencies
+pip install -e .
 ```

---
-
-## Modules
-
-| Module | Status | Description |
-|---|---|---|
-| `db` | Implemented | SQLite connection factory and migration runner |
-| `llm` | Implemented | LLM router with priority fallback chain (Ollama, vLLM, Anthropic, OpenAI-compatible) |
-| `tiers` | Implemented | Tier system with BYOK and local-vision unlocks (Free / Paid / Premium) |
-| `config` | Implemented | Env validation and `.env` loader with startup fail-fast |
-| `hardware` | Implemented | GPU/CPU detection, VRAM profiling, backend profile generation |
-| `documents` | Implemented | PDF, DOCX, and image OCR ingestion into `StructuredDocument` |
-| `affiliates` | Implemented | Affiliate URL wrapping with per-user opt-out and env-var fallback |
-| `preferences` | Implemented | User preference store — local YAML with pluggable backend; dot-path get/set |
-| `tasks` | Implemented | VRAM-aware LLM task scheduler; shared slot manager across services; generic caller/args `dispatch_task`/`get_task_status` |
-| `manage` | Implemented | Cross-platform product process manager (Docker and native modes) |
-| `resources` | Implemented | VRAM allocation, eviction engine, GPU profile registry |
-| `text` | Implemented | Text utilities (normalize, chunk, truncate) + local LLM inference service (GGUF/transformers/VLM/classifier backends, multimodal content-block API) |
-| `activitypub` | Implemented | ActivityPub actor, inbox, delivery, and Lemmy federation primitives |
-| `audio` | Implemented | Audio buffer, format conversion, resampling, and VAD (voice activity detection) gate |
-| `stt` | Implemented | Speech-to-text service (Faster Whisper backend) |
-| `tts` | Implemented | Text-to-speech service (Chatterbox backend) |
-| `musicgen` | Implemented | Music generation service (AudioCraft/MusicGen backend) |
-| `video` | Implemented | Video captioning and temporal grounding service (Marlin-2B backend) |
-| `mqtt` | Implemented | Async MQTT client and Meshtastic mesh radio integration (serial + MQTT broker backends) |
-| `reranker` | Implemented | Result reranking — BGE, Qwen3, cross-encoder, and Cohere adapters |
-| `vector` | Implemented | SQLite-vec vector store with pluggable embedding backend |
-| `api` | Implemented | Shared API helpers — corrections and feedback endpoints |
-| `community` | Implemented | Community feed and social store (PostgreSQL-backed) |
-| `platforms` | Implemented | Platform-specific integrations (eBay) |
-| `cloud_session` | Implemented | Cloud session management primitives |
-| `input` | Implemented | Input handling — MediaPipe gesture recognition |
-| `job_quality` | Implemented | Job listing quality scoring and signal extraction |
-| `signal_bus` | Implemented | Generic SSE event publisher for real-time signal streams |
-| `retry` | Implemented | Standard retry/backoff wrapper over `backon` for external-call modules |
-| `task_bridge` | Implemented | Shared data contract + push client for external task schedulers (e.g. Focus Flow) |
-| `vision` | Stub | Vision router (moondream2 / SigLIP dispatch — planned) |
-| `wizard` | Stub | First-run wizard base class — products subclass `BaseWizard` |
-| `pipeline` | Stub | Staging queue base — products provide concrete schema |
-
---
-
-## Vue package: `@circuitforge/display`
-
-Strip-display Vue 3 primitives (`packages/display/`) for products running a secondary 1920×480 landscape / 480×1920 portrait kiosk display (Turnstone, Robin). Published as a **separate npm package**, not part of this Python distribution, so products that don't use it never pull in Vue as a dependency.
-
-```bash
-cd packages/display
-npm install
-npm test    # 37 tests — DisplayLayout, DisplayMetric, DisplayAlert, DisplayMacroButton
-npm run build
-```
-
-See `packages/display/README.md` for the component API and theming.
-
---
-
-## Usage: LLM Router
-
-The LLM router reads a config file at `~/.config/circuitforge/llm.yaml`, tries each backend in fallback order, and skips unreachable or disabled entries transparently.
-
-```python
-from circuitforge_core.llm import LLMRouter
-
-# Auto-detects from env vars when llm.yaml is absent:
-# ANTHROPIC_API_KEY, OPENAI_API_KEY / OPENAI_BASE_URL, OLLAMA_HOST
-router = LLMRouter()
-
-response = router.complete(
-    messages=[{"role": "user", "content": "Summarize this in one sentence."}],
-    system="You are a concise assistant.",
-)
-print(response)
-```
-
-**Example `llm.yaml`** (Ollama local, Anthropic cloud fallback):
-
-```yaml
-fallback_order:
-  - ollama
-  - anthropic
-
-backends:
-  ollama:
-    type: openai_compat
-    enabled: true
-    base_url: http://localhost:11434/v1
-    model: llama3.2:3b
-
-  anthropic:
-    type: anthropic
-    enabled: true
-    model: claude-haiku-4-5-20251001
-    api_key_env: ANTHROPIC_API_KEY
-    supports_images: true
-```
-
---
-
-## Usage: Database + Migrations
-
-```python
-from circuitforge_core.db import get_connection, run_migrations
-from pathlib import Path
-
-# Run product migrations on startup
-run_migrations(db_path=Path("data/app.db"), migrations_dir=Path("db/migrations"))
-
-# Get a connection anywhere in your app
-with get_connection(Path("data/app.db")) as conn:
-    conn.execute("INSERT INTO items (name) VALUES (?)", ("example",))
-```
-
---
-
-## Used by
-
-| Product | Description |
-|---|---|
-| [peregrine](https://git.opensourcesolarpunk.com/Circuit-Forge/peregrine) | Job search — discovery, cover letters, interview prep |
-| [snipe](https://git.opensourcesolarpunk.com/Circuit-Forge/snipe) | Auction sniping — eBay trust scoring, bid timing |
-| [kiwi](https://git.opensourcesolarpunk.com/Circuit-Forge/kiwi) | Pantry tracker with barcode/receipt OCR and recipe suggestions |
-| [avocet](https://git.opensourcesolarpunk.com/Circuit-Forge/avocet) | Email classifier training and benchmark harness |
-| [osprey](https://git.opensourcesolarpunk.com/Circuit-Forge/osprey) | Government hold-line automation |
-| [linnet](https://git.opensourcesolarpunk.com/Circuit-Forge/linnet) | Real-time tone annotation and voice transcription |
-| pagepiper | PDF/rulebook RAG (retrieval-augmented generation) search |
-
---
-
-## Contributing
-
-circuitforge-core is MIT licensed. Contributions are welcome.
-
-```bash
-git clone https://git.opensourcesolarpunk.com/Circuit-Forge/circuitforge-core
-cd circuitforge-core
-pip install -e ".[dev]"
-pytest
-```
-
- New modules belong in `circuitforge_core/<module>/` as a package, not a flat file
- Keep modules focused — extract when a module exceeds 400 lines
- All public functions need type annotations
- Tests live in `tests/` — aim for 80% coverage on new code
- Use `ruff` for linting before submitting a PR
-
-Open issues and PRs at: [git.opensourcesolarpunk.com/Circuit-Forge/circuitforge-core](https://git.opensourcesolarpunk.com/Circuit-Forge/circuitforge-core)
-
---
-
 ## License

-MIT — see [LICENSE](LICENSE).
-
-This is the fully open layer of the CircuitForge stack. Products built on top of circuitforge-core may carry different licenses (BSL 1.1 for AI features, proprietary for fine-tuned weights). The scaffold itself is and will remain MIT.
-
---
-
-Humans own design, architecture, code review, testing, and verification. LLMs are part of our development workflow. [Our positions on LLM use →](https://circuitforge.tech/positions)
+BSL 1.1 — see LICENSE
--- a/circuitforge_core/init.py
+++ b/circuitforge_core/init.py
@ -1,13 +1 @@
-from importlib.metadata import PackageNotFoundError, version
-
-try:
-    __version__ = version("circuitforge-core")
-except PackageNotFoundError:
-    __version__ = "dev"  # running from source without an editable install
-
-try:
-    from circuitforge_core.community import CommunityDB, CommunityPost, SharedStore
-    __all__ = ["CommunityDB", "CommunityPost", "SharedStore"]
-except ImportError:
-    # psycopg2 not installed — install with: pip install circuitforge-core[community]
-    pass
+__version__ = "0.1.0"
--- a/circuitforge_core/activitypub/init.py
+++ b/circuitforge_core/activitypub/init.py
@ -1,55 +0,0 @@
-"""
-circuitforge_core.activitypub — ActivityPub actor management, object construction,
-HTTP Signature signing, delivery, and Lemmy integration.
-
-MIT licensed.
-"""
-
-from circuitforge_core.activitypub.actor import (
-    CFActor,
-    generate_rsa_keypair,
-    load_actor_from_key_file,
-    make_actor,
-)
-from circuitforge_core.activitypub.delivery import deliver_activity
-from circuitforge_core.activitypub.lemmy import (
-    LemmyAuthError,
-    LemmyClient,
-    LemmyCommunityNotFound,
-    LemmyConfig,
-)
-from circuitforge_core.activitypub.objects import (
-    PUBLIC,
-    make_create,
-    make_note,
-    make_offer,
-    make_request,
-)
-from circuitforge_core.activitypub.signing import sign_headers, verify_signature
-
-__all__ = [
-    # Actor
-    "CFActor",
-    "generate_rsa_keypair",
-    "load_actor_from_key_file",
-    "make_actor",
-    # Objects
-    "PUBLIC",
-    "make_note",
-    "make_offer",
-    "make_request",
-    "make_create",
-    # Signing
-    "sign_headers",
-    "verify_signature",
-    # Delivery
-    "deliver_activity",
-    # Lemmy
-    "LemmyConfig",
-    "LemmyClient",
-    "LemmyAuthError",
-    "LemmyCommunityNotFound",
-]
-
-# inbox is optional (requires fastapi) — import it when needed:
-#   from circuitforge_core.activitypub.inbox import make_inbox_router
--- a/circuitforge_core/activitypub/actor.py
+++ b/circuitforge_core/activitypub/actor.py
@ -1,146 +0,0 @@
-"""
-CFActor — ActivityPub actor identity for CircuitForge products.
-
-An actor holds RSA key material and its ActivityPub identity URLs.
-The private key is in-memory only; to_ap_dict() never includes it.
-
-MIT licensed.
-"""
-from __future__ import annotations
-
-from dataclasses import dataclass
-from pathlib import Path
-
-
-@dataclass(frozen=True)
-class CFActor:
-    """ActivityPub actor for a CircuitForge product instance."""
-
-    actor_id: str          # e.g. "https://kiwi.circuitforge.tech/actors/kiwi"
-    username: str
-    display_name: str
-    inbox_url: str
-    outbox_url: str
-    public_key_pem: str
-    private_key_pem: str   # Never included in to_ap_dict()
-    icon_url: str | None = None
-    summary: str | None = None
-
-    def to_ap_dict(self) -> dict:
-        """Return an ActivityPub Person/Application object (public only)."""
-        obj: dict = {
-            "@context": [
-                "https://www.w3.org/ns/activitystreams",
-                "https://w3id.org/security/v1",
-            ],
-            "id": self.actor_id,
-            "type": "Application",
-            "preferredUsername": self.username,
-            "name": self.display_name,
-            "inbox": self.inbox_url,
-            "outbox": self.outbox_url,
-            "publicKey": {
-                "id": f"{self.actor_id}#main-key",
-                "owner": self.actor_id,
-                "publicKeyPem": self.public_key_pem,
-            },
-        }
-        if self.summary:
-            obj["summary"] = self.summary
-        if self.icon_url:
-            obj["icon"] = {
-                "type": "Image",
-                "mediaType": "image/png",
-                "url": self.icon_url,
-            }
-        return obj
-
-
-def generate_rsa_keypair(bits: int = 2048) -> tuple[str, str]:
-    """
-    Generate a new RSA keypair.
-
-    Returns:
-        (private_key_pem, public_key_pem) as PEM-encoded strings.
-    """
-    from cryptography.hazmat.primitives import serialization
-    from cryptography.hazmat.primitives.asymmetric import rsa
-
-    private_key = rsa.generate_private_key(public_exponent=65537, key_size=bits)
-    private_pem = private_key.private_bytes(
-        encoding=serialization.Encoding.PEM,
-        format=serialization.PrivateFormat.PKCS8,
-        encryption_algorithm=serialization.NoEncryption(),
-    ).decode()
-    public_pem = private_key.public_key().public_bytes(
-        encoding=serialization.Encoding.PEM,
-        format=serialization.PublicFormat.SubjectPublicKeyInfo,
-    ).decode()
-    return private_pem, public_pem
-
-
-def make_actor(
-    actor_id: str,
-    username: str,
-    display_name: str,
-    private_key_pem: str,
-    public_key_pem: str,
-    icon_url: str | None = None,
-    summary: str | None = None,
-) -> CFActor:
-    """
-    Construct a CFActor from an existing keypair.
-
-    Inbox and outbox URLs are derived from actor_id by convention:
-      {actor_id}/inbox and {actor_id}/outbox
-    """
-    return CFActor(
-        actor_id=actor_id,
-        username=username,
-        display_name=display_name,
-        inbox_url=f"{actor_id}/inbox",
-        outbox_url=f"{actor_id}/outbox",
-        public_key_pem=public_key_pem,
-        private_key_pem=private_key_pem,
-        icon_url=icon_url,
-        summary=summary,
-    )
-
-
-def load_actor_from_key_file(
-    actor_id: str,
-    username: str,
-    display_name: str,
-    private_key_path: str,
-    icon_url: str | None = None,
-    summary: str | None = None,
-) -> CFActor:
-    """
-    Load a CFActor from a PEM private key file on disk.
-
-    The public key is derived from the private key — no separate public key
-    file is required.
-    """
-    from cryptography.hazmat.primitives import serialization
-    from cryptography.hazmat.primitives.serialization import load_pem_private_key
-
-    pem_bytes = Path(private_key_path).read_bytes()
-    private_key = load_pem_private_key(pem_bytes, password=None)
-    private_pem = private_key.private_bytes(
-        encoding=serialization.Encoding.PEM,
-        format=serialization.PrivateFormat.PKCS8,
-        encryption_algorithm=serialization.NoEncryption(),
-    ).decode()
-    public_pem = private_key.public_key().public_bytes(
-        encoding=serialization.Encoding.PEM,
-        format=serialization.PublicFormat.SubjectPublicKeyInfo,
-    ).decode()
-    return make_actor(
-        actor_id=actor_id,
-        username=username,
-        display_name=display_name,
-        private_key_pem=private_pem,
-        public_key_pem=public_pem,
-        icon_url=icon_url,
-        summary=summary,
-    )
--- a/circuitforge_core/activitypub/delivery.py
+++ b/circuitforge_core/activitypub/delivery.py
@ -1,56 +0,0 @@
-"""
-ActivityPub HTTP delivery — POST a signed activity to a remote inbox.
-
-Synchronous (uses requests). Async callers can wrap in asyncio.to_thread.
-
-MIT licensed.
-"""
-from __future__ import annotations
-
-import json
-from typing import TYPE_CHECKING
-
-import requests
-
-from circuitforge_core.activitypub.signing import sign_headers
-
-if TYPE_CHECKING:
-    from circuitforge_core.activitypub.actor import CFActor
-
-ACTIVITY_CONTENT_TYPE = "application/activity+json"
-
-
-def deliver_activity(
-    activity: dict,
-    inbox_url: str,
-    actor: "CFActor",
-    timeout: float = 10.0,
-) -> requests.Response:
-    """
-    POST a signed ActivityPub activity to a remote inbox.
-
-    The activity dict is serialized to JSON, signed with the actor's private
-    key (HTTP Signatures, rsa-sha256), and delivered via HTTP POST.
-
-    Args:
-        activity:   ActivityPub activity dict (e.g. from make_create()).
-        inbox_url:  Target inbox URL (e.g. "https://lemmy.ml/inbox").
-        actor:      CFActor whose key signs the request.
-        timeout:    Request timeout in seconds.
-
-    Returns:
-        The raw requests.Response. Caller decides retry / error policy.
-
-    Raises:
-        requests.RequestException: On network-level failure.
-    """
-    body = json.dumps(activity).encode()
-    base_headers = {"Content-Type": ACTIVITY_CONTENT_TYPE}
-    signed = sign_headers(
-        method="POST",
-        url=inbox_url,
-        headers=base_headers,
-        body=body,
-        actor=actor,
-    )
-    return requests.post(inbox_url, data=body, headers=signed, timeout=timeout)
--- a/circuitforge_core/activitypub/inbox.py
+++ b/circuitforge_core/activitypub/inbox.py
@ -1,128 +0,0 @@
-"""
-ActivityPub inbox router — FastAPI stub for receiving federated activities.
-
-Products mount this router to handle incoming Create, Follow, Like, Announce,
-and other ActivityPub activities from the Fediverse.
-
-Requires fastapi (optional dep). ImportError is raised with a clear message
-when fastapi is not installed.
-
-NOTE: from __future__ import annotations is intentionally omitted here.
-FastAPI resolves route parameter annotations against module globals at
-definition time; lazy string annotations break the Request injection.
-
-MIT licensed.
-"""
-
-import json as _json
-import re
-from typing import Awaitable, Callable
-
-# Handler type: receives (activity_dict, request_headers) and returns None
-InboxHandler = Callable[[dict, dict], Awaitable[None]]
-
-# FastAPI imports at module level so annotations resolve correctly.
-# Products that don't use the inbox router are not affected by this import
-# since circuitforge_core.activitypub.__init__ does NOT import inbox.
-try:
-    from fastapi import APIRouter, HTTPException, Request
-    from fastapi.responses import JSONResponse
-    _FASTAPI_AVAILABLE = True
-except ImportError:
-    _FASTAPI_AVAILABLE = False
-    # Provide stubs so the module can be imported without fastapi
-    APIRouter = None       # type: ignore[assignment,misc]
-    HTTPException = None   # type: ignore[assignment]
-    Request = None         # type: ignore[assignment]
-    JSONResponse = None    # type: ignore[assignment]
-
-
-def make_inbox_router(
-    handlers: dict[str, InboxHandler] | None = None,
-    verify_key_fetcher: Callable[[str], Awaitable[str | None]] | None = None,
-    path: str = "/inbox",
-) -> "APIRouter":  # type: ignore[name-defined]
-    """
-    Build a FastAPI router that handles ActivityPub inbox POSTs.
-
-    The router:
-    1. Parses the JSON body into an activity dict
-    2. Optionally verifies the HTTP Signature (when verify_key_fetcher is provided)
-    3. Dispatches activity["type"] to the matching handler from *handlers*
-    4. Returns 202 Accepted on success, 400 on bad JSON, 401 on bad signature
-
-    Args:
-        handlers:            Dict mapping activity type strings (e.g. "Create",
-                             "Follow") to async handler callables.
-        verify_key_fetcher:  Async callable that takes a keyId URL and returns the
-                             actor's public key PEM, or None if not found.
-                             When None, signature verification is skipped (dev mode).
-        path:                Inbox endpoint path (default "/inbox").
-
-    Returns:
-        FastAPI APIRouter.
-
-    Example::
-
-        async def on_create(activity: dict, headers: dict) -> None:
-            print("Received Create:", activity)
-
-        router = make_inbox_router(handlers={"Create": on_create})
-        app.include_router(router, prefix="/actors/kiwi")
-    """
-    if not _FASTAPI_AVAILABLE:
-        raise ImportError(
-            "circuitforge_core.activitypub.inbox requires fastapi. "
-            "Install with: pip install fastapi"
-        )
-
-    from circuitforge_core.activitypub.signing import verify_signature
-
-    router = APIRouter()
-    _handlers: dict[str, InboxHandler] = handlers or {}
-
-    @router.post(path, status_code=202)
-    async def inbox_endpoint(request: Request) -> JSONResponse:
-        # Parse body — read bytes first (needed for signature verification),
-        # then decode JSON manually to avoid double-read issues.
-        try:
-            body = await request.body()
-            activity = _json.loads(body)
-        except Exception:
-            raise HTTPException(status_code=400, detail="Invalid JSON body.")
-
-        # Optional signature verification
-        if verify_key_fetcher is not None:
-            sig_header = request.headers.get("Signature", "")
-            key_id = _parse_key_id(sig_header)
-            if not key_id:
-                raise HTTPException(status_code=401, detail="Missing or malformed Signature header.")
-            public_key_pem = await verify_key_fetcher(key_id)
-            if public_key_pem is None:
-                raise HTTPException(status_code=401, detail=f"Unknown keyId: {key_id}")
-            ok = verify_signature(
-                headers=dict(request.headers),
-                method="POST",
-                path=request.url.path,
-                body=body,
-                public_key_pem=public_key_pem,
-            )
-            if not ok:
-                raise HTTPException(status_code=401, detail="Signature verification failed.")
-
-        activity_type = activity.get("type", "")
-        handler = _handlers.get(activity_type)
-        if handler is None:
-            # Unknown types are silently accepted per AP spec — return 202
-            return JSONResponse(status_code=202, content={"status": "accepted", "type": activity_type})
-
-        await handler(activity, dict(request.headers))
-        return JSONResponse(status_code=202, content={"status": "accepted"})
-
-    return router
-
-
-def _parse_key_id(sig_header: str) -> str | None:
-    """Extract keyId value from a Signature header string."""
-    match = re.search(r'keyId="([^"]+)"', sig_header)
-    return match.group(1) if match else None
--- a/circuitforge_core/activitypub/lemmy.py
+++ b/circuitforge_core/activitypub/lemmy.py
@ -1,173 +0,0 @@
-"""
-Lemmy REST API client for posting to Lemmy communities.
-
-Uses JWT authentication (Lemmy v0.19+ API). Does not require ActivityPub
-federation setup — the Lemmy REST API is simpler and more reliable for
-the initial integration.
-
-MIT licensed.
-"""
-from __future__ import annotations
-
-from dataclasses import dataclass
-from typing import Any
-
-import requests
-
-
-class LemmyAuthError(Exception):
-    """Raised when Lemmy login fails."""
-
-
-class LemmyCommunityNotFound(Exception):
-    """Raised when a community cannot be resolved by name."""
-
-
-@dataclass(frozen=True)
-class LemmyConfig:
-    """Connection config for a Lemmy instance."""
-
-    instance_url: str  # e.g. "https://lemmy.ml" (no trailing slash)
-    username: str
-    password: str      # Load from env/config; never hardcode
-
-
-class LemmyClient:
-    """
-    Lemmy REST API client.
-
-    Usage::
-
-        config = LemmyConfig(instance_url="https://lemmy.ml", username="bot", password="...")
-        client = LemmyClient(config)
-        client.login()
-        community_id = client.resolve_community("!cooking@lemmy.world")
-        client.post_to_community(community_id, title="Fresh pesto recipe", body="...")
-    """
-
-    def __init__(self, config: LemmyConfig) -> None:
-        self._config = config
-        self._jwt: str | None = None
-        self._session = requests.Session()
-        self._session.headers.update({"Content-Type": "application/json"})
-
-    @property
-    def _api(self) -> str:
-        return f"{self._config.instance_url.rstrip('/')}/api/v3"
-
-    def _auth_headers(self) -> dict[str, str]:
-        if not self._jwt:
-            raise LemmyAuthError("Not logged in — call login() first.")
-        return {"Authorization": f"Bearer {self._jwt}"}
-
-    def login(self) -> None:
-        """
-        Authenticate with the Lemmy instance and store the JWT.
-
-        Raises:
-            LemmyAuthError: If credentials are rejected or the request fails.
-        """
-        resp = self._session.post(
-            f"{self._api}/user/login",
-            json={"username_or_email": self._config.username, "password": self._config.password},
-            timeout=10,
-        )
-        if resp.status_code != 200:
-            raise LemmyAuthError(
-                f"Lemmy login failed ({resp.status_code}): {resp.text[:200]}"
-            )
-        data = resp.json()
-        token = data.get("jwt")
-        if not token:
-            raise LemmyAuthError("Lemmy login response missing 'jwt' field.")
-        self._jwt = token
-
-    def resolve_community(self, name: str) -> int:
-        """
-        Resolve a community name or address to its numeric Lemmy ID.
-
-        Accepts:
-        - Bare name: "cooking"
-        - Fediverse address: "!cooking@lemmy.world"
-        - Display name search (best-effort)
-
-        Args:
-            name: Community identifier.
-
-        Returns:
-            Numeric community ID.
-
-        Raises:
-            LemmyCommunityNotFound: If not found or multiple matches are ambiguous.
-            LemmyAuthError: If not logged in.
-        """
-        # Strip leading ! for address lookups
-        lookup = name.lstrip("!")
-        resp = self._session.get(
-            f"{self._api}/search",
-            params={"q": lookup, "type_": "Communities", "limit": 5},
-            headers=self._auth_headers(),
-            timeout=10,
-        )
-        if resp.status_code != 200:
-            raise LemmyCommunityNotFound(
-                f"Community search failed ({resp.status_code}): {resp.text[:200]}"
-            )
-        communities = resp.json().get("communities", [])
-        if not communities:
-            raise LemmyCommunityNotFound(f"No communities found for '{name}'.")
-        # Prefer exact actor_id match (e.g. !cooking@lemmy.world)
-        for item in communities:
-            view = item.get("community", {})
-            if "@" in lookup:
-                actor_id: str = view.get("actor_id", "")
-                if lookup.lower() in actor_id.lower():
-                    return int(view["id"])
-            else:
-                if view.get("name", "").lower() == lookup.lower():
-                    return int(view["id"])
-        # Fall back to first result
-        return int(communities[0]["community"]["id"])
-
-    def post_to_community(
-        self,
-        community_id: int,
-        title: str,
-        body: str,
-        url: str | None = None,
-        nsfw: bool = False,
-    ) -> dict[str, Any]:
-        """
-        Create a post in a Lemmy community.
-
-        Args:
-            community_id: Numeric community ID (from resolve_community()).
-            title:        Post title.
-            body:         Markdown post body.
-            url:          Optional external URL to attach.
-            nsfw:         Mark NSFW (default False).
-
-        Returns:
-            Lemmy API response dict (contains 'post_view', etc.).
-
-        Raises:
-            LemmyAuthError: If not logged in.
-            requests.RequestException: On network failure.
-        """
-        payload: dict[str, Any] = {
-            "community_id": community_id,
-            "name": title,
-            "body": body,
-            "nsfw": nsfw,
-        }
-        if url:
-            payload["url"] = url
-
-        resp = self._session.post(
-            f"{self._api}/post",
-            json=payload,
-            headers=self._auth_headers(),
-            timeout=15,
-        )
-        resp.raise_for_status()
-        return resp.json()
--- a/circuitforge_core/activitypub/objects.py
+++ b/circuitforge_core/activitypub/objects.py
@ -1,168 +0,0 @@
-"""
-ActivityStreams 2.0 object constructors.
-
-All functions return plain dicts (no classes) — they are serialized to JSON
-for delivery. IDs are minted with UUID4 so callers don't need to track them.
-
-Custom types:
- "Offer"   — AS2 Offer (Rook exchange offers)
- "Request" — custom CF extension (Rook exchange requests); not in core AS2
-
-MIT licensed.
-"""
-from __future__ import annotations
-
-import uuid
-from datetime import datetime, timezone
-from typing import TYPE_CHECKING
-
-if TYPE_CHECKING:
-    from circuitforge_core.activitypub.actor import CFActor
-
-# AS2 special "Public" collection: addressing an object to it makes it publicly visible
-PUBLIC = "https://www.w3.org/ns/activitystreams#Public"
-
-# Custom context extension for CF-specific types
-_CF_CONTEXT = "https://circuitforge.tech/ns/activitystreams"
-
-
-def _now_iso() -> str:
-    """Return the current UTC time as an ISO 8601 string with a ``Z`` suffix."""
-    utc_stamp = datetime.now(tz=timezone.utc).isoformat()
-    # isoformat() renders UTC as "+00:00"; swap it for the compact "Z" form.
-    return utc_stamp.replace("+00:00", "Z")
-
-
-def _mint_id(actor_id: str, type_slug: str) -> str:
-    """Build a new ID of the form ``{actor_id}/{type_slug}/{uuid4 hex}``."""
-    unique_suffix = uuid.uuid4().hex
-    return f"{actor_id}/{type_slug}/{unique_suffix}"
-
-
-def make_note(
-    actor_id: str,
-    content: str,
-    to: list[str] | None = None,
-    cc: list[str] | None = None,
-    in_reply_to: str | None = None,
-    tag: list[dict] | None = None,
-    published: datetime | None = None,
-) -> dict:
-    """
-    Build an ActivityStreams 2.0 ``Note`` as a plain dict.
-
-    Args:
-        actor_id:    Actor ID URL; stored as ``attributedTo`` and used as the
-                     prefix of the minted note ID.
-        content:     HTML or plain-text body, stored unchanged.
-        to:          Direct recipients; ``[PUBLIC]`` when None.
-        cc:          CC recipients; the key is omitted when empty or None.
-        in_reply_to: URL of the parent note, stored as ``inReplyTo`` when given.
-        tag:         Mention/hashtag tag dicts; omitted when empty or None.
-        published:   Post timestamp; the current UTC time when not given.
-
-    Returns:
-        The Note dict, including a freshly minted ``id``.
-    """
-    if published:
-        timestamp = published.isoformat().replace("+00:00", "Z")
-    else:
-        timestamp = _now_iso()
-
-    recipients = [PUBLIC] if to is None else to
-    note: dict = {
-        "@context": "https://www.w3.org/ns/activitystreams",
-        "id": _mint_id(actor_id, "notes"),
-        "type": "Note",
-        "attributedTo": actor_id,
-        "content": content,
-        "to": recipients,
-        "published": timestamp,
-    }
-
-    # Optional properties are emitted only when they carry a value.
-    optional_fields = (("cc", cc), ("inReplyTo", in_reply_to), ("tag", tag))
-    for key, value in optional_fields:
-        if value:
-            note[key] = value
-    return note
-
-
-def make_offer(
-    actor_id: str,
-    summary: str,
-    content: str,
-    to: list[str] | None = None,
-    cc: list[str] | None = None,
-) -> dict:
-    """
-    Build an AS2 ``Offer`` dict (used for Rook exchange offers).
-
-    ``Offer`` belongs to the core ActivityStreams 2.0 vocabulary, so only the
-    standard context is attached.
-
-    Args:
-        actor_id: Actor ID URL; stored as ``actor`` and used to mint the ID.
-        summary:  Short one-line description (used as title in Lemmy).
-        content:  Full HTML/plain-text description.
-        to:       Recipients; ``[PUBLIC]`` when None.
-        cc:       CC recipients; an empty list when None or empty.
-
-    Returns:
-        The Offer dict with a freshly minted ``id`` and a ``published`` time
-        of now (UTC).
-    """
-    recipients = [PUBLIC] if to is None else to
-    carbon_copies = cc if cc else []
-    offer = {
-        "@context": "https://www.w3.org/ns/activitystreams",
-        "id": _mint_id(actor_id, "offers"),
-        "type": "Offer",
-        "actor": actor_id,
-        "summary": summary,
-        "content": content,
-        "to": recipients,
-        "cc": carbon_copies,
-        "published": _now_iso(),
-    }
-    return offer
-
-
-def make_request(
-    actor_id: str,
-    summary: str,
-    content: str,
-    to: list[str] | None = None,
-    cc: list[str] | None = None,
-) -> dict:
-    """
-    Build a CF-extension ``Request`` dict (used for Rook exchange requests).
-
-    ``Request`` is not a core AS2 type, so the ``@context`` is a list holding
-    the standard AS2 context followed by the CF namespace context.
-
-    Args:
-        actor_id: Actor ID URL; stored as ``actor`` and used to mint the ID.
-        summary:  Short one-line description.
-        content:  Full HTML/plain-text description.
-        to:       Recipients; ``[PUBLIC]`` when None.
-        cc:       CC recipients; an empty list when None or empty.
-
-    Returns:
-        The Request dict with a freshly minted ``id`` and a ``published`` time
-        of now (UTC).
-    """
-    contexts = ["https://www.w3.org/ns/activitystreams", _CF_CONTEXT]
-    recipients = [PUBLIC] if to is None else to
-    carbon_copies = cc if cc else []
-    request = {
-        "@context": contexts,
-        "id": _mint_id(actor_id, "requests"),
-        "type": "Request",
-        "actor": actor_id,
-        "summary": summary,
-        "content": content,
-        "to": recipients,
-        "cc": carbon_copies,
-        "published": _now_iso(),
-    }
-    return request
-
-
-def make_create(actor: "CFActor", obj: dict) -> dict:
-    """
-    Wrap an object dict in an AS2 ``Create`` activity.
-
-    The activity receives its own freshly minted ``id`` and takes its
-    ``actor`` from ``actor.actor_id``. ``@context``, ``to``, ``cc`` and
-    ``published`` are copied from *obj* when present and defaulted otherwise.
-
-    Args:
-        actor: The CFActor originating the Create.
-        obj:   An object dict (Note, Offer, Request, etc.); embedded unchanged
-               under ``object``.
-
-    Returns:
-        The Create activity dict.
-    """
-    default_context = "https://www.w3.org/ns/activitystreams"
-    sender_id = actor.actor_id
-    activity = {
-        # Reuse the object's @context (string or list) so that extension
-        # contexts needed by custom types carry over to the wrapper.
-        "@context": obj.get("@context", default_context),
-        "id": _mint_id(sender_id, "activities"),
-        "type": "Create",
-        "actor": sender_id,
-        "to": obj.get("to", [PUBLIC]),
-        "cc": obj.get("cc", []),
-        "published": obj.get("published", _now_iso()),
-        "object": obj,
-    }
-    return activity
--- a/circuitforge_core/activitypub/signing.py
+++ b/circuitforge_core/activitypub/signing.py
@ -1,197 +0,0 @@
-"""
-HTTP Signatures for ActivityPub (draft-cavage-http-signatures-08).
-
-This is the signing convention used by Mastodon, Lemmy, and the broader
-ActivityPub ecosystem. It is distinct from the newer RFC 9421.
-
-Signing algorithm: rsa-sha256
-Signed headers: (request-target) host date [digest] [content-type]
-Digest header: SHA-256 of request body (when body is present)
-keyId: {actor.actor_id}#main-key
-
-MIT licensed.
-"""
-from __future__ import annotations
-
-import base64
-import hashlib
-import re
-from email.utils import formatdate
-from typing import TYPE_CHECKING
-from urllib.parse import urlparse
-
-if TYPE_CHECKING:
-    from circuitforge_core.activitypub.actor import CFActor
-
-
-def _rfc1123_now() -> str:
-    """Format the current time as an HTTP ``Date`` header value ending in ``GMT``."""
-    http_date = formatdate(timeval=None, localtime=False, usegmt=True)
-    return http_date
-
-
-def _sha256_digest(body: bytes) -> str:
-    """Return the ``Digest`` header value for *body*: ``SHA-256=<base64 hash>``."""
-    encoded_hash = base64.b64encode(hashlib.sha256(body).digest()).decode()
-    return "SHA-256=" + encoded_hash
-
-
-def sign_headers(
-    method: str,
-    url: str,
-    headers: dict,
-    body: bytes | None,
-    actor: "CFActor",  # type: ignore[name-defined]
-) -> dict:
-    """
-    Return a new headers dict with Date, Host, Digest (if body), and Signature added.
-
-    The input *headers* dict is not mutated. Caller-supplied ``Date``/``Host``
-    headers (and ``Digest`` when a body is given) are replaced regardless of
-    their letter case, so the returned dict holds exactly one value for each
-    and that value is the one covered by the signature.
-
-    Args:
-        method:  HTTP method string (e.g. "POST"), case-insensitive.
-        url:     Full request URL.
-        headers: Existing headers dict (Content-Type, etc.).
-        body:    Request body bytes, or None for bodyless requests.
-        actor:   CFActor whose private key signs the request.
-
-    Returns:
-        New dict with the remaining original headers plus Date, Host,
-        Digest (if body), and Signature.
-    """
-    from cryptography.hazmat.primitives import hashes
-    from cryptography.hazmat.primitives.asymmetric import padding
-    from cryptography.hazmat.primitives.serialization import load_pem_private_key
-
-    parsed = urlparse(url)
-    host = parsed.netloc
-    # (request-target) covers the path plus the query string, if any.
-    path = parsed.path or "/"
-    if parsed.query:
-        path = f"{path}?{parsed.query}"
-
-    method_lower = method.lower()
-
-    # Headers generated here. HTTP header names are case-insensitive, so a
-    # caller-supplied "date" or "host" would otherwise sit next to the generated
-    # "Date"/"Host" and the signature could end up covering the stale one.
-    generated = {"date", "host"}
-    if body is not None:
-        generated.add("digest")
-    out = {k: v for k, v in headers.items() if k.lower() not in generated}
-    out["Date"] = _rfc1123_now()
-    out["Host"] = host
-
-    signed_header_names = ["(request-target)", "host", "date"]
-
-    if body is not None:
-        out["Digest"] = _sha256_digest(body)
-        signed_header_names.append("digest")
-
-    # Sign Content-Type however the caller spelled the header name.
-    if any(k.lower() == "content-type" for k in out):
-        signed_header_names.append("content-type")
-
-    # Build the signature string — header names in the spec are lowercase,
-    # but the dict uses Title-Case HTTP convention, so look up case-insensitively.
-    def _ci_get(d: dict, key: str) -> str:
-        for k, v in d.items():
-            if k.lower() == key.lower():
-                return v
-        raise KeyError(key)
-
-    lines = []
-    for name in signed_header_names:
-        if name == "(request-target)":
-            lines.append(f"(request-target): {method_lower} {path}")
-        else:
-            lines.append(f"{name}: {_ci_get(out, name)}")
-
-    signature_string = "\n".join(lines).encode()
-
-    private_key = load_pem_private_key(actor.private_key_pem.encode(), password=None)
-    raw_sig = private_key.sign(signature_string, padding.PKCS1v15(), hashes.SHA256())
-    b64_sig = base64.b64encode(raw_sig).decode()
-
-    key_id = f"{actor.actor_id}#main-key"
-    headers_param = " ".join(signed_header_names)
-
-    out["Signature"] = (
-        f'keyId="{key_id}",'
-        f'algorithm="rsa-sha256",'
-        f'headers="{headers_param}",'
-        f'signature="{b64_sig}"'
-    )
-
-    return out
-
-
-def verify_signature(
-    headers: dict,
-    method: str,
-    path: str,
-    body: bytes | None,
-    public_key_pem: str,
-) -> bool:
-    """
-    Verify an incoming ActivityPub HTTP Signature.
-
-    Returns False on any parse or verification failure — never raises for a
-    malformed request. A non-empty *body* is accepted only when the ``digest``
-    header is among the signed headers and matches the body; otherwise the
-    body would not be bound to the signature at all.
-
-    Args:
-        headers:        Request headers dict (looked up case-insensitively).
-        method:         HTTP method (e.g. "POST").
-        path:           Request path (e.g. "/actors/kiwi/inbox").
-        body:           Raw request body bytes, or None.
-        public_key_pem: PEM-encoded RSA public key of the signing actor.
-
-    Returns:
-        True when the signature (and the body digest, where applicable) checks
-        out, False otherwise.
-    """
-    from cryptography.hazmat.primitives import hashes
-    from cryptography.hazmat.primitives.asymmetric import padding
-    from cryptography.hazmat.primitives.serialization import load_pem_public_key
-
-    try:
-        # Case-insensitive header lookup helper
-        def _get(name: str) -> str | None:
-            name_lower = name.lower()
-            for k, v in headers.items():
-                if k.lower() == name_lower:
-                    return v
-            return None
-
-        sig_header = _get("Signature")
-        if not sig_header:
-            return False
-
-        # Parse Signature header key="value" pairs
-        params: dict[str, str] = {
-            match.group(1): match.group(2)
-            for match in re.finditer(r'(\w+)="([^"]*)"', sig_header)
-        }
-
-        if "signature" not in params or "headers" not in params:
-            return False
-
-        signed_header_names = params["headers"].split()
-        method_lower = method.lower()
-
-        # Rebuild the exact string the sender signed, in the order it declared.
-        lines = []
-        for name in signed_header_names:
-            if name == "(request-target)":
-                lines.append(f"(request-target): {method_lower} {path}")
-            else:
-                val = _get(name)
-                if val is None:
-                    return False
-                lines.append(f"{name}: {val}")
-
-        signature_string = "\n".join(lines).encode()
-        raw_sig = base64.b64decode(params["signature"])
-
-        public_key = load_pem_public_key(public_key_pem.encode())
-        # Raises InvalidSignature on mismatch; handled by the except below.
-        public_key.verify(raw_sig, signature_string, padding.PKCS1v15(), hashes.SHA256())
-
-        # A body is only authenticated through the signed Digest header. If the
-        # sender did not sign it, anyone could swap the body (and the Digest
-        # header with it) without invalidating the signature.
-        if body and "digest" not in {name.lower() for name in signed_header_names}:
-            return False
-
-        # Signing the Digest header proves it wasn't swapped; re-computing it proves
-        # the body wasn't replaced after signing.
-        digest_val = _get("Digest")
-        if digest_val and body is not None:
-            expected = _sha256_digest(body)
-            if digest_val != expected:
-                return False
-
-        return True
-
-    except Exception:
-        # Covers InvalidSignature as well as malformed base64, bad PEM, etc.
-        return False
--- a/circuitforge_core/affiliates/init.py
+++ b/circuitforge_core/affiliates/init.py
@ -1,41 +0,0 @@
-"""Public API for circuitforge_core.affiliates.
-
-Usage::
-
-    from circuitforge_core.affiliates import wrap_url, get_disclosure_text
-
-    # Wrap a URL — env-var mode (no preferences, no opt-out)
-    url = wrap_url("https://www.ebay.com/itm/123", retailer="ebay")
-
-    # Wrap a URL — with preference injection (opt-out + BYOK)
-    url = wrap_url(
-        "https://www.ebay.com/itm/123",
-        retailer="ebay",
-        user_id="u123",
-        get_preference=my_prefs_client.get,
-    )
-
-    # Frontend disclosure tooltip
-    text = get_disclosure_text("ebay")
-
-    # Register a product-specific program at startup
-    register_program(AffiliateProgram(
-        name="My Shop",
-        retailer_key="myshop",
-        env_var="MYSHOP_AFFILIATE_ID",
-        build_url=lambda url, id_: f"{url}?ref={id_}",
-    ))
-"""
-from .disclosure import BANNER_COPY, get_disclosure_text
-from .programs import AffiliateProgram, get_program, register_program, registered_keys
-from .router import wrap_url
-
-__all__ = [
-    "wrap_url",
-    "get_disclosure_text",
-    "BANNER_COPY",
-    "AffiliateProgram",
-    "register_program",
-    "get_program",
-    "registered_keys",
-]
--- a/circuitforge_core/affiliates/disclosure.py
+++ b/circuitforge_core/affiliates/disclosure.py
@ -1,49 +0,0 @@
-"""Affiliate disclosure copy constants.
-
-Follows the plain-language disclosure design from the affiliate links design
-doc. All copy is centralized here so products don't drift out of sync and
-legal/copy review has a single file to audit.
-"""
-from __future__ import annotations
-
-# Per-retailer tooltip copy (shown on hover/tap of affiliate link indicator).
-# Keyed by retailer key; read by get_disclosure_text().
-_TOOLTIP: dict[str, str] = {
-    "ebay": (
-        "Affiliate link — CircuitForge earns a small commission if you purchase "
-        "on eBay. No purchase data is shared with us. [Opt out in Settings]"
-    ),
-    "amazon": (
-        "Affiliate link — CircuitForge earns a small commission if you purchase "
-        "on Amazon. No purchase data is shared with us. [Opt out in Settings]"
-    ),
-}
-
-# Fallback tooltip returned by get_disclosure_text() for any retailer that has
-# no entry in _TOOLTIP.
-_GENERIC_TOOLTIP = (
-    "Affiliate link — CircuitForge may earn a small commission if you purchase. "
-    "No purchase data is shared with us. [Opt out in Settings]"
-)
-
-# First-encounter banner copy (shown once, then preference saved).
-# Keys: "title" and "body" hold the banner text; the "*_label" entries hold
-# the text of the banner's buttons/links.
-BANNER_COPY: dict[str, str] = {
-    "title": "A note on purchase links",
-    "body": (
-        "Some links in this product go to retailers using our affiliate code. "
-        "When you click one, the retailer knows you came from CircuitForge. "
-        "We don't see or store what you buy. The retailer may track your "
-        "purchase — that's between you and them.\n\n"
-        "If you'd rather use plain links with no tracking code, you can opt "
-        "out in Settings."
-    ),
-    "dismiss_label": "Got it",
-    "opt_out_label": "Opt out now",
-    "learn_more_label": "Learn more",
-}
-
-
-def get_disclosure_text(retailer: str) -> str:
-    """Look up the tooltip disclosure copy for *retailer*.
-
-    Retailers without dedicated copy get the generic disclosure text, so the
-    result is never an empty string.
-    """
-    if retailer in _TOOLTIP:
-        return _TOOLTIP[retailer]
-    return _GENERIC_TOOLTIP
--- a/circuitforge_core/affiliates/programs.py
+++ b/circuitforge_core/affiliates/programs.py
@ -1,116 +0,0 @@
-"""Affiliate program definitions and URL builders.
-
-Each ``AffiliateProgram`` knows how to append its affiliate parameters to a
-plain product URL.  Built-in programs (eBay EPN, Amazon Associates) are
-registered at module import time.  Products can register additional programs
-with ``register_program()``.
-
-Affiliate IDs are read from environment variables at call time so they pick
-up values set after process startup (useful in tests).
-"""
-from __future__ import annotations
-
-import os
-from dataclasses import dataclass
-from typing import Callable
-from urllib.parse import parse_qs, urlencode, urlparse, urlunparse
-
-
-@dataclass(frozen=True)
-class AffiliateProgram:
-    """Immutable description of one affiliate program.
-
-    Attributes:
-        name:         Human-readable program name.
-        retailer_key: Key the program is registered and looked up under
-                      (the ``retailer=`` argument of ``wrap_url()``).
-        env_var:      Name of the environment variable holding CF's affiliate ID.
-        build_url:    Callable ``(plain_url, affiliate_id) -> affiliate_url``.
-    """
-
-    name: str
-    retailer_key: str
-    env_var: str
-    build_url: Callable[[str, str], str]
-
-    def cf_affiliate_id(self) -> str | None:
-        """Read CF's affiliate ID from the environment.
-
-        The variable is read on every call. Surrounding whitespace is removed;
-        an unset or blank variable yields None.
-        """
-        raw_value = os.environ.get(self.env_var)
-        if raw_value is None:
-            return None
-        cleaned = raw_value.strip()
-        return cleaned if cleaned else None
-
-
-# ---------------------------------------------------------------------------
-# URL builders
-# ---------------------------------------------------------------------------
-
-def _build_ebay_url(url: str, affiliate_id: str) -> str:
-    """Append eBay Partner Network parameters to a listing URL.
-
-    The parameters are added to the query string: after ``?`` when the URL has
-    no query yet, after ``&`` otherwise. A ``#fragment`` is kept at the very
-    end so the tracking parameters never land inside it.
-
-    Args:
-        url:          Plain eBay listing URL.
-        affiliate_id: Campaign ID, sent as ``campid`` (URL-encoded).
-
-    Returns:
-        The URL with the EPN tracking parameters appended.
-    """
-    params = urlencode({
-        "mkcid": "1",
-        "mkrid": "711-53200-19255-0",
-        "siteid": "0",
-        "campid": affiliate_id,
-        "toolid": "10001",
-        "mkevt": "1",
-    })
-    # Split the fragment off first: anything after '#' is not part of the
-    # query, and a '?' inside the fragment must not influence the separator.
-    base, hash_mark, fragment = url.partition("#")
-    sep = "&" if "?" in base else "?"
-    return f"{base}{sep}{params}{hash_mark}{fragment}"
-
-
-def _build_instacart_url(url: str, affiliate_id: str) -> str:
-    """Append the Instacart affiliate parameter (``aff``) to a search URL.
-
-    The ID is URL-encoded so that a value containing ``&``, ``=`` or ``#``
-    cannot inject extra parameters or truncate the query. A ``#fragment`` is
-    kept at the very end of the result.
-
-    Args:
-        url:          Plain Instacart URL.
-        affiliate_id: Affiliate ID to send as ``aff``.
-
-    Returns:
-        The URL with ``aff=<id>`` added to its query string.
-    """
-    param = urlencode({"aff": affiliate_id})
-    # Insert before the fragment; a '?' inside the fragment is not a query marker.
-    base, hash_mark, fragment = url.partition("#")
-    sep = "&" if "?" in base else "?"
-    return f"{base}{sep}{param}{hash_mark}{fragment}"
-
-
-def _build_amazon_url(url: str, affiliate_id: str) -> str:
-    """Merge an Amazon Associates tag into a product URL's query string.
-
-    Any existing ``tag`` parameter is replaced. All other parameters are kept,
-    including blank values and parameters that occur more than once.
-
-    Args:
-        url:          Plain Amazon product URL.
-        affiliate_id: Associates tag to send as ``tag``.
-
-    Returns:
-        The URL with its query string rebuilt around the new ``tag`` value.
-    """
-    parsed = urlparse(url)
-    qs = parse_qs(parsed.query, keep_blank_values=True)
-    qs["tag"] = [affiliate_id]
-    # doseq=True emits every value of a repeated parameter instead of only the first.
-    new_query = urlencode(qs, doseq=True)
-    return urlunparse(parsed._replace(query=new_query))
-
-
-# ---------------------------------------------------------------------------
-# Registry
-# ---------------------------------------------------------------------------
-
-# Registered programs, keyed by AffiliateProgram.retailer_key.
-_REGISTRY: dict[str, AffiliateProgram] = {}
-
-
-def register_program(program: AffiliateProgram) -> None:
-    """Store *program* under its ``retailer_key``, replacing any earlier entry for that key."""
-    key = program.retailer_key
-    _REGISTRY[key] = program
-
-
-def get_program(retailer_key: str) -> AffiliateProgram | None:
-    """Look up the program registered under *retailer_key*; None when there is none."""
-    if retailer_key in _REGISTRY:
-        return _REGISTRY[retailer_key]
-    return None
-
-
-def registered_keys() -> list[str]:
-    """Return a new list of every registered retailer key, in registration order."""
-    return [key for key in _REGISTRY]
-
-
-# Register built-ins.
-# These calls run at import time, so the three programs below are available
-# from get_program() as soon as this module has been imported.
-
-# eBay: campaign ID is read from EBAY_AFFILIATE_CAMPAIGN_ID.
-register_program(AffiliateProgram(
-    name="eBay Partner Network",
-    retailer_key="ebay",
-    env_var="EBAY_AFFILIATE_CAMPAIGN_ID",
-    build_url=_build_ebay_url,
-))
-
-# Amazon: Associates tag is read from AMAZON_ASSOCIATES_TAG.
-register_program(AffiliateProgram(
-    name="Amazon Associates",
-    retailer_key="amazon",
-    env_var="AMAZON_ASSOCIATES_TAG",
-    build_url=_build_amazon_url,
-))
-
-# Instacart: affiliate ID is read from INSTACART_AFFILIATE_ID.
-register_program(AffiliateProgram(
-    name="Instacart",
-    retailer_key="instacart",
-    env_var="INSTACART_AFFILIATE_ID",
-    build_url=_build_instacart_url,
-))
--- a/circuitforge_core/affiliates/router.py
+++ b/circuitforge_core/affiliates/router.py
@ -1,83 +0,0 @@
-"""Affiliate URL wrapping — resolution logic.
-
-Resolution order (from affiliate links design doc):
-
-  1. User opted out?                          → return plain URL
-  2. User has BYOK ID for this retailer?      → wrap with user's ID
-  3. CF has a program with env var set?       → wrap with CF's ID
-  4. No program / no ID configured            → return plain URL
-
-The ``get_preference`` callable is optional.  When None (default), steps 1
-and 2 are skipped — the module operates in env-var-only mode.  Products
-inject their preferences client to enable opt-out and BYOK.
-
-Signature of ``get_preference``::
-
-    def get_preference(user_id: str | None, path: str, default=None) -> Any: ...
-"""
-from __future__ import annotations
-
-import logging
-from typing import Any, Callable
-
-from .programs import get_program
-
-logger = logging.getLogger(__name__)
-
-GetPreferenceFn = Callable[[str | None, str, Any], Any]
-
-
-def wrap_url(
-    url: str,
-    retailer: str,
-    user_id: str | None = None,
-    get_preference: GetPreferenceFn | None = None,
-) -> str:
-    """Turn *url* into an affiliate URL when one can and should be generated.
-
-    Args:
-        url:            Plain product URL to wrap.
-        retailer:       Retailer key (e.g. ``"ebay"``, ``"amazon"``).
-        user_id:        User identifier for preference lookups. None = anonymous.
-        get_preference: Optional callable ``(user_id, path, default) -> value``
-                        supplied by the product. Without it the opt-out and
-                        BYOK lookups are skipped entirely.
-
-    Returns:
-        The affiliate URL, or *url* unchanged when:
-        - no program is registered for *retailer*,
-        - the user has opted out, or
-        - neither a BYOK ID nor CF's env-var ID is available.
-    """
-    program = get_program(retailer)
-    if program is None:
-        logger.debug("affiliates: no program registered for retailer=%r", retailer)
-        return url
-
-    if get_preference is not None:
-        # Opt-out wins over everything else and also applies to anonymous users.
-        if get_preference(user_id, "affiliate.opt_out", False):
-            logger.debug("affiliates: user %r opted out — returning plain URL", user_id)
-            return url
-
-        # BYOK (Premium): a known user's own affiliate ID beats CF's.
-        if user_id is not None:
-            own_id = get_preference(user_id, f"affiliate.byok_ids.{retailer}", None)
-            if own_id:
-                logger.debug(
-                    "affiliates: using BYOK id for user=%r retailer=%r", user_id, retailer
-                )
-                return program.build_url(url, own_id)
-
-    # Fall back to CF's own ID from the program's environment variable.
-    cf_id = program.cf_affiliate_id()
-    if not cf_id:
-        logger.debug(
-            "affiliates: no affiliate ID configured for retailer=%r (env var %r unset)",
-            retailer, program.env_var,
-        )
-        return url
-    return program.build_url(url, cf_id)
--- a/circuitforge_core/api/init.py
+++ b/circuitforge_core/api/init.py
@ -1,4 +0,0 @@
-from circuitforge_core.api.feedback import make_feedback_router
-from circuitforge_core.api.corrections import make_corrections_router, CORRECTIONS_MIGRATION_SQL
-
-__all__ = ["make_feedback_router", "make_corrections_router", "CORRECTIONS_MIGRATION_SQL"]
--- a/circuitforge_core/api/corrections.py
+++ b/circuitforge_core/api/corrections.py
@ -1,199 +0,0 @@
-"""
-Shared corrections router — stores user corrections to LLM output for SFT training.
-
-Products include this with make_corrections_router(get_db=..., product=...).
-Corrections are stored locally in each product's SQLite DB and exported as JSONL
-for the Avocet SFT pipeline. Separate from the bug-feedback→Forgejo-issue path.
-
-Required DB migration (add to product migrations dir):
-    -- From circuitforge_core.api.corrections import CORRECTIONS_MIGRATION_SQL
-"""
-from __future__ import annotations
-
-import json
-import sqlite3
-from collections.abc import Callable
-from datetime import datetime, timezone
-from typing import Iterator, Literal
-
-from fastapi import APIRouter, Depends, HTTPException
-from fastapi.responses import StreamingResponse
-from pydantic import BaseModel, Field
-
-# Drop this SQL into a product's migrations directory (e.g. 020_corrections.sql).
-# It creates the `corrections` table used by make_corrections_router() plus
-# indexes on the two columns with dedicated indexes below (product, opted_in).
-# All statements use IF NOT EXISTS.
-# `context` holds JSON text (the router writes it with json.dumps) and
-# `opted_in` is stored as 0/1.
-CORRECTIONS_MIGRATION_SQL = """\
-CREATE TABLE IF NOT EXISTS corrections (
-    id               INTEGER PRIMARY KEY AUTOINCREMENT,
-    item_id          TEXT    NOT NULL DEFAULT '',
-    product          TEXT    NOT NULL,
-    correction_type  TEXT    NOT NULL,
-    input_text       TEXT    NOT NULL,
-    original_output  TEXT    NOT NULL,
-    corrected_output TEXT    NOT NULL DEFAULT '',
-    rating           TEXT    NOT NULL DEFAULT 'down',
-    context          TEXT    NOT NULL DEFAULT '{}',
-    opted_in         INTEGER NOT NULL DEFAULT 0,
-    created_at       TEXT    NOT NULL DEFAULT (datetime('now'))
-);
-
-CREATE INDEX IF NOT EXISTS idx_corrections_product
-    ON corrections (product);
-
-CREATE INDEX IF NOT EXISTS idx_corrections_opted_in
-    ON corrections (opted_in);
-"""
-
-
-# Request body for POST on the corrections router.
-class CorrectionRequest(BaseModel):
-    item_id: str = ""
-    # Required in the payload, but submit_correction() stores the product slug
-    # the router was configured with rather than this value.
-    product: str
-    correction_type: str
-    input_text: str
-    original_output: str
-    # Must be non-blank when rating is "down" (enforced in submit_correction()).
-    corrected_output: str = ""
-    rating: Literal["up", "down"] = "down"
-    # Free-form extra data; serialized to JSON text before being stored.
-    context: dict = Field(default_factory=dict)
-    # Stored as 0/1; the export endpoint returns only opted-in rows by default.
-    opted_in: bool = False
-
-
-# Response returned after a correction has been stored.
-class CorrectionResponse(BaseModel):
-    # Row ID of the inserted correction.
-    id: int
-    # submit_correction() always sets this to True on success.
-    saved: bool
-
-
-# One stored correction as returned by the list endpoint; fields mirror the
-# columns of the `corrections` table.
-class CorrectionRecord(BaseModel):
-    id: int
-    item_id: str
-    product: str
-    correction_type: str
-    input_text: str
-    original_output: str
-    corrected_output: str
-    rating: str
-    # Decoded from the JSON text stored in the `context` column.
-    context: dict
-    # Converted from the stored 0/1 integer.
-    opted_in: bool
-    # Timestamp text exactly as stored in the `created_at` column.
-    created_at: str
-
-
-def make_corrections_router(
-    get_db: Callable[[], Iterator[sqlite3.Connection]],
-    product: str,
-) -> APIRouter:
-    """Return a configured corrections APIRouter.
-
-    The router exposes three routes, relative to wherever it is mounted:
-
-    * ``POST ""``       — store one correction.
-    * ``GET ""``        — list stored corrections, newest first.
-    * ``GET "/export"`` — download corrections as JSONL, oldest first.
-
-    Rows are ordered by ``created_at`` with ``id`` as tiebreaker, so rows
-    written within the same second still come back in a stable order.
-
-    Args:
-        get_db: FastAPI dependency that yields a sqlite3.Connection.
-        product: Product slug injected into every correction row (e.g. "linnet").
-
-    Returns:
-        The configured APIRouter.
-    """
-    router = APIRouter()
-
-    @router.post("", response_model=CorrectionResponse)
-    def submit_correction(
-        payload: CorrectionRequest,
-        conn: sqlite3.Connection = Depends(get_db),
-    ) -> CorrectionResponse:
-        """Store a user correction to an LLM output."""
-        # Thumbs-up with no corrected text is a valid positive signal.
-        if payload.rating == "down" and not payload.corrected_output.strip():
-            raise HTTPException(
-                status_code=422,
-                detail="corrected_output is required when rating is 'down'.",
-            )
-
-        # The router's own product slug is stored, not payload.product.
-        row_id = conn.execute(
-            """
-            INSERT INTO corrections
-                (item_id, product, correction_type, input_text, original_output,
-                 corrected_output, rating, context, opted_in)
-            VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?)
-            """,
-            (
-                payload.item_id,
-                product,
-                payload.correction_type,
-                payload.input_text,
-                payload.original_output,
-                payload.corrected_output,
-                payload.rating,
-                json.dumps(payload.context),
-                int(payload.opted_in),
-            ),
-        ).lastrowid
-        conn.commit()
-        return CorrectionResponse(id=row_id, saved=True)
-
-    @router.get("", response_model=list[CorrectionRecord])
-    def list_corrections(
-        opted_in_only: bool = False,
-        limit: int = 200,
-        conn: sqlite3.Connection = Depends(get_db),
-    ) -> list[CorrectionRecord]:
-        """List stored corrections, optionally filtered to opted-in rows only.
-
-        *limit* is clamped to the range 1..1000.
-        """
-        conn.row_factory = sqlite3.Row
-        query = "SELECT * FROM corrections"
-        params: list = []
-        if opted_in_only:
-            query += " WHERE opted_in = 1"
-        # id breaks ties between rows that share a created_at second, which
-        # keeps the LIMIT cut-off deterministic.
-        query += " ORDER BY created_at DESC, id DESC LIMIT ?"
-        params.append(max(1, min(limit, 1000)))
-        rows = conn.execute(query, params).fetchall()
-        return [
-            CorrectionRecord(
-                id=r["id"],
-                item_id=r["item_id"],
-                product=r["product"],
-                correction_type=r["correction_type"],
-                input_text=r["input_text"],
-                original_output=r["original_output"],
-                corrected_output=r["corrected_output"],
-                rating=r["rating"],
-                context=json.loads(r["context"] or "{}"),
-                opted_in=bool(r["opted_in"]),
-                created_at=r["created_at"],
-            )
-            for r in rows
-        ]
-
-    @router.get("/export")
-    def export_corrections(
-        opted_in_only: bool = True,
-        conn: sqlite3.Connection = Depends(get_db),
-    ) -> StreamingResponse:
-        """Stream corrections as JSONL for the Avocet SFT pipeline.
-
-        Each line is a JSON object with the fields expected by avocet's
-        SFT candidate importer. opted_in_only=True (default) — only rows
-        where the user consented to share are exported.
-        """
-        conn.row_factory = sqlite3.Row
-        query = "SELECT * FROM corrections"
-        if opted_in_only:
-            query += " WHERE opted_in = 1"
-        # Same tiebreaker as the list endpoint so repeated exports of the same
-        # data produce identical files.
-        query += " ORDER BY created_at ASC, id ASC"
-        # All rows are fetched before the response is built; the generator
-        # below never touches the connection.
-        rows = conn.execute(query).fetchall()
-
-        timestamp = datetime.now(timezone.utc).strftime("%Y%m%dT%H%M%SZ")
-        filename = f"corrections_{product}_{timestamp}.jsonl"
-
-        def generate() -> Iterator[str]:
-            for r in rows:
-                record = {
-                    "input": r["input_text"],
-                    "output": r["original_output"],
-                    "correction": r["corrected_output"],
-                    "rating": r["rating"],
-                    "correction_type": r["correction_type"],
-                    "product": r["product"],
-                    "item_id": r["item_id"],
-                    "context": json.loads(r["context"] or "{}"),
-                    "created_at": r["created_at"],
-                }
-                yield json.dumps(record, ensure_ascii=False) + "\n"
-
-        return StreamingResponse(
-            generate(),
-            media_type="application/x-ndjson",
-            headers={"Content-Disposition": f'attachment; filename="{filename}"'},
-        )
-
-    return router
--- a/circuitforge_core/api/feedback.py
+++ b/circuitforge_core/api/feedback.py
@ -1,183 +0,0 @@
-"""
-Shared feedback router — creates Forgejo issues from in-app beta feedback.
-Products include this with make_feedback_router(repo=..., product=...).
-"""
-from __future__ import annotations
-
-import os
-import platform
-import subprocess
-from collections.abc import Callable
-from datetime import datetime, timezone
-from pathlib import Path
-from typing import Literal
-
-import requests
-from fastapi import APIRouter, HTTPException
-from pydantic import BaseModel
-
-_LABEL_COLORS: dict[str, str] = {
-    "beta-feedback": "#0075ca",
-    "needs-triage": "#e4e669",
-    "bug": "#d73a4a",
-    "feature-request": "#a2eeef",
-    "question": "#d876e3",
-}
-
-_TYPE_LABEL_MAP: dict[str, str] = {"bug": "bug", "feature": "feature-request"}
-_TYPE_DISPLAY: dict[str, str] = {
-    "bug": "🐛 Bug",
-    "feature": "✨ Feature Request",
-    "other": "💬 Other",
-}
-
-
-class FeedbackRequest(BaseModel):
-    title: str
-    description: str
-    type: Literal["bug", "feature", "other"] = "other"
-    repro: str = ""
-    tab: str = "unknown"
-    submitter: str = ""
-
-
-class FeedbackResponse(BaseModel):
-    issue_number: int
-    issue_url: str
-
-
-def _forgejo_token() -> str:
-    """Return the bot token when set; fall back to the personal API token."""
-    return os.environ.get("FORGEJO_BOT_TOKEN") or os.environ.get("FORGEJO_API_TOKEN", "")
-
-
-def _forgejo_headers() -> dict[str, str]:
-    return {"Authorization": f"token {_forgejo_token()}", "Content-Type": "application/json"}
-
-
-def _ensure_labels(label_names: list[str], base: str, repo: str) -> list[int]:
-    headers = _forgejo_headers()
-    resp = requests.get(f"{base}/repos/{repo}/labels", headers=headers, timeout=10)
-    existing = {lb["name"]: lb["id"] for lb in resp.json()} if resp.ok else {}
-    ids: list[int] = []
-    for name in label_names:
-        if name in existing:
-            ids.append(existing[name])
-        else:
-            r = requests.post(
-                f"{base}/repos/{repo}/labels",
-                headers=headers,
-                json={"name": name, "color": _LABEL_COLORS.get(name, "#ededed")},
-                timeout=10,
-            )
-            if r.ok:
-                ids.append(r.json()["id"])
-            else:
-                raise HTTPException(
-                    status_code=502,
-                    detail=f"Failed to create label '{name}': {r.text[:200]}",
-                )
-    return ids
-
-
-def _collect_context(tab: str, product: str) -> dict[str, str]:
-    try:
-        version = subprocess.check_output(
-            ["git", "describe", "--tags", "--always"],
-            cwd=Path.cwd(),
-            text=True,
-            timeout=5,
-        ).strip()
-    except (subprocess.SubprocessError, OSError):
-        version = "dev"
-    return {
-        "product": product,
-        "tab": tab,
-        "version": version,
-        "platform": platform.platform(),
-        "timestamp": datetime.now(timezone.utc).isoformat().replace("+00:00", "Z"),
-    }
-
-
-def _build_issue_body(payload: FeedbackRequest, context: dict[str, str]) -> str:
-    lines: list[str] = [
-        f"## {_TYPE_DISPLAY.get(payload.type, '💬 Other')}",
-        "",
-        payload.description,
-        "",
-    ]
-    if payload.type == "bug" and payload.repro:
-        lines += ["### Reproduction Steps", "", payload.repro, ""]
-    lines += ["### Context", ""]
-    for k, v in context.items():
-        lines.append(f"- **{k}:** {v}")
-    lines.append("")
-    if payload.submitter:
-        lines += ["---", f"*Submitted by: {payload.submitter}*"]
-    return "\n".join(lines)
-
-
-def make_feedback_router(
-    repo: str,
-    product: str,
-    demo_mode_fn: Callable[[], bool] | None = None,
-) -> APIRouter:
-    """Return a configured feedback APIRouter for the given Forgejo repo and product.
-
-    Args:
-        repo: Forgejo repo slug, e.g. "Circuit-Forge/kiwi".
-        product: Product name injected into issue context, e.g. "kiwi".
-        demo_mode_fn: Optional callable returning True when in demo mode.
-            If None, reads the DEMO_MODE environment variable.
-    """
-
-    def _is_demo() -> bool:
-        if demo_mode_fn is not None:
-            return demo_mode_fn()
-        return os.environ.get("DEMO_MODE", "").lower() in ("1", "true", "yes")
-
-    router = APIRouter()
-
-    @router.get("/status")
-    def feedback_status() -> dict:
-        """Return whether feedback submission is configured on this instance."""
-        return {"enabled": bool(_forgejo_token()) and not _is_demo()}
-
-    @router.post("", response_model=FeedbackResponse)
-    def submit_feedback(payload: FeedbackRequest) -> FeedbackResponse:
-        """File a Forgejo issue from in-app feedback."""
-        token = _forgejo_token()
-        if not token:
-            raise HTTPException(
-                status_code=503,
-                detail="Feedback disabled: FORGEJO_BOT_TOKEN (or FORGEJO_API_TOKEN) not configured.",
-            )
-        if _is_demo():
-            raise HTTPException(status_code=403, detail="Feedback disabled in demo mode.")
-
-        base = os.environ.get(
-            "FORGEJO_API_URL", "https://git.opensourcesolarpunk.com/api/v1"
-        )
-        context = _collect_context(payload.tab, product)
-        body = _build_issue_body(payload, context)
-        labels = [
-            "beta-feedback",
-            "needs-triage",
-            _TYPE_LABEL_MAP.get(payload.type, "question"),
-        ]
-        label_ids = _ensure_labels(labels, base, repo)
-
-        resp = requests.post(
-            f"{base}/repos/{repo}/issues",
-            headers=_forgejo_headers(),
-            json={"title": payload.title, "body": body, "labels": label_ids},
-            timeout=15,
-        )
-        if not resp.ok:
-            raise HTTPException(
-                status_code=502, detail=f"Forgejo error: {resp.text[:200]}"
-            )
-        data = resp.json()
-        return FeedbackResponse(issue_number=data["number"], issue_url=data["html_url"])
-
-    return router
--- a/circuitforge_core/audio/init.py
+++ b/circuitforge_core/audio/init.py
@ -1,29 +0,0 @@
-"""
-circuitforge_core.audio — shared PCM and audio signal utilities.
-
-MIT licensed. No model weights. No HuggingFace. Dependency: numpy only
-(scipy optional for high-quality resampling).
-
-Consumers:
-  cf-voice   — replaces hand-rolled PCM conversion in stt.py / context.py
-  Sparrow    — torchaudio stitching, export, acoustic analysis
-  Avocet     — audio preprocessing for classifier training corpus
-  Linnet     — chunk accumulation for real-time tone annotation
-"""
-from circuitforge_core.audio.convert import (
-    bytes_to_float32,
-    float32_to_pcm,
-    pcm_to_float32,
-)
-from circuitforge_core.audio.gate import is_silent
-from circuitforge_core.audio.resample import resample
-from circuitforge_core.audio.buffer import ChunkAccumulator
-
-__all__ = [
-    "bytes_to_float32",
-    "float32_to_pcm",
-    "pcm_to_float32",
-    "is_silent",
-    "resample",
-    "ChunkAccumulator",
-]
--- a/circuitforge_core/audio/buffer.py
+++ b/circuitforge_core/audio/buffer.py
@ -1,67 +0,0 @@
-"""
-ChunkAccumulator — collect fixed-size audio chunks into a classify window.
-
-Used by cf-voice and Linnet to gather N × 100ms frames before firing
-a classification pass. The window size trades latency against context:
-a 2-second window (20 × 100ms) gives the classifier enough signal to
-detect tone/affect reliably without lagging the conversation.
-"""
-from __future__ import annotations
-
-from collections import deque
-
-import numpy as np
-
-
-class ChunkAccumulator:
-    """Accumulate audio chunks and flush when the window is full.
-
-    Args:
-        window_chunks: Number of chunks to collect before is_ready() is True.
-        dtype:         numpy dtype of the accumulated array. Default float32.
-    """
-
-    def __init__(self, window_chunks: int, *, dtype: np.dtype = np.float32) -> None:
-        if window_chunks < 1:
-            raise ValueError(f"window_chunks must be >= 1, got {window_chunks}")
-        self._window = window_chunks
-        self._dtype = dtype
-        self._buf: deque[np.ndarray] = deque()
-
-    def accumulate(self, chunk: np.ndarray) -> None:
-        """Add a chunk to the buffer. Oldest chunks are dropped once the
-        buffer exceeds window_chunks to bound memory."""
-        self._buf.append(chunk.astype(self._dtype))
-        while len(self._buf) > self._window:
-            self._buf.popleft()
-
-    def is_ready(self) -> bool:
-        """True when window_chunks have been accumulated."""
-        return len(self._buf) >= self._window
-
-    def flush(self) -> np.ndarray:
-        """Concatenate accumulated chunks and reset the buffer.
-
-        Returns:
-            float32 ndarray of concatenated audio.
-
-        Raises:
-            RuntimeError: if fewer than window_chunks have been accumulated.
-        """
-        if not self.is_ready():
-            raise RuntimeError(
-                f"Not enough chunks accumulated: have {len(self._buf)}, "
-                f"need {self._window}. Check is_ready() before calling flush()."
-            )
-        result = np.concatenate(list(self._buf), axis=-1).astype(self._dtype)
-        self._buf.clear()
-        return result
-
-    def reset(self) -> None:
-        """Discard all buffered audio without returning it."""
-        self._buf.clear()
-
-    @property
-    def chunk_count(self) -> int:
-        """Current number of buffered chunks."""
-        return len(self._buf)
--- a/circuitforge_core/audio/convert.py
+++ b/circuitforge_core/audio/convert.py
@ -1,50 +0,0 @@
-"""
-PCM / float32 conversion utilities.
-
-All functions operate on raw audio bytes or numpy arrays. No torch dependency.
-
-Standard pipeline:
-    bytes (int16 PCM) -> float32 ndarray -> signal processing -> bytes (int16 PCM)
-"""
-from __future__ import annotations
-
-import numpy as np
-
-
-def pcm_to_float32(pcm_bytes: bytes, *, dtype: np.dtype = np.int16) -> np.ndarray:
-    """Convert raw PCM bytes to a float32 numpy array in [-1.0, 1.0].
-
-    Args:
-        pcm_bytes: Raw PCM audio bytes.
-        dtype:     Sample dtype of the input. Default: int16 (standard mic input).
-
-    Returns:
-        float32 ndarray, values in [-1.0, 1.0].
-    """
-    scale = np.iinfo(dtype).max
-    return np.frombuffer(pcm_bytes, dtype=dtype).astype(np.float32) / scale
-
-
-def bytes_to_float32(pcm_bytes: bytes) -> np.ndarray:
-    """Alias for pcm_to_float32 with default int16 dtype.
-
-    Matches the naming used in cf-voice context.py for easier migration.
-    """
-    return pcm_to_float32(pcm_bytes)
-
-
-def float32_to_pcm(audio: np.ndarray, *, dtype: np.dtype = np.int16) -> bytes:
-    """Convert a float32 ndarray in [-1.0, 1.0] to raw PCM bytes.
-
-    Clips to [-1.0, 1.0] before scaling to prevent wraparound distortion.
-
-    Args:
-        audio: float32 ndarray, values nominally in [-1.0, 1.0].
-        dtype: Target PCM sample dtype. Default: int16.
-
-    Returns:
-        Raw PCM bytes.
-    """
-    scale = np.iinfo(dtype).max
-    clipped = np.clip(audio, -1.0, 1.0)
-    return (clipped * scale).astype(dtype).tobytes()
--- a/circuitforge_core/audio/gate.py
+++ b/circuitforge_core/audio/gate.py
@ -1,44 +0,0 @@
-"""
-Energy gate — silence detection via RMS amplitude.
-"""
-from __future__ import annotations
-
-import numpy as np
-
-# Default threshold extracted from cf-voice stt.py.
-# Signals below this RMS level are considered silent.
-_DEFAULT_RMS_THRESHOLD = 0.005
-
-
-def is_silent(
-    audio: np.ndarray,
-    *,
-    rms_threshold: float = _DEFAULT_RMS_THRESHOLD,
-) -> bool:
-    """Return True when the audio clip is effectively silent.
-
-    Uses root-mean-square amplitude as the energy estimate. This is a fast
-    frame-level gate — not a VAD model. Use it to skip inference on empty
-    audio frames before they hit a more expensive transcription or
-    classification pipeline.
-
-    Args:
-        audio:         float32 ndarray, values in [-1.0, 1.0].
-        rms_threshold: Clips with RMS below this value are silent.
-                       Default 0.005 is conservative — genuine speech at
-                       normal mic levels sits well above this.
-
-    Returns:
-        True if silent, False if the clip contains meaningful signal.
-    """
-    if audio.size == 0:
-        return True
-    rms = float(np.sqrt(np.mean(audio.astype(np.float32) ** 2)))
-    return rms < rms_threshold
-
-
-def rms(audio: np.ndarray) -> float:
-    """Return the RMS amplitude of an audio array."""
-    if audio.size == 0:
-        return 0.0
-    return float(np.sqrt(np.mean(audio.astype(np.float32) ** 2)))
--- a/circuitforge_core/audio/resample.py
+++ b/circuitforge_core/audio/resample.py
@ -1,39 +0,0 @@
-"""
-Audio resampling — change sample rate of a float32 audio array.
-
-Uses scipy.signal.resample_poly when available (high-quality, anti-aliased).
-Falls back to linear interpolation via numpy when scipy is absent — acceptable
-for 16kHz speech but not for music.
-"""
-from __future__ import annotations
-
-import numpy as np
-
-
-def resample(audio: np.ndarray, from_hz: int, to_hz: int) -> np.ndarray:
-    """Resample audio from one sample rate to another.
-
-    Args:
-        audio:   float32 ndarray, shape (samples,) or (channels, samples).
-        from_hz: Source sample rate in Hz.
-        to_hz:   Target sample rate in Hz.
-
-    Returns:
-        Resampled float32 ndarray at to_hz.
-    """
-    if from_hz == to_hz:
-        return audio.astype(np.float32)
-
-    try:
-        from scipy.signal import resample_poly  # type: ignore[import]
-        from math import gcd
-        g = gcd(from_hz, to_hz)
-        up, down = to_hz // g, from_hz // g
-        return resample_poly(audio.astype(np.float32), up, down, axis=-1)
-    except ImportError:
-        # Numpy linear interpolation fallback — lower quality but no extra deps.
-        # Adequate for 16kHz ↔ 8kHz conversion on speech; avoid for music.
-        n_out = int(len(audio) * to_hz / from_hz)
-        x_old = np.linspace(0, 1, len(audio), endpoint=False)
-        x_new = np.linspace(0, 1, n_out, endpoint=False)
-        return np.interp(x_new, x_old, audio.astype(np.float32)).astype(np.float32)
--- a/circuitforge_core/cloud_session/init.py
+++ b/circuitforge_core/cloud_session/init.py
@ -1,365 +0,0 @@
-"""
-circuitforge_core.cloud_session — shared cloud session resolution for all CF products.
-
-Usage (FastAPI product):
-
-    from circuitforge_core.cloud_session import CloudSessionFactory
-    from pathlib import Path
-
-    _sessions = CloudSessionFactory(
-        product="avocet",
-        local_db=Path("data/avocet.db"),
-    )
-    get_session = _sessions.dependency()
-    require_tier = _sessions.require_tier
-
-    @router.get("/api/imitate")
-    def imitate(session: CloudUser = Depends(get_session)):
-        # session.user_id is the Directus UUID for cloud users, "local" for self-hosted
-        ...
-
-Environment variables (set per-product via .env / compose):
-    CLOUD_MODE              1/true/yes to enable cloud auth (default: off)
-    CLOUD_DATA_ROOT         Root directory for per-user data (default: /devl/<product>-cloud-data)
-    DIRECTUS_JWT_SECRET     HS256 secret used to sign cf_session JWTs (required in cloud mode)
-    HEIMDALL_URL            License server base URL (default: https://license.circuitforge.tech)
-    HEIMDALL_ADMIN_TOKEN    Heimdall admin bearer token (required for tier resolution)
-    CF_SERVER_SECRET        Server-side secret for deriving per-user encryption keys
-    CLOUD_AUTH_BYPASS_IPS   Comma-separated IPs/CIDRs to skip JWT auth (dev LAN only)
-"""
-from __future__ import annotations
-
-import ipaddress
-import logging
-import os
-import re
-import time
-import uuid
-from dataclasses import dataclass, field
-from pathlib import Path
-from typing import Any, Callable
-
-try:
-    from starlette.requests import Request as _Request
-    from starlette.responses import Response as _Response
-except ImportError:  # pragma: no cover — starlette may be absent in non-web envs
-    _Request = Any  # type: ignore[assignment,misc]
-    _Response = Any  # type: ignore[assignment,misc]
-
-log = logging.getLogger(__name__)
-
-TIERS: list[str] = ["free", "paid", "premium", "ultra"]
-
-# ── CloudUser ─────────────────────────────────────────────────────────────────
-
-
-@dataclass(frozen=True)
-class CloudUser:
-    """Resolved user identity for one HTTP request.
-
-    user_id:  Directus UUID for authenticated cloud users.
-              "local"          for self-hosted / CLOUD_MODE=false.
-              "local-dev"      for dev-bypass-IP sessions.
-              "anon-<uuid>"    for unauthenticated guest visitors.
-    tier:     free | paid | premium | ultra | local
-    product:  Which CF product this session belongs to (e.g. "avocet").
-    meta:     Product-specific extras (e.g. household_id for Kiwi).
-              Access via session.meta.get("household_id").
-    """
-    user_id: str
-    tier: str
-    product: str
-    has_byok: bool = False
-    meta: dict[str, Any] = field(default_factory=dict)
-
-
-# ── Helpers ───────────────────────────────────────────────────────────────────
-
-
-def _parse_bypass_nets(raw: str) -> tuple[list[ipaddress.IPv4Network | ipaddress.IPv6Network], frozenset[str]]:
-    nets: list[ipaddress.IPv4Network | ipaddress.IPv6Network] = []
-    ips: set[str] = set()
-    for entry in (e.strip() for e in raw.split(",") if e.strip()):
-        try:
-            nets.append(ipaddress.ip_network(entry, strict=False))
-        except ValueError:
-            ips.add(entry)
-    return nets, frozenset(ips)
-
-
-def _is_bypass_ip(
-    ip: str,
-    nets: list[ipaddress.IPv4Network | ipaddress.IPv6Network],
-    ips: frozenset[str],
-) -> bool:
-    if not ip or (not nets and not ips):
-        return False
-    if ip in ips:
-        return True
-    try:
-        addr = ipaddress.ip_address(ip)
-        return any(addr in net for net in nets)
-    except ValueError:
-        return False
-
-
-def _extract_session_token(header_value: str) -> str:
-    """Pull cf_session value out of a raw Cookie header or return the value as-is."""
-    m = re.search(r'(?:^|;)\s*cf_session=([^;]+)', header_value)
-    return m.group(1).strip() if m else header_value.strip()
-
-
-# ── CloudSessionFactory ───────────────────────────────────────────────────────
-
-
-class CloudSessionFactory:
-    """Per-product session factory. Instantiate once at module level.
-
-    Args:
-        product:          Product code string (e.g. "avocet", "kiwi").
-        extra_meta:       Optional async-or-sync callable that receives
-                          (user_id: str, tier: str) and returns a dict merged
-                          into CloudUser.meta.  Use for product-specific fields
-                          like household_id.
-        byok_detector:    Callable() → bool.  Override to detect BYOK for this
-                          product's config path.  Default: always False.
-    """
-
-    def __init__(
-        self,
-        product: str,
-        extra_meta: Callable[[str, str], dict[str, Any]] | None = None,
-        byok_detector: Callable[[], bool] | None = None,
-    ) -> None:
-        self.product = product
-        self._extra_meta = extra_meta
-        self._byok_detector = byok_detector or (lambda: False)
-
-        # Config — read from environment at construction time so tests can patch env
-        self._cloud_mode: bool = os.environ.get("CLOUD_MODE", "").lower() in ("1", "true", "yes")
-        self._directus_secret: str = os.environ.get("DIRECTUS_JWT_SECRET", "")
-        self._heimdall_url: str = os.environ.get("HEIMDALL_URL", "https://license.circuitforge.tech")
-        self._heimdall_token: str = os.environ.get("HEIMDALL_ADMIN_TOKEN", "")
-        self._cloud_data_root: Path = Path(
-            os.environ.get("CLOUD_DATA_ROOT", f"/devl/{product}-cloud-data")
-        )
-
-        _bypass_raw = os.environ.get("CLOUD_AUTH_BYPASS_IPS", "")
-        self._bypass_nets, self._bypass_ips = _parse_bypass_nets(_bypass_raw)
-
-        # Tier resolution cache: {user_id: (result_dict, timestamp)}
-        self._tier_cache: dict[str, tuple[dict, float]] = {}
-        self._tier_cache_ttl: float = 300.0  # 5 minutes
-
-    # ── JWT ───────────────────────────────────────────────────────────────────
-
-    def validate_jwt(self, token: str) -> str:
-        """Validate a cf_session JWT and return the Directus user_id. Raises HTTPException on failure."""
-        try:
-            import jwt as pyjwt  # lazy — not needed in local mode
-            from fastapi import HTTPException
-            payload = pyjwt.decode(
-                token,
-                self._directus_secret,
-                algorithms=["HS256"],
-                options={"require": ["id", "exp"]},
-            )
-            return payload["id"]
-        except Exception as exc:
-            log.debug("JWT validation failed: %s", exc)
-            from fastapi import HTTPException
-            raise HTTPException(status_code=401, detail="Session invalid or expired")
-
-    # ── Heimdall ──────────────────────────────────────────────────────────────
-
-    def _ensure_provisioned(self, user_id: str) -> None:
-        if not self._heimdall_token:
-            return
-        try:
-            import requests
-            requests.post(
-                f"{self._heimdall_url}/admin/provision",
-                json={"directus_user_id": user_id, "product": self.product, "tier": "free"},
-                headers={"Authorization": f"Bearer {self._heimdall_token}"},
-                timeout=5,
-            )
-        except Exception as exc:
-            log.warning("Heimdall provision failed for user %s: %s", user_id, exc)
-
-    def _resolve_tier(self, user_id: str) -> dict[str, Any]:
-        """Returns dict with keys: tier, license_key (and any product extras)."""
-        now = time.monotonic()
-        cached = self._tier_cache.get(user_id)
-        if cached and (now - cached[1]) < self._tier_cache_ttl:
-            return cached[0]
-
-        result: dict[str, Any] = {"tier": "free", "license_key": None}
-        if self._heimdall_token:
-            try:
-                import requests
-                resp = requests.post(
-                    f"{self._heimdall_url}/admin/cloud/resolve",
-                    json={"directus_user_id": user_id, "product": self.product},
-                    headers={"Authorization": f"Bearer {self._heimdall_token}"},
-                    timeout=5,
-                )
-                if resp.ok:
-                    data = resp.json()
-                    result["tier"] = data.get("tier", "free")
-                    result["license_key"] = data.get("key_display")
-                    # Forward any extra fields Heimdall returns (household_id etc.)
-                    result.update({k: v for k, v in data.items() if k not in result})
-            except Exception as exc:
-                log.warning("Heimdall tier resolve failed for %s: %s", user_id, exc)
-        else:
-            log.debug("HEIMDALL_ADMIN_TOKEN not set — defaulting tier to free")
-
-        self._tier_cache[user_id] = (result, now)
-        return result
-
-    # ── Guest sessions ────────────────────────────────────────────────────────
-
-    _GUEST_COOKIE = "cf_guest_id"
-    _GUEST_COOKIE_MAX_AGE = 60 * 60 * 24 * 90  # 90 days
-
-    def _resolve_guest(self, request: Any, response: Any) -> CloudUser:
-        guest_id = (request.cookies.get(self._GUEST_COOKIE) or "").strip()
-        if not guest_id:
-            guest_id = str(uuid.uuid4())
-        is_https = request.headers.get("x-forwarded-proto", "http").lower() == "https"
-        response.set_cookie(
-            key=self._GUEST_COOKIE,
-            value=guest_id,
-            max_age=self._GUEST_COOKIE_MAX_AGE,
-            httponly=True,
-            samesite="lax",
-            secure=is_https,
-        )
-        return CloudUser(
-            user_id=f"anon-{guest_id}",
-            tier="free",
-            product=self.product,
-            has_byok=self._byok_detector(),
-        )
-
-    # ── Core resolver ─────────────────────────────────────────────────────────
-
-    def resolve(self, request: Any, response: Any) -> CloudUser:
-        """Resolve the CloudUser for a FastAPI request. Suitable as a Depends() target."""
-        has_byok = self._byok_detector()
-
-        if not self._cloud_mode:
-            return CloudUser(user_id="local", tier="local", product=self.product, has_byok=has_byok)
-
-        client_ip = (
-            request.headers.get("x-real-ip", "")
-            or (request.client.host if request.client else "")
-        )
-        is_bypass = _is_bypass_ip(client_ip, self._bypass_nets, self._bypass_ips)
-
-        raw_session = (
-            request.headers.get("x-cf-session", "").strip()
-            or request.cookies.get("cf_session", "").strip()
-        )
-
-        # Bypass IPs skip the JWT *requirement* but not JWT *validation*.
-        # If a token is present (dev is logged in), honour it so they land on
-        # their own account DB rather than the shared local-dev DB.
-        if not raw_session:
-            if is_bypass:
-                log.debug("Bypass IP %s, no token — returning local-dev session for product %s", client_ip, self.product)
-                return CloudUser(user_id="local-dev", tier="local", product=self.product, has_byok=has_byok)
-            return self._resolve_guest(request, response)
-
-        token = _extract_session_token(raw_session)
-        if not token:
-            return self._resolve_guest(request, response)
-
-        # Soft-fail on invalid/expired JWT: downgrade to guest rather than
-        # hard-erroring with 401.  Public endpoints (e.g. community blocklist)
-        # should remain accessible even when the browser has a stale cookie.
-        # Routes that genuinely require an authenticated identity should gate
-        # themselves with require_tier() — that's where the 401/403 belongs.
-        try:
-            user_id = self.validate_jwt(token)
-        except Exception:
-            log.warning(
-                "JWT validation failed for product %s (expired or tampered) — falling back to guest",
-                self.product,
-            )
-            return self._resolve_guest(request, response)
-
-        self._ensure_provisioned(user_id)
-        tier_data = self._resolve_tier(user_id)
-        tier = tier_data.get("tier", "free")
-
-        meta: dict[str, Any] = {}
-        if self._extra_meta:
-            meta = self._extra_meta(user_id, tier) or {}
-        # Merge any extra fields from Heimdall response (e.g. household_id)
-        meta.update({k: v for k, v in tier_data.items() if k not in ("tier", "license_key")})
-        meta["license_key"] = tier_data.get("license_key")
-
-        return CloudUser(
-            user_id=user_id,
-            tier=tier,
-            product=self.product,
-            has_byok=has_byok,
-            meta=meta,
-        )
-
-    def dependency(self) -> Callable[["_Request", "_Response"], CloudUser]:
-        """Return a FastAPI-compatible dependency function (use with Depends())."""
-        factory = self
-
-        def _get_session(request: _Request, response: _Response) -> CloudUser:
-            return factory.resolve(request, response)
-
-        return _get_session
-
-    def require_tier(self, min_tier: str) -> Callable:
-        """Dependency factory — raises 403 if the session tier is below min_tier."""
-        from fastapi import Depends, HTTPException
-        min_idx = TIERS.index(min_tier)
-        get_session = self.dependency()
-
-        def _check(session: CloudUser = Depends(get_session)) -> CloudUser:
-            if session.tier in ("local", "local-dev"):
-                return session
-            try:
-                if TIERS.index(session.tier) < min_idx:
-                    raise HTTPException(
-                        status_code=403,
-                        detail=f"This feature requires {min_tier} tier or above.",
-                    )
-            except ValueError:
-                raise HTTPException(status_code=403, detail="Unknown tier.")
-            return session
-
-        return _check
-
-
-# ── BYOK detection ────────────────────────────────────────────────────────────
-
-def detect_byok(config_path: Path | None = None) -> bool:
-    """Return True if at least one enabled non-vision LLM backend is configured.
-
-    Reads the shared llm.yaml that LLMRouter uses. Local (Ollama, vLLM) and
-    API-key backends both count — the policy is "user is supplying compute",
-    regardless of where that compute lives.
-
-    Args:
-        config_path: Override the default config location. Useful in tests.
-    """
-    import yaml
-    if config_path is None:
-        config_path = Path.home() / ".config" / "circuitforge" / "llm.yaml"
-    try:
-        with open(config_path) as f:
-            cfg = yaml.safe_load(f) or {}
-        return any(
-            b.get("enabled", True) and b.get("type") != "vision_service"
-            for b in cfg.get("backends", {}).values()
-        )
-    except Exception:
-        return False
--- a/circuitforge_core/community/init.py
+++ b/circuitforge_core/community/init.py
@ -1,9 +0,0 @@
-# circuitforge_core/community/__init__.py
-# MIT License
-
-from .models import CommunityPost
-from .db import CommunityDB
-from .store import SharedStore
-from .snipe_store import SellerTrustSignal, SnipeCommunityStore
-
-__all__ = ["CommunityDB", "CommunityPost", "SharedStore", "SellerTrustSignal", "SnipeCommunityStore"]
--- a/circuitforge_core/community/db.py
+++ b/circuitforge_core/community/db.py
@ -1,117 +0,0 @@
-# circuitforge_core/community/db.py
-# MIT License
-
-from __future__ import annotations
-
-import importlib.resources
-import logging
-from pathlib import Path
-
-import psycopg2
-from psycopg2.pool import ThreadedConnectionPool
-
-logger = logging.getLogger(__name__)
-
-_MIN_CONN = 1
-_MAX_CONN = 10
-
-
-class CommunityDB:
-    """Shared PostgreSQL connection pool + migration runner for the community module.
-
-    Products instantiate one CommunityDB at startup and pass it to SharedStore
-    subclasses. The pool is thread-safe (ThreadedConnectionPool).
-
-    Usage:
-        db = CommunityDB.from_env()   # reads COMMUNITY_DB_URL
-        db.run_migrations()
-        store = MyProductStore(db)
-        db.close()                    # at shutdown
-    """
-
-    def __init__(self, dsn: str | None) -> None:
-        if not dsn:
-            raise ValueError(
-                "CommunityDB requires a DSN. "
-                "Set COMMUNITY_DB_URL or pass dsn= explicitly."
-            )
-        self._pool = ThreadedConnectionPool(_MIN_CONN, _MAX_CONN, dsn=dsn)
-        logger.debug("CommunityDB pool created (min=%d, max=%d)", _MIN_CONN, _MAX_CONN)
-
-    @classmethod
-    def from_env(cls) -> "CommunityDB":
-        """Construct from the COMMUNITY_DB_URL environment variable."""
-        import os
-        dsn = os.environ.get("COMMUNITY_DB_URL")
-        return cls(dsn=dsn)
-
-    # ------------------------------------------------------------------
-    # Connection management
-    # ------------------------------------------------------------------
-
-    def getconn(self):
-        """Borrow a connection from the pool. Must be returned via putconn()."""
-        return self._pool.getconn()
-
-    def putconn(self, conn) -> None:
-        """Return a borrowed connection to the pool."""
-        self._pool.putconn(conn)
-
-    def close(self) -> None:
-        """Close all pool connections. Call at application shutdown."""
-        self._pool.closeall()
-        logger.debug("CommunityDB pool closed")
-
-    # ------------------------------------------------------------------
-    # Migration runner
-    # ------------------------------------------------------------------
-
-    def _discover_migrations(self) -> list[Path]:
-        """Return sorted list of .sql migration files from the community migrations dir."""
-        pkg = importlib.resources.files("circuitforge_core.community.migrations")
-        files = sorted(
-            [Path(str(p)) for p in pkg.iterdir() if str(p).endswith(".sql")],
-            key=lambda p: p.name,
-        )
-        return files
-
-    def run_migrations(self) -> None:
-        """Apply all community migration SQL files in numeric order.
-
-        Uses a simple applied-migrations table to avoid re-running already
-        applied migrations. Idempotent.
-        """
-        conn = self.getconn()
-        try:
-            with conn.cursor() as cur:
-                cur.execute("""
-                    CREATE TABLE IF NOT EXISTS _community_migrations (
-                        filename TEXT PRIMARY KEY,
-                        applied_at TIMESTAMPTZ NOT NULL DEFAULT NOW()
-                    )
-                """)
-                conn.commit()
-
-                for migration_file in self._discover_migrations():
-                    name = migration_file.name
-                    cur.execute(
-                        "SELECT 1 FROM _community_migrations WHERE filename = %s",
-                        (name,),
-                    )
-                    if cur.fetchone():
-                        logger.debug("Migration %s already applied, skipping", name)
-                        continue
-
-                    sql = migration_file.read_text()
-                    logger.info("Applying community migration: %s", name)
-                    cur.execute(sql)
-                    cur.execute(
-                        "INSERT INTO _community_migrations (filename) VALUES (%s)",
-                        (name,),
-                    )
-                    conn.commit()
-        except Exception:
-            conn.rollback()
-            raise
-        finally:
-            self.putconn(conn)
--- a/circuitforge_core/community/migrations/001_community_posts.sql
+++ b/circuitforge_core/community/migrations/001_community_posts.sql
@ -1,55 +0,0 @@
-- 001_community_posts.sql
-- Community posts table: published meal plans, recipe successes, and bloopers.
-- Applies to: cf_community PostgreSQL database (hosted by cf-orch).
-- BSL boundary: this schema is MIT (data layer, no inference).
-
-CREATE TABLE IF NOT EXISTS community_posts (
-    id              BIGSERIAL PRIMARY KEY,
-    slug            TEXT NOT NULL UNIQUE,  -- lookup key for reads/deletes; FK target of similar_to_ref (006)
-    pseudonym       TEXT NOT NULL,         -- author handle; deletes must match it
-    post_type       TEXT NOT NULL CHECK (post_type IN ('plan', 'recipe_success', 'recipe_blooper')),
-    published       TIMESTAMPTZ NOT NULL DEFAULT NOW(),
-    title           TEXT NOT NULL,
-    description     TEXT,
-    photo_url       TEXT,
-
-    -- Plan slots (JSON array: [{day, meal_type, recipe_id, recipe_name}])
-    slots           JSONB NOT NULL DEFAULT '[]',
-
-    -- Recipe result fields
-    recipe_id       BIGINT,
-    recipe_name     TEXT,
-    level           SMALLINT CHECK (level IS NULL OR level BETWEEN 1 AND 4),  -- CreativityLevel in models.py
-    outcome_notes   TEXT,
-
-    -- Element snapshot (denormalized from corpus at publish time)
-    -- Nullable here; the store reads a NULL score back as 0.0 and the
-    -- CommunityPost model rejects scores outside 0.0-1.0.
-    seasoning_score REAL,
-    richness_score  REAL,
-    brightness_score REAL,
-    depth_score     REAL,
-    aroma_score     REAL,
-    structure_score REAL,
-    texture_profile TEXT,
-
-    -- Dietary / allergen / flavor
-    dietary_tags    JSONB NOT NULL DEFAULT '[]',
-    allergen_flags  JSONB NOT NULL DEFAULT '[]',
-    flavor_molecules JSONB NOT NULL DEFAULT '[]',
-
-    -- USDA FDC macros
-    fat_pct         REAL,
-    protein_pct     REAL,
-    moisture_pct    REAL,
-
-    -- Source product identifier
-    source_product  TEXT NOT NULL DEFAULT 'kiwi'
-);
-
-- Indexes for common filter patterns
-CREATE INDEX IF NOT EXISTS idx_community_posts_published ON community_posts (published DESC);
-CREATE INDEX IF NOT EXISTS idx_community_posts_post_type ON community_posts (post_type);
-CREATE INDEX IF NOT EXISTS idx_community_posts_source ON community_posts (source_product);
-
-- GIN index for dietary/allergen JSONB array containment queries
-CREATE INDEX IF NOT EXISTS idx_community_posts_dietary_tags ON community_posts USING GIN (dietary_tags);
-CREATE INDEX IF NOT EXISTS idx_community_posts_allergen_flags ON community_posts USING GIN (allergen_flags);
--- a/circuitforge_core/community/migrations/002_community_post_reactions.sql
+++ b/circuitforge_core/community/migrations/002_community_post_reactions.sql
@ -1,7 +0,0 @@
-- 002_community_post_reactions.sql
-- Reserved: community post reactions (thumbs-up, saves count).
-- Not yet implemented -- this migration is a stub to reserve the sequence number.
-- Applies to: cf_community PostgreSQL database (hosted by cf-orch).
-
-- Placeholder: no-op. Will be replaced when reactions feature is designed.
-- The migration runner passes the whole file to a single execute() call, so the
-- stub carries one harmless statement (presumably because a comment-only file
-- would be rejected as an empty query -- confirm against the driver).
-SELECT 1;
--- a/circuitforge_core/community/migrations/003_seller_trust_signals.sql
+++ b/circuitforge_core/community/migrations/003_seller_trust_signals.sql
@ -1,26 +0,0 @@
-- Seller trust signals: confirmed scammer / confirmed legitimate outcomes from Snipe.
-- Separate table from community_posts (Kiwi-specific) — seller signals are a
-- structurally different domain and should not overload the recipe post schema.
-- Applies to: cf_community PostgreSQL database (hosted by cf-orch).
-- BSL boundary: table schema is MIT; signal ingestion route in cf-orch is BSL 1.1.
-
-CREATE TABLE IF NOT EXISTS seller_trust_signals (
-    id              BIGSERIAL PRIMARY KEY,
-    platform        TEXT    NOT NULL DEFAULT 'ebay',
-    platform_seller_id TEXT NOT NULL,
-    confirmed_scam  BOOLEAN NOT NULL,  -- TRUE = confirmed bad actor, FALSE = confirmed legitimate
-    signal_source   TEXT    NOT NULL,  -- 'blocklist_add' | 'community_vote' | 'resolved'
-    flags           JSONB   NOT NULL DEFAULT '[]',  -- red flag keys at time of signal
-    source_product  TEXT    NOT NULL DEFAULT 'snipe',
-    recorded_at     TIMESTAMPTZ NOT NULL DEFAULT NOW()
-);
-
-- No PII: platform_seller_id is the public eBay username or platform ID only.
-- (platform, platform_seller_id) is the filter used by the per-seller signal
-- listing and the scam-signal count in SnipeCommunityStore.
-CREATE INDEX IF NOT EXISTS idx_seller_trust_platform_id
-    ON seller_trust_signals (platform, platform_seller_id);
-
-CREATE INDEX IF NOT EXISTS idx_seller_trust_confirmed
-    ON seller_trust_signals (confirmed_scam);
-
-CREATE INDEX IF NOT EXISTS idx_seller_trust_recorded
-    ON seller_trust_signals (recorded_at DESC);
--- a/circuitforge_core/community/migrations/004_community_categories.sql
+++ b/circuitforge_core/community/migrations/004_community_categories.sql
@ -1,19 +0,0 @@
-- 004_community_categories.sql
-- MIT License
-- Shared eBay category tree published by credentialed Snipe instances.
-- Credentialless instances pull from this table during refresh().
-- Privacy: only public eBay category metadata (IDs, names, paths) — no user data.
-
-CREATE TABLE IF NOT EXISTS community_categories (
-    id              SERIAL PRIMARY KEY,
-    platform        TEXT NOT NULL DEFAULT 'ebay',
-    category_id     TEXT NOT NULL,
-    name            TEXT NOT NULL,
-    full_path       TEXT NOT NULL,
-    source_product  TEXT NOT NULL DEFAULT 'snipe',
-    published_at    TIMESTAMPTZ NOT NULL DEFAULT NOW(),  -- reset to NOW() on every upsert
-    -- Conflict target of the ON CONFLICT upsert in SnipeCommunityStore.publish_categories.
-    UNIQUE (platform, category_id)
-);
-
-- Matches fetch_categories, which filters by platform and orders by name.
-CREATE INDEX IF NOT EXISTS idx_community_cat_name
-    ON community_categories (platform, name);
--- a/circuitforge_core/community/migrations/005_recipe_tags.sql
+++ b/circuitforge_core/community/migrations/005_recipe_tags.sql
@ -1,42 +0,0 @@
-- 005_recipe_tags.sql
-- Community-contributed recipe subcategory tags.
--
-- Users can tag corpus recipes (from a product's local recipe dataset) with a
-- domain/category/subcategory from that product's browse taxonomy. Tags are
-- keyed by (recipe_source, recipe_ref) so a single table serves all CF products
-- that have a recipe corpus (currently: kiwi).
--
-- Acceptance threshold: upvotes >= 2 (submitter's implicit vote counts as 1,
-- so one additional voter is enough to publish). Browse counts caches merge
-- accepted tags into subcategory totals on each nightly refresh.
-
-CREATE TABLE IF NOT EXISTS recipe_tags (
-    id              BIGSERIAL PRIMARY KEY,
-    recipe_source   TEXT NOT NULL CHECK (recipe_source IN ('corpus')),
-    recipe_ref      TEXT NOT NULL,      -- corpus integer recipe ID stored as text
-    domain          TEXT NOT NULL,
-    category        TEXT NOT NULL,
-    subcategory     TEXT,               -- NULL = category-level tag (no subcategory)
-    pseudonym       TEXT NOT NULL,
-    upvotes         INTEGER NOT NULL DEFAULT 1,  -- starts at 1 (submitter's own vote)
-    source_product  TEXT NOT NULL DEFAULT 'kiwi',
-    created_at      TIMESTAMPTZ NOT NULL DEFAULT now(),
-    -- one tag per (recipe, location, user) — prevents submitting the same tag twice
-    -- NOTE(review): subcategory is nullable and PostgreSQL treats NULLs as distinct
-    -- in a UNIQUE constraint by default, so this likely does not stop the same user
-    -- from submitting a duplicate category-level tag (subcategory IS NULL). Confirm,
-    -- and if so address it in a follow-up migration rather than by editing this one.
-    UNIQUE (recipe_source, recipe_ref, domain, category, subcategory, pseudonym)
-);
-
-- Partial index: only rows that reached the acceptance threshold (upvotes >= 2).
-CREATE INDEX IF NOT EXISTS idx_recipe_tags_lookup
-    ON recipe_tags (source_product, domain, category, subcategory)
-    WHERE upvotes >= 2;
-
-CREATE INDEX IF NOT EXISTS idx_recipe_tags_recipe
-    ON recipe_tags (recipe_source, recipe_ref);
-
-- Tracks who voted on which tag to prevent double-voting.
-- The submitter's self-vote is inserted here at submission time.
-CREATE TABLE IF NOT EXISTS recipe_tag_votes (
-    tag_id      BIGINT NOT NULL REFERENCES recipe_tags(id) ON DELETE CASCADE,
-    pseudonym   TEXT NOT NULL,
-    voted_at    TIMESTAMPTZ NOT NULL DEFAULT now(),
-    PRIMARY KEY (tag_id, pseudonym)  -- a second vote by the same pseudonym violates this key
-);
--- a/circuitforge_core/community/migrations/006_community_dedup.sql
+++ b/circuitforge_core/community/migrations/006_community_dedup.sql
@ -1,22 +0,0 @@
-- 006_community_dedup.sql
-- Adds variation-linking and title search support for community recipe dedup.
-- Applies to: cf_community PostgreSQL database.
-- BSL boundary: MIT (data layer, no inference).
-
-- Nullable self-referential FK: user-declared "this is a variation of X"
-- Deleting the parent post clears the link (ON DELETE SET NULL) and keeps the variation.
-ALTER TABLE community_posts
-    ADD COLUMN IF NOT EXISTS similar_to_ref TEXT REFERENCES community_posts(slug) ON DELETE SET NULL;
-
-- Index for variation lookup (find all variations of a parent post)
-CREATE INDEX IF NOT EXISTS idx_community_posts_similar_ref
-    ON community_posts (similar_to_ref)
-    WHERE similar_to_ref IS NOT NULL;
-
-- Expression index on lower(title) for case-insensitive title lookups.
-- NOTE(review): a plain B-tree index serves equality on lower(title); it cannot
-- serve the leading-wildcard LIKE '%...%' that the dedup search issues, and
-- prefix LIKE generally needs text_pattern_ops or a C collation. If substring
-- search must be indexed, consider a trigram (pg_trgm) index in a later migration.
-CREATE INDEX IF NOT EXISTS idx_community_posts_title_lower
-    ON community_posts (lower(title));
-
-- Index on recipe_id for exact-recipe duplicate detection
-CREATE INDEX IF NOT EXISTS idx_community_posts_recipe_id
-    ON community_posts (recipe_id)
-    WHERE recipe_id IS NOT NULL;
--- a/circuitforge_core/community/migrations/init.py
+++ b/circuitforge_core/community/migrations/init.py
@ -1,2 +0,0 @@
-# Community module migrations
-# These SQL files are shipped with circuitforge-core so cf-orch can locate them via importlib.resources.
--- a/circuitforge_core/community/models.py
+++ b/circuitforge_core/community/models.py
@ -1,90 +0,0 @@
-# circuitforge_core/community/models.py
-# MIT License
-
-from __future__ import annotations
-
-from dataclasses import dataclass, field
-from datetime import datetime
-from typing import Literal
-
-PostType = Literal["plan", "recipe_success", "recipe_blooper"]
-CreativityLevel = Literal[1, 2, 3, 4]
-
-_VALID_POST_TYPES: frozenset[str] = frozenset(["plan", "recipe_success", "recipe_blooper"])
-
-
-def _validate_score(name: str, value: float) -> float:
-    """Return ``value`` unchanged when it lies in the closed range 0.0-1.0.
-
-    Args:
-        name: Field name, used only in the error message.
-        value: Score to check.
-
-    Raises:
-        ValueError: If ``value`` is outside the range (this includes NaN,
-            for which both comparisons are false).
-    """
-    within_bounds = 0.0 <= value <= 1.0
-    if within_bounds:
-        return value
-    raise ValueError(f"{name} must be between 0.0 and 1.0, got {value!r}")
-
-
-@dataclass(frozen=True)
-class CommunityPost:
-    """Frozen value object describing one published community post.
-
-    The four collection fields (slots, dietary_tags, allergen_flags,
-    flavor_molecules) are held as tuples. Callers may pass lists; they are
-    converted to tuples in __post_init__. post_type and the six element scores
-    are validated at construction time.
-    """
-
-    # --- Identity ---
-    slug: str
-    pseudonym: str
-    post_type: PostType
-    published: datetime
-    title: str
-
-    # --- Optional free-form content ---
-    description: str | None
-    photo_url: str | None
-
-    # --- Plan slots: a sequence of dicts, used when post_type="plan" ---
-    slots: tuple
-
-    # --- Recipe outcome, used when post_type is "recipe_success" or "recipe_blooper" ---
-    recipe_id: int | None
-    recipe_name: str | None
-    level: CreativityLevel | None
-    outcome_notes: str | None
-
-    # --- Element snapshot (each score must be within 0.0-1.0) ---
-    seasoning_score: float
-    richness_score: float
-    brightness_score: float
-    depth_score: float
-    aroma_score: float
-    structure_score: float
-    texture_profile: str
-
-    # --- Dietary / allergen / flavor collections ---
-    dietary_tags: tuple
-    allergen_flags: tuple
-    flavor_molecules: tuple
-
-    # --- USDA FDC macros; None when not available for the recipe ---
-    fat_pct: float | None
-    protein_pct: float | None
-    moisture_pct: float | None
-
-    # --- Slug of the parent post when this post is declared a variation of it ---
-    similar_to_ref: str | None = None
-
-    def __post_init__(self) -> None:
-        # A frozen dataclass rejects ordinary attribute assignment, so the
-        # list -> tuple conversion has to go through object.__setattr__.
-        for attr in ("slots", "dietary_tags", "allergen_flags", "flavor_molecules"):
-            current = getattr(self, attr)
-            if isinstance(current, list):
-                object.__setattr__(self, attr, tuple(current))
-
-        # Reject unknown post types.
-        if self.post_type not in _VALID_POST_TYPES:
-            allowed = sorted(_VALID_POST_TYPES)
-            raise ValueError(
-                f"post_type must be one of {allowed}, got {self.post_type!r}"
-            )
-
-        # Every element score must fall inside the accepted range.
-        score_fields = (
-            "seasoning_score",
-            "richness_score",
-            "brightness_score",
-            "depth_score",
-            "aroma_score",
-            "structure_score",
-        )
-        for attr in score_fields:
-            _validate_score(attr, getattr(self, attr))
--- a/circuitforge_core/community/snipe_store.py
+++ b/circuitforge_core/community/snipe_store.py
@ -1,253 +0,0 @@
-# circuitforge_core/community/snipe_store.py
-# MIT License
-"""Snipe community store — publishes seller trust signals to the shared community DB.
-
-Snipe products subclass SharedStore here to write seller trust signals
-(confirmed scammer / confirmed legitimate) to the cf_community PostgreSQL.
-These signals aggregate across all Snipe users to power the cross-user
-seller trust classifier fine-tuning corpus.
-
-Privacy: only platform_seller_id (public eBay username/ID) and flag keys
-are written. No PII is stored.
-
-Usage:
-    from circuitforge_core.community import CommunityDB
-    from circuitforge_core.community.snipe_store import SnipeCommunityStore
-
-    db = CommunityDB.from_env()
-    store = SnipeCommunityStore(db, source_product="snipe")
-    store.publish_seller_signal(
-        platform_seller_id="ebay-username",
-        confirmed_scam=True,
-        signal_source="blocklist_add",
-        flags=["new_account", "suspicious_price"],
-    )
-"""
-from __future__ import annotations
-
-import json
-import logging
-from dataclasses import dataclass
-from datetime import datetime, timezone
-
-from .store import SharedStore
-
-log = logging.getLogger(__name__)
-
-
-@dataclass(frozen=True)
-class SellerTrustSignal:
-    """Immutable snapshot of a recorded seller trust signal."""
-    # Database-generated row id (returned by the INSERT ... RETURNING).
-    id: int
-    # Auction platform the seller belongs to, e.g. "ebay".
-    platform: str
-    # Public username or platform ID of the seller.
-    platform_seller_id: str
-    # True = confirmed bad actor; False = confirmed legitimate.
-    confirmed_scam: bool
-    # Origin of the signal, e.g. 'blocklist_add', 'community_vote', 'resolved'.
-    signal_source: str
-    # Red-flag keys that were active when the signal was recorded.
-    flags: tuple
-    # Product that wrote the signal.
-    source_product: str
-    # Database-side timestamp of the insert.
-    recorded_at: datetime
-
-
-class SnipeCommunityStore(SharedStore):
-    """Snipe's store on the shared community DB.
-
-    Reads and writes rows in ``seller_trust_signals`` and
-    ``community_categories``. Every method borrows a connection from the
-    injected db object and returns it in a ``finally`` block.
-    """
-
-    def __init__(self, db, source_product: str = "snipe") -> None:
-        # Delegates to SharedStore; only the default product label differs.
-        super().__init__(db, source_product=source_product)
-
-    def publish_seller_signal(
-        self,
-        platform_seller_id: str,
-        confirmed_scam: bool,
-        signal_source: str,
-        flags: list[str] | None = None,
-        platform: str = "ebay",
-    ) -> SellerTrustSignal:
-        """Insert one seller trust outcome and return it as a SellerTrustSignal.
-
-        Args:
-            platform_seller_id: Public username or platform ID of the seller.
-            confirmed_scam: True for a confirmed bad actor, False for a seller
-                confirmed legitimate.
-            signal_source: Where the signal came from, for example
-                'blocklist_add', 'community_vote' or 'resolved'.
-            flags: Red-flag keys active when the signal was raised. None or an
-                empty list is stored as an empty JSON array.
-            platform: Auction platform the seller belongs to.
-
-        Returns:
-            The stored signal, carrying the id and recorded_at values the
-            database returned.
-
-        Raises:
-            Exception: Any failure is logged at WARNING level, the transaction
-                is rolled back, and the original exception propagates.
-        """
-        flags = flags or []
-        conn = self._db.getconn()
-        try:
-            with conn.cursor() as cur:
-                insert_args = (
-                    platform,
-                    platform_seller_id,
-                    confirmed_scam,
-                    signal_source,
-                    json.dumps(flags),
-                    self._source_product,
-                )
-                cur.execute(
-                    """
-                    INSERT INTO seller_trust_signals
-                        (platform, platform_seller_id, confirmed_scam,
-                         signal_source, flags, source_product)
-                    VALUES (%s, %s, %s, %s, %s::jsonb, %s)
-                    RETURNING id, recorded_at
-                    """,
-                    insert_args,
-                )
-                inserted = cur.fetchone()
-                conn.commit()
-            # Build the result from the caller's arguments plus the two
-            # database-generated columns.
-            signal = SellerTrustSignal(
-                id=inserted[0],
-                platform=platform,
-                platform_seller_id=platform_seller_id,
-                confirmed_scam=confirmed_scam,
-                signal_source=signal_source,
-                flags=tuple(flags),
-                source_product=self._source_product,
-                recorded_at=inserted[1],
-            )
-            return signal
-        except Exception:
-            conn.rollback()
-            log.warning(
-                "Failed to publish seller signal for %s (%s)",
-                platform_seller_id, signal_source, exc_info=True,
-            )
-            raise
-        finally:
-            self._db.putconn(conn)
-
-    def list_signals_for_seller(
-        self,
-        platform_seller_id: str,
-        platform: str = "ebay",
-        limit: int = 50,
-    ) -> list[SellerTrustSignal]:
-        """Return up to ``limit`` signals for one seller, most recent first."""
-        conn = self._db.getconn()
-        try:
-            with conn.cursor() as cur:
-                query_args = (platform, platform_seller_id, limit)
-                cur.execute(
-                    """
-                    SELECT id, platform, platform_seller_id, confirmed_scam,
-                           signal_source, flags, source_product, recorded_at
-                    FROM seller_trust_signals
-                    WHERE platform = %s AND platform_seller_id = %s
-                    ORDER BY recorded_at DESC
-                    LIMIT %s
-                    """,
-                    query_args,
-                )
-                records = cur.fetchall()
-
-            signals = []
-            for rec in records:
-                # The flags column may arrive as JSON text or already decoded;
-                # a falsy decoded value is treated as "no flags".
-                raw_flags = rec[5]
-                if isinstance(raw_flags, str):
-                    decoded_flags = json.loads(raw_flags)
-                else:
-                    decoded_flags = raw_flags or []
-                signals.append(
-                    SellerTrustSignal(
-                        id=rec[0],
-                        platform=rec[1],
-                        platform_seller_id=rec[2],
-                        confirmed_scam=rec[3],
-                        signal_source=rec[4],
-                        flags=tuple(decoded_flags),
-                        source_product=rec[6],
-                        recorded_at=rec[7],
-                    )
-                )
-            return signals
-        finally:
-            self._db.putconn(conn)
-
-    def scam_signal_count(self, platform_seller_id: str, platform: str = "ebay") -> int:
-        """Count the confirmed_scam=TRUE signals recorded for a seller.
-
-        Callers use the count to decide whether a seller has crossed the
-        community consensus threshold for the shared blocklist.
-        """
-        conn = self._db.getconn()
-        try:
-            with conn.cursor() as cur:
-                cur.execute(
-                    """
-                    SELECT COUNT(*) FROM seller_trust_signals
-                    WHERE platform = %s AND platform_seller_id = %s AND confirmed_scam = TRUE
-                    """,
-                    (platform, platform_seller_id),
-                )
-                count_row = cur.fetchone()
-                return count_row[0]
-        finally:
-            self._db.putconn(conn)
-
-    def publish_categories(
-        self,
-        categories: list[tuple[str, str, str]],
-        platform: str = "ebay",
-    ) -> int:
-        """Upsert a batch of categories into ``community_categories``.
-
-        A row that already exists for (platform, category_id) has its name,
-        full_path and source_product overwritten and its published_at reset.
-
-        Args:
-            categories: (category_id, name, full_path) tuples.
-            platform: Auction platform the categories belong to.
-
-        Returns:
-            ``len(categories)``, i.e. the number of tuples submitted; 0 for an
-            empty batch, in which case no connection is taken.
-
-        Raises:
-            Exception: Any failure is logged at WARNING level, the transaction
-                is rolled back, and the original exception propagates.
-        """
-        if not categories:
-            return 0
-        conn = self._db.getconn()
-        try:
-            with conn.cursor() as cur:
-                batch = [
-                    (platform, category_id, label, full_path, self._source_product)
-                    for category_id, label, full_path in categories
-                ]
-                cur.executemany(
-                    """
-                    INSERT INTO community_categories
-                        (platform, category_id, name, full_path, source_product)
-                    VALUES (%s, %s, %s, %s, %s)
-                    ON CONFLICT (platform, category_id)
-                    DO UPDATE SET
-                        name = EXCLUDED.name,
-                        full_path = EXCLUDED.full_path,
-                        source_product = EXCLUDED.source_product,
-                        published_at = NOW()
-                    """,
-                    batch,
-                )
-                conn.commit()
-                return len(categories)
-        except Exception:
-            conn.rollback()
-            log.warning(
-                "Failed to publish %d categories to community store",
-                len(categories), exc_info=True,
-            )
-            raise
-        finally:
-            self._db.putconn(conn)
-
-    def fetch_categories(
-        self,
-        platform: str = "ebay",
-        limit: int = 500,
-    ) -> list[tuple[str, str, str]]:
-        """Read community-contributed categories for one platform.
-
-        Args:
-            platform: Auction platform to filter on.
-            limit: Maximum number of rows to return.
-
-        Returns:
-            (category_id, name, full_path) tuples, ordered by name.
-        """
-        conn = self._db.getconn()
-        try:
-            with conn.cursor() as cur:
-                cur.execute(
-                    """
-                    SELECT category_id, name, full_path
-                    FROM community_categories
-                    WHERE platform = %s
-                    ORDER BY name
-                    LIMIT %s
-                    """,
-                    (platform, limit),
-                )
-                found = []
-                for rec in cur.fetchall():
-                    found.append((rec[0], rec[1], rec[2]))
-                return found
-        finally:
-            self._db.putconn(conn)
--- a/circuitforge_core/community/store.py
+++ b/circuitforge_core/community/store.py
@ -1,434 +0,0 @@
-# circuitforge_core/community/store.py
-# MIT License
-
-from __future__ import annotations
-
-import logging
-from typing import TYPE_CHECKING
-
-from .models import CommunityPost
-
-if TYPE_CHECKING:
-    from .db import CommunityDB
-
-logger = logging.getLogger(__name__)
-
-
-def _row_to_post(row: dict) -> CommunityPost:
-    """Build a CommunityPost from a row dict keyed by column name.
-
-    The JSONB columns (slots, dietary_tags, allergen_flags, flavor_molecules)
-    are used as delivered, with no json.loads() call here, and a missing or
-    falsy value becomes an empty list. A missing or falsy score becomes 0.0
-    and a missing or falsy texture_profile becomes "".
-
-    Raises:
-        KeyError: If an identity column or a score column is absent from ``row``.
-    """
-    # Identity columns are mandatory: plain indexing raises KeyError if absent.
-    fields = {
-        column: row[column]
-        for column in ("slug", "pseudonym", "post_type", "published", "title")
-    }
-
-    # Optional columns fall back to None.
-    for column in (
-        "description", "photo_url",
-        "recipe_id", "recipe_name", "level", "outcome_notes",
-        "fat_pct", "protein_pct", "moisture_pct",
-        "similar_to_ref",
-    ):
-        fields[column] = row.get(column)
-
-    # Collection columns fall back to an empty list.
-    for column in ("slots", "dietary_tags", "allergen_flags", "flavor_molecules"):
-        fields[column] = row.get(column) or []
-
-    # Score columns must be present in the row; NULL is read as 0.0.
-    for column in (
-        "seasoning_score", "richness_score", "brightness_score",
-        "depth_score", "aroma_score", "structure_score",
-    ):
-        fields[column] = row[column] or 0.0
-
-    fields["texture_profile"] = row.get("texture_profile") or ""
-    return CommunityPost(**fields)
-
-
-def _cursor_to_dict(cur, row) -> dict:
-    """Return ``row`` as a dict keyed by column name.
-
-    A row that is already a dict is returned as-is. Otherwise the values are
-    paired positionally with the first element of each ``cur.description`` entry.
-    """
-    if not isinstance(row, dict):
-        column_names = (column[0] for column in cur.description)
-        return dict(zip(column_names, row))
-    return row
-
-
-class SharedStore:
-    """Base class for product community stores.
-
-    Subclass this in each product:
-        class KiwiCommunityStore(SharedStore):
-            def list_posts_for_week(self, week_start: str) -> list[CommunityPost]: ...
-
-    All methods return new objects (immutable pattern). Never mutate rows in-place.
-    """
-
-    def __init__(self, db: "CommunityDB", source_product: str = "kiwi") -> None:
-        """Remember the connection provider and the product label.
-
-        Args:
-            db: Object whose getconn()/putconn() the store methods call.
-            source_product: Label written to the source_product column by
-                insert_post.
-        """
-        self._source_product = source_product
-        self._db = db
-
-    # ------------------------------------------------------------------
-    # Reads
-    # ------------------------------------------------------------------
-
-    def get_post_by_slug(self, slug: str) -> CommunityPost | None:
-        """Fetch the post with the given slug, or None when there is no such post."""
-        conn = self._db.getconn()
-        try:
-            with conn.cursor() as cur:
-                query = "SELECT * FROM community_posts WHERE slug = %s LIMIT 1"
-                cur.execute(query, (slug,))
-                found = cur.fetchone()
-                # Convert only when a row came back; a miss is reported as None.
-                return None if found is None else _row_to_post(_cursor_to_dict(cur, found))
-        finally:
-            # The connection is handed back whether or not the query succeeded.
-            self._db.putconn(conn)
-
-    def list_posts(
-        self,
-        limit: int = 20,
-        offset: int = 0,
-        post_type: str | None = None,
-        dietary_tags: list[str] | None = None,
-        allergen_exclude: list[str] | None = None,
-        source_product: str | None = None,
-    ) -> list[CommunityPost]:
-        """Return one page of posts, newest first, with optional filters.
-
-        Filters that are None or empty are not applied; the ones given are
-        combined with AND.
-
-        Args:
-            limit: Maximum number of posts to return.
-            offset: Number of posts to skip before the page starts.
-            post_type: Keep only posts of this type.
-            dietary_tags: JSONB containment — posts must include ALL listed tags.
-            allergen_exclude: Posts must NOT include ANY of the listed flags.
-            source_product: Keep only posts written by this product.
-
-        Returns:
-            The matching posts ordered by ``published`` descending.
-        """
-        # Function-scope import: this module does not import json at the top.
-        import json
-
-        conn = self._db.getconn()
-        try:
-            conditions: list[str] = []
-            params: list = []
-
-            if post_type:
-                conditions.append("post_type = %s")
-                params.append(post_type)
-            if dietary_tags:
-                conditions.append("dietary_tags @> %s::jsonb")
-                params.append(json.dumps(dietary_tags))
-            if allergen_exclude:
-                # jsonb has no && operator (that one is for SQL arrays), so the
-                # overlap test uses ?| instead: true when any string of the
-                # text[] operand is an element of the JSON array. The flags are
-                # therefore passed as a list (adapted to an SQL array), not as
-                # JSON text.
-                conditions.append("NOT (allergen_flags ?| %s::text[])")
-                params.append(list(allergen_exclude))
-            if source_product:
-                conditions.append("source_product = %s")
-                params.append(source_product)
-
-            where = ("WHERE " + " AND ".join(conditions)) if conditions else ""
-            # LIMIT/OFFSET placeholders come last in the statement.
-            params.extend([limit, offset])
-
-            with conn.cursor() as cur:
-                cur.execute(
-                    f"SELECT * FROM community_posts {where} "
-                    "ORDER BY published DESC LIMIT %s OFFSET %s",
-                    params,
-                )
-                rows = cur.fetchall()
-                return [_row_to_post(_cursor_to_dict(cur, r)) for r in rows]
-        finally:
-            self._db.putconn(conn)
-
-    def search_similar_posts(
-        self,
-        title: str,
-        recipe_id: int | None = None,
-        post_type: str | None = None,
-        limit: int = 8,
-    ) -> list[CommunityPost]:
-        """Return posts whose title contains ``title`` or that share ``recipe_id``.
-
-        Used by the dedup check before a new post is submitted. A post matches
-        when either holds:
-        - its recipe_id equals ``recipe_id`` (only when one is given), or
-        - its title contains the first 80 characters of ``title``,
-          case-insensitively. ``%``, ``_`` and ``\`` in ``title`` are matched
-          literally rather than as LIKE wildcards.
-
-        Args:
-            title: Title of the post about to be submitted.
-            recipe_id: Recipe the new post refers to, if any.
-            post_type: Restrict matches to this post type.
-            limit: Maximum number of posts to return.
-
-        Returns:
-            Matching posts. When ``recipe_id`` is given, exact recipe matches
-            come first; within each group posts are ordered newest first.
-        """
-        conn = self._db.getconn()
-        try:
-            # Truncate before escaping so an escape pair is never cut in half.
-            needle = title.lower()[:80]
-            # Backslash is LIKE's default escape character. It is escaped first
-            # so the backslashes added for % and _ are not doubled afterwards.
-            for special in ("\\", "%", "_"):
-                needle = needle.replace(special, "\\" + special)
-            title_param = f"%{needle}%"
-            title_condition = "lower(title) LIKE lower(%s)"
-
-            conditions: list[str] = []
-            params: list = []
-
-            if recipe_id is not None:
-                conditions.append(f"(recipe_id = %s OR {title_condition})")
-                params.extend([recipe_id, title_param])
-                # NULLS LAST: for a post without a recipe_id the comparison is
-                # NULL, and NULLs sort first under DESC by default, which would
-                # put title-only matches ahead of exact recipe matches.
-                order_clause = "ORDER BY (recipe_id = %s) DESC NULLS LAST, published DESC"
-                order_params: list = [recipe_id]
-            else:
-                conditions.append(title_condition)
-                params.append(title_param)
-                order_clause = "ORDER BY published DESC"
-                order_params = []
-
-            if post_type:
-                conditions.append("post_type = %s")
-                params.append(post_type)
-
-            where = "WHERE " + " AND ".join(conditions)
-            # Placeholder order in the statement: WHERE, then ORDER BY, then LIMIT.
-            params.extend(order_params)
-            params.append(limit)
-
-            with conn.cursor() as cur:
-                cur.execute(
-                    f"SELECT * FROM community_posts {where} {order_clause} LIMIT %s",
-                    params,
-                )
-                rows = cur.fetchall()
-                return [_row_to_post(_cursor_to_dict(cur, r)) for r in rows]
-        finally:
-            self._db.putconn(conn)
-
-    # ------------------------------------------------------------------
-    # Writes
-    # ------------------------------------------------------------------
-
-    def insert_post(self, post: CommunityPost) -> CommunityPost:
-        """Write ``post`` to community_posts and return the same object.
-
-        The source_product column is taken from this store, not from the post.
-        On any failure the transaction is rolled back and the exception
-        propagates.
-        """
-        import json
-
-        conn = self._db.getconn()
-        try:
-            with conn.cursor() as cur:
-                # Values are grouped to mirror the column list of the statement.
-                identity = (
-                    post.slug, post.pseudonym, post.post_type,
-                    post.published, post.title, post.description, post.photo_url,
-                )
-                plan_and_recipe = (
-                    json.dumps(list(post.slots)),
-                    post.recipe_id, post.recipe_name, post.level, post.outcome_notes,
-                )
-                elements = (
-                    post.seasoning_score, post.richness_score, post.brightness_score,
-                    post.depth_score, post.aroma_score, post.structure_score,
-                    post.texture_profile,
-                )
-                # Tuple fields are serialised as JSON arrays for the ::jsonb casts.
-                collections = (
-                    json.dumps(list(post.dietary_tags)),
-                    json.dumps(list(post.allergen_flags)),
-                    json.dumps(list(post.flavor_molecules)),
-                )
-                trailer = (
-                    post.fat_pct, post.protein_pct, post.moisture_pct,
-                    self._source_product,
-                    post.similar_to_ref,
-                )
-                cur.execute(
-                    """
-                    INSERT INTO community_posts (
-                        slug, pseudonym, post_type, published, title, description, photo_url,
-                        slots, recipe_id, recipe_name, level, outcome_notes,
-                        seasoning_score, richness_score, brightness_score,
-                        depth_score, aroma_score, structure_score, texture_profile,
-                        dietary_tags, allergen_flags, flavor_molecules,
-                        fat_pct, protein_pct, moisture_pct, source_product,
-                        similar_to_ref
-                    ) VALUES (
-                        %s, %s, %s, %s, %s, %s, %s,
-                        %s::jsonb, %s, %s, %s, %s,
-                        %s, %s, %s, %s, %s, %s, %s,
-                        %s::jsonb, %s::jsonb, %s::jsonb,
-                        %s, %s, %s, %s, %s
-                    )
-                    """,
-                    identity + plan_and_recipe + elements + collections + trailer,
-                )
-                conn.commit()
-            return post
-        except Exception:
-            conn.rollback()
-            raise
-        finally:
-            self._db.putconn(conn)
-
-    def delete_post(self, slug: str, pseudonym: str) -> bool:
-        """Permanently remove the post ``slug`` if it was written by ``pseudonym``.
-
-        Returns:
-            True when a row was deleted; False when no row matched both the
-            slug and the pseudonym.
-        """
-        conn = self._db.getconn()
-        try:
-            with conn.cursor() as cur:
-                statement = "DELETE FROM community_posts WHERE slug = %s AND pseudonym = %s"
-                cur.execute(statement, (slug, pseudonym))
-                conn.commit()
-                removed_any = cur.rowcount > 0
-                return removed_any
-        except Exception:
-            conn.rollback()
-            raise
-        finally:
-            self._db.putconn(conn)
-
-    # ── Recipe tags ───────────────────────────────────────────────────────────
-
-    def submit_recipe_tag(
-        self,
-        recipe_id: int,
-        domain: str,
-        category: str,
-        subcategory: str | None,
-        pseudonym: str,
-        source_product: str = "kiwi",
-    ) -> dict:
-        """Create a tag for a corpus recipe and record the submitter's own vote.
-
-        The tag row is inserted with upvotes=1 and a matching row is added to
-        recipe_tag_votes in the same transaction.
-
-        Returns:
-            The new tag as a dict with the keys id, recipe_ref, domain,
-            category, subcategory, pseudonym, upvotes and created_at.
-
-        Raises:
-            psycopg2.errors.UniqueViolation: If this user already tagged the
-                recipe to this location; left for the caller to handle.
-        """
-        conn = self._db.getconn()
-        try:
-            with conn.cursor() as cur:
-                # recipe_ref is a text column, so the integer id is stringified.
-                tag_args = (
-                    str(recipe_id), domain, category, subcategory,
-                    pseudonym, source_product,
-                )
-                cur.execute(
-                    """
-                    INSERT INTO recipe_tags
-                        (recipe_source, recipe_ref, domain, category, subcategory,
-                         pseudonym, upvotes, source_product)
-                    VALUES ('corpus', %s, %s, %s, %s, %s, 1, %s)
-                    RETURNING id, recipe_ref, domain, category, subcategory,
-                              pseudonym, upvotes, created_at
-                    """,
-                    tag_args,
-                )
-                column_names = [column[0] for column in cur.description]
-                returned = cur.fetchone()
-                tag = dict(zip(column_names, returned))
-
-                # The upvotes=1 on the new tag is the submitter's vote; store it
-                # in the votes table as well.
-                cur.execute(
-                    "INSERT INTO recipe_tag_votes (tag_id, pseudonym) VALUES (%s, %s)",
-                    (tag["id"], pseudonym),
-                )
-                conn.commit()
-                return tag
-        except Exception:
-            conn.rollback()
-            raise
-        finally:
-            self._db.putconn(conn)
-
-    def upvote_recipe_tag(self, tag_id: int, pseudonym: str) -> int:
-        """Add an upvote to a tag from pseudonym. Returns new upvote count.
-
-        Raises psycopg2.errors.UniqueViolation if this pseudonym already voted.
-        Raises ValueError if the tag does not exist.
-        """
-        conn = self._db.getconn()
-        try:
-            with conn.cursor() as cur:
-                cur.execute(
-                    "INSERT INTO recipe_tag_votes (tag_id, pseudonym) VALUES (%s, %s)",
-                    (tag_id, pseudonym),
-                )
-                cur.execute(
-                    "UPDATE recipe_tags SET upvotes = upvotes + 1 WHERE id = %s"
-                    " RETURNING upvotes",
-                    (tag_id,),
-                )
-                row = cur.fetchone()
-                if row is None:
-                    raise ValueError(f"recipe_tag {tag_id} not found")
-                conn.commit()
-                return row[0]
-        except Exception:
-            conn.rollback()
-            raise
-        finally:
-            self._db.putconn(conn)
-
-    def get_recipe_tag_by_id(self, tag_id: int) -> dict | None:
-        """Return a single recipe_tag row by ID, or None if not found."""
-        conn = self._db.getconn()
-        try:
-            with conn.cursor() as cur:
-                cur.execute(
-                    """
-                    SELECT id, recipe_ref, domain, category, subcategory,
-                           pseudonym, upvotes, created_at
-                    FROM recipe_tags WHERE id = %s
-                    """,
-                    (tag_id,),
-                )
-                row = cur.fetchone()
-                if row is None:
-                    return None
-                return dict(zip([d[0] for d in cur.description], row))
-        finally:
-            self._db.putconn(conn)
-
-    def list_tags_for_recipe(
-        self,
-        recipe_id: int,
-        source_product: str = "kiwi",
-    ) -> list[dict]:
-        """Return all tags for a corpus recipe, accepted or not, newest first."""
-        conn = self._db.getconn()
-        try:
-            with conn.cursor() as cur:
-                cur.execute(
-                    """
-                    SELECT id, domain, category, subcategory, pseudonym,
-                           upvotes, created_at
-                    FROM recipe_tags
-                    WHERE recipe_source = 'corpus'
-                      AND recipe_ref = %s
-                      AND source_product = %s
-                    ORDER BY upvotes DESC, created_at DESC
-                    """,
-                    (str(recipe_id), source_product),
-                )
-                cols = [d[0] for d in cur.description]
-                return [dict(zip(cols, r)) for r in cur.fetchall()]
-        finally:
-            self._db.putconn(conn)
-
-    def get_accepted_recipe_ids_for_subcategory(
-        self,
-        domain: str,
-        category: str,
-        subcategory: str | None,
-        source_product: str = "kiwi",
-        threshold: int = 2,
-    ) -> list[int]:
-        """Return corpus recipe IDs with accepted community tags for a subcategory.
-
-        Used by browse_counts_cache refresh and browse_recipes() FTS fallback.
-        Only includes tags that have reached the acceptance threshold.
-        """
-        conn = self._db.getconn()
-        try:
-            with conn.cursor() as cur:
-                if subcategory is None:
-                    cur.execute(
-                        """
-                        SELECT DISTINCT recipe_ref::INTEGER
-                        FROM recipe_tags
-                        WHERE source_product = %s
-                          AND domain = %s AND category = %s
-                          AND subcategory IS NULL
-                          AND upvotes >= %s
-                        """,
-                        (source_product, domain, category, threshold),
-                    )
-                else:
-                    cur.execute(
-                        """
-                        SELECT DISTINCT recipe_ref::INTEGER
-                        FROM recipe_tags
-                        WHERE source_product = %s
-                          AND domain = %s AND category = %s
-                          AND subcategory = %s
-                          AND upvotes >= %s
-                        """,
-                        (source_product, domain, category, subcategory, threshold),
-                    )
-                return [r[0] for r in cur.fetchall()]
-        finally:
-            self._db.putconn(conn)
--- a/circuitforge_core/config/init.py
+++ b/circuitforge_core/config/init.py
@ -1,4 +1,3 @@
 from .settings import require_env, load_env
-from .license import validate_license, get_license_tier

-__all__ = ["require_env", "load_env", "validate_license", "get_license_tier"]
+__all__ = ["require_env", "load_env"]
--- a/circuitforge_core/config/license.py
+++ b/circuitforge_core/config/license.py
@ -1,104 +0,0 @@
-"""
-License validation via Heimdall.
-
-Products call validate_license() or get_license_tier() at startup to check
-the CF_LICENSE_KEY environment variable against Heimdall.
-
-Both functions are safe to call when CF_LICENSE_KEY is absent — they return
-"free" tier gracefully rather than raising.
-
-Environment variables:
-    CF_LICENSE_KEY  — Raw license key (e.g. CFG-PRNG-XXXX-XXXX-XXXX).
-                      If absent, product runs as free tier.
-    CF_LICENSE_URL  — Heimdall base URL override.
-                      Default: https://license.circuitforge.tech
-"""
-from __future__ import annotations
-
-import logging
-import os
-import time
-
-import requests
-
-logger = logging.getLogger(__name__)
-
-_DEFAULT_HEIMDALL_URL = "https://license.circuitforge.tech"
-_CACHE_TTL_SECONDS = 1800  # 30 minutes
-
-# Cache: (key, product) -> (result_dict, expires_at)
-_cache: dict[tuple[str, str], tuple[dict[str, bool | str], float]] = {}
-
-_INVALID: dict[str, bool | str] = {"valid": False, "tier": "free", "user_id": ""}
-
-
-def _heimdall_url(override: str | None) -> str:
-    return override or os.environ.get("CF_LICENSE_URL", _DEFAULT_HEIMDALL_URL)
-
-
-def validate_license(
-    product: str,
-    min_tier: str = "free",
-    heimdall_url: str | None = None,
-) -> dict[str, bool | str]:
-    """
-    Validate CF_LICENSE_KEY against Heimdall for the given product.
-
-    Returns a dict with keys: valid (bool), tier (str), user_id (str).
-    Returns {"valid": False, "tier": "free", "user_id": ""} when:
-      - CF_LICENSE_KEY is not set
-      - Heimdall is unreachable
-      - The key is invalid/expired/revoked
-
-    Results are cached for 30 minutes per (key, product) pair.
-    """
-    key = os.environ.get("CF_LICENSE_KEY", "").strip()
-    if not key:
-        return dict(_INVALID)
-
-    cache_key = (key, product)
-    now = time.monotonic()
-    if cache_key in _cache:
-        cached_result, expires_at = _cache[cache_key]
-        if now < expires_at:
-            return dict(cached_result)
-
-    base = _heimdall_url(heimdall_url)
-    try:
-        resp = requests.post(
-            f"{base}/licenses/verify",
-            json={"key": key, "min_tier": min_tier},
-            timeout=5,
-        )
-        if not resp.ok:
-            logger.warning("[license] Heimdall returned %s for key validation", resp.status_code)
-            result = dict(_INVALID)
-        else:
-            data = resp.json()
-            result = {
-                "valid": bool(data.get("valid", False)),
-                "tier": data.get("tier", "free") or "free",
-                "user_id": data.get("user_id", "") or "",
-            }
-    except Exception as exc:
-        logger.warning("[license] License validation failed: %s", exc)
-        result = dict(_INVALID)
-
-    _cache[cache_key] = (result, now + _CACHE_TTL_SECONDS)
-    return result
-
-
-def get_license_tier(
-    product: str,
-    heimdall_url: str | None = None,
-) -> str:
-    """
-    Return the active tier for CF_LICENSE_KEY, or "free" if absent/invalid.
-
-    Convenience wrapper around validate_license() for the common case
-    where only the tier string is needed.
-    """
-    result = validate_license(product, min_tier="free", heimdall_url=heimdall_url)
-    if not result["valid"]:
-        return "free"
-    return result["tier"]
--- a/circuitforge_core/db/base.py
+++ b/circuitforge_core/db/base.py
@ -23,12 +23,8 @@ def get_connection(db_path: Path, key: str = "") -> sqlite3.Connection:
    if cloud_mode and key:
        from pysqlcipher3 import dbapi2 as _sqlcipher  # type: ignore
        conn = _sqlcipher.connect(str(db_path), timeout=30)
-        conn.execute("PRAGMA key=?", (key,))
+        conn.execute("PRAGMA key='{}'".format(key.replace("'", "''")))  # '' escapes quotes inside the SQL literal
        return conn
    # timeout=30: retry for up to 30s when another writer holds the lock (WAL mode
    # allows concurrent readers but only one writer at a time).
-    # check_same_thread=False: each Store is owned by exactly one request; FastAPI
-    # uses asyncio.to_thread() to run sync DB calls in a worker thread, crossing
-    # the thread boundary that sqlite3 guards by default. Since no two threads share
-    # the same connection, disabling the check is safe.
-    return sqlite3.connect(str(db_path), timeout=30, check_same_thread=False)
+    return sqlite3.connect(str(db_path), timeout=30)
--- a/circuitforge_core/db/migrations.py
+++ b/circuitforge_core/db/migrations.py
@ -4,22 +4,12 @@ Applies *.sql files from migrations_dir in filename order.
 Tracks applied migrations in a _migrations table — safe to call multiple times.
 """
 from __future__ import annotations
-import logging
 import sqlite3
 from pathlib import Path

-_log = logging.getLogger(__name__)
-

 def run_migrations(conn: sqlite3.Connection, migrations_dir: Path) -> None:
-    """Apply any unapplied *.sql migrations from migrations_dir.
-
-    Resilient to partial-failure recovery: if a migration previously crashed
-    mid-run (e.g. a process killed after some ALTER TABLE statements
-    auto-committed via executescript), the next startup re-runs that migration.
-    Any "duplicate column name" errors are silently skipped so the migration
-    can complete and be marked as applied.  All other errors still propagate.
-    """
+    """Apply any unapplied *.sql migrations from migrations_dir."""
    conn.execute(
        "CREATE TABLE IF NOT EXISTS _migrations "
        "(name TEXT PRIMARY KEY, applied_at TEXT DEFAULT CURRENT_TIMESTAMP)"
@ -32,92 +22,8 @@ def run_migrations(conn: sqlite3.Connection, migrations_dir: Path) -> None:
    for sql_file in sql_files:
        if sql_file.name in applied:
            continue
-
-        try:
-            conn.executescript(sql_file.read_text())
-        except sqlite3.OperationalError as exc:
-            if "duplicate column name" not in str(exc).lower():
-                raise
-            # A previous run partially applied this migration (some ALTER TABLE
-            # statements auto-committed before the failure).  Re-run with
-            # per-statement recovery to skip already-applied columns.
-            _log.warning(
-                "Migration %s: partial-failure detected (%s) — "
-                "retrying with per-statement recovery",
-                sql_file.name,
-                exc,
-            )
-            _run_script_with_recovery(conn, sql_file)
-
+        conn.executescript(sql_file.read_text())
        # OR IGNORE: safe if two Store() calls race on the same DB — second writer
        # just skips the insert rather than raising UNIQUE constraint failed.
        conn.execute("INSERT OR IGNORE INTO _migrations (name) VALUES (?)", (sql_file.name,))
        conn.commit()
-
-
-def _run_script_with_recovery(conn: sqlite3.Connection, sql_file: Path) -> None:
-    """Re-run a migration via executescript, skipping duplicate-column errors.
-
-    Used only when the first executescript() attempt raised a duplicate column
-    error (indicating a previous partial run).  Splits the script on the
-    double-dash comment prefix pattern to re-issue each logical statement,
-    catching only the known-safe "duplicate column name" error class.
-
-    Splitting is done via SQLite's own parser — we feed the script to a
-    temporary in-memory connection using executescript (which commits
-    auto-matically per DDL statement) and mirror the results on the real
-    connection statement by statement.  That's circular, so instead we use
-    the simpler approach: executescript handles tokenization; we wrap the
-    whole call in a try/except and retry after removing the offending statement.
-
-    Simpler approach: use conn.execute() per statement from the script.
-    This avoids the semicolon-in-comment tokenization problem by not splitting
-    ourselves — instead we let the DB tell us which statement failed and only
-    skip that exact error class.
-    """
-    # executescript() uses SQLite's real tokenizer, so re-issuing it after a
-    # partial failure will hit "duplicate column name" again.  We catch and
-    # ignore that specific error class only, re-running until the script
-    # completes or a different error is raised.
-    #
-    # Implementation: issue the whole script again; catch duplicate-column
-    # errors; keep trying.  Since executescript auto-commits per statement,
-    # each successful statement in successive retries is a no-op (CREATE TABLE
-    # IF NOT EXISTS, etc.) or a benign duplicate skip.
-    #
-    # Limit retries to prevent infinite loops on genuinely broken SQL.
-    script = sql_file.read_text()
-    for attempt in range(20):
-        try:
-            conn.executescript(script)
-            return  # success
-        except sqlite3.OperationalError as exc:
-            msg = str(exc).lower()
-            if "duplicate column name" in msg:
-                col = str(exc).split(":")[-1].strip() if ":" in str(exc) else "?"
-                _log.warning(
-                    "Migration %s (attempt %d): skipping duplicate column '%s'",
-                    sql_file.name,
-                    attempt + 1,
-                    col,
-                )
-                # Remove the offending ALTER TABLE statement from the script
-                # so the next attempt skips it.  This is safe because SQLite
-                # already auto-committed that column addition on a prior run.
-                script = _remove_column_add(script, col)
-            else:
-                raise
-    raise RuntimeError(
-        f"Migration {sql_file.name}: could not complete after 20 recovery attempts"
-    )
-
-
-def _remove_column_add(script: str, column: str) -> str:
-    """Remove the ALTER TABLE ADD COLUMN statement for *column* from *script*."""
-    import re
-    # Match: ALTER TABLE <tbl> ADD COLUMN <column> <rest-of-line>
-    pattern = re.compile(
-        r"ALTER\s+TABLE\s+\w+\s+ADD\s+COLUMN\s+" + re.escape(column) + r"[^\n]*\n?",
-        re.IGNORECASE,
-    )
-    return pattern.sub("", script)
--- a/circuitforge_core/documents/init.py
+++ b/circuitforge_core/documents/init.py
@ -1,18 +0,0 @@
-"""
-circuitforge_core.documents — shared document ingestion pipeline.
-
-Primary entry point::
-
-    from circuitforge_core.documents import ingest, StructuredDocument
-
-    doc: StructuredDocument = ingest(image_bytes, hint="auto")
-"""
-from .ingest import ingest
-from .models import Element, ParsedTable, StructuredDocument
-
-__all__ = [
-    "ingest",
-    "Element",
-    "ParsedTable",
-    "StructuredDocument",
-]
--- a/circuitforge_core/documents/client.py
+++ b/circuitforge_core/documents/client.py
@ -1,84 +0,0 @@
-"""
-circuitforge_core.documents.client — HTTP client for the cf-docuvision service.
-
-Thin wrapper around the cf-docuvision FastAPI service's POST /extract endpoint.
-Used by ingest() as the primary path; callers should not use this directly.
-"""
-from __future__ import annotations
-
-import base64
-import logging
-from typing import Any
-
-import requests
-
-from .models import Element, ParsedTable, StructuredDocument
-
-logger = logging.getLogger(__name__)
-
-_DEFAULT_TIMEOUT_S = 60
-
-
-class DocuvisionClient:
-    """Synchronous HTTP client for cf-docuvision.
-
-    Args:
-        base_url: Root URL of the cf-docuvision service, e.g. 'http://localhost:8003'
-        timeout:  Request timeout in seconds.
-    """
-
-    def __init__(self, base_url: str = "http://localhost:8003", timeout: int = _DEFAULT_TIMEOUT_S) -> None:
-        self.base_url = base_url.rstrip("/")
-        self.timeout = timeout
-
-    def is_healthy(self) -> bool:
-        """Return True if the service responds to GET /health."""
-        try:
-            resp = requests.get(f"{self.base_url}/health", timeout=3)
-            return resp.status_code == 200
-        except Exception:
-            return False
-
-    def extract(self, image_bytes: bytes, hint: str = "auto") -> StructuredDocument:
-        """
-        Submit image bytes to cf-docuvision and return a StructuredDocument.
-
-        Raises:
-            requests.HTTPError: if the service returns a non-2xx status.
-            requests.ConnectionError / requests.Timeout: if the service is unreachable.
-        """
-        payload = {
-            "image_b64": base64.b64encode(image_bytes).decode(),
-            "hint": hint,
-        }
-        resp = requests.post(
-            f"{self.base_url}/extract",
-            json=payload,
-            timeout=self.timeout,
-        )
-        resp.raise_for_status()
-        return _parse_response(resp.json())
-
-
-def _parse_response(data: dict[str, Any]) -> StructuredDocument:
-    elements = [
-        Element(
-            type=e["type"],
-            text=e["text"],
-            bbox=tuple(e["bbox"]) if e.get("bbox") else None,
-        )
-        for e in data.get("elements", [])
-    ]
-    tables = [
-        ParsedTable(
-            html=t["html"],
-            bbox=tuple(t["bbox"]) if t.get("bbox") else None,
-        )
-        for t in data.get("tables", [])
-    ]
-    return StructuredDocument(
-        elements=elements,
-        raw_text=data.get("raw_text", ""),
-        tables=tables,
-        metadata=data.get("metadata", {}),
-    )
--- a/circuitforge_core/documents/ingest.py
+++ b/circuitforge_core/documents/ingest.py
@ -1,137 +0,0 @@
-"""
-circuitforge_core.documents.ingest — public document ingestion entry point.
-
-Primary path: cf-docuvision HTTP service (Dolphin-v2, layout-aware).
-Fallback path: LLMRouter vision call (lower fidelity, no layout/bbox).
-
-Usage::
-
-    from circuitforge_core.documents import ingest
-
-    with open("receipt.jpg", "rb") as f:
-        doc = ingest(f.read(), hint="table")
-
-    print(doc.raw_text)
-    for table in doc.tables:
-        print(table.html)
-"""
-from __future__ import annotations
-
-import base64
-import logging
-import os
-from typing import Any
-
-from .client import DocuvisionClient
-from .models import Element, StructuredDocument
-
-logger = logging.getLogger(__name__)
-
-_DOCUVISION_URL_ENV = "CF_DOCUVISION_URL"
-_DOCUVISION_URL_DEFAULT = "http://localhost:8003"
-
-_LLM_FALLBACK_PROMPTS: dict[str, str] = {
-    "auto":  "Extract all text from this document. Return a JSON array of {\"type\": ..., \"text\": ...} objects.",
-    "table": "Extract all tables from this document as HTML. Return a JSON array including {\"type\": \"table\", \"html\": ..., \"text\": ...} objects.",
-    "text":  "Extract all text from this document preserving headings and paragraphs. Return a JSON array of {\"type\": ..., \"text\": ...} objects.",
-    "form":  "Extract all form field labels and values from this document. Return a JSON array of {\"type\": ..., \"text\": ...} objects.",
-}
-
-
-def ingest(
-    image_bytes: bytes,
-    hint: str = "auto",
-    *,
-    docuvision_url: str | None = None,
-    llm_router: Any | None = None,
-    llm_config_path: Any | None = None,
-) -> StructuredDocument:
-    """
-    Ingest an image and return a StructuredDocument.
-
-    Tries cf-docuvision first; falls back to LLMRouter vision if the service is
-    unavailable or fails. If neither is available, returns an empty document.
-
-    Args:
-        image_bytes:      Raw bytes of the image (JPEG, PNG, etc.).
-        hint:             Extraction mode: "auto" | "table" | "text" | "form".
-        docuvision_url:   Override service URL (defaults to CF_DOCUVISION_URL env or localhost:8003).
-        llm_router:       Pre-built LLMRouter instance for fallback (optional).
-        llm_config_path:  Path to llm.yaml for lazy-constructing LLMRouter if needed.
-
-    Returns:
-        StructuredDocument — always, even on total failure (empty document).
-    """
-    url = docuvision_url or os.environ.get(_DOCUVISION_URL_ENV, _DOCUVISION_URL_DEFAULT)
-    client = DocuvisionClient(base_url=url)
-
-    # ── primary: cf-docuvision ────────────────────────────────────────────────
-    try:
-        if client.is_healthy():
-            doc = client.extract(image_bytes, hint=hint)
-            logger.debug("ingest: cf-docuvision succeeded (%d elements)", len(doc.elements))
-            return doc
-        logger.debug("ingest: cf-docuvision unhealthy, falling back to LLM")
-    except Exception as exc:
-        logger.warning("ingest: cf-docuvision failed (%s), falling back to LLM", exc)
-
-    # ── fallback: LLMRouter vision ────────────────────────────────────────────
-    router = llm_router or _build_llm_router(llm_config_path)
-    if router is None:
-        logger.warning("ingest: no LLM router available; returning empty document")
-        return StructuredDocument(metadata={"source": "none", "hint": hint})
-
-    try:
-        return _llm_ingest(router, image_bytes, hint)
-    except Exception as exc:
-        logger.warning("ingest: LLM fallback failed (%s); returning empty document", exc)
-        return StructuredDocument(metadata={"source": "llm_error", "hint": hint, "error": str(exc)})
-
-
-# ── helpers ───────────────────────────────────────────────────────────────────
-
-def _build_llm_router(config_path: Any | None) -> Any | None:
-    """Lazily construct an LLMRouter; return None if unavailable."""
-    try:
-        from circuitforge_core.llm import LLMRouter
-        kwargs: dict[str, Any] = {}
-        if config_path is not None:
-            kwargs["config_path"] = config_path
-        return LLMRouter(**kwargs)
-    except Exception as exc:
-        logger.debug("ingest: could not build LLMRouter: %s", exc)
-        return None
-
-
-def _llm_ingest(router: Any, image_bytes: bytes, hint: str) -> StructuredDocument:
-    """Use LLMRouter's vision capability to extract document text."""
-    import json
-
-    prompt = _LLM_FALLBACK_PROMPTS.get(hint, _LLM_FALLBACK_PROMPTS["auto"])
-    b64 = base64.b64encode(image_bytes).decode()
-
-    raw = router.generate_vision(
-        prompt=prompt,
-        image_b64=b64,
-    )
-
-    # Try to parse structured output; fall back to single paragraph
-    elements: list[Element] = []
-    try:
-        parsed = json.loads(raw)
-        if isinstance(parsed, list):
-            for item in parsed:
-                elements.append(Element(
-                    type=item.get("type", "paragraph"),
-                    text=item.get("text", ""),
-                ))
-    except (json.JSONDecodeError, TypeError):
-        elements = [Element(type="paragraph", text=raw.strip())]
-
-    raw_text = "\n".join(e.text for e in elements)
-    return StructuredDocument(
-        elements=elements,
-        raw_text=raw_text,
-        tables=[],
-        metadata={"source": "llm_fallback", "hint": hint},
-    )
--- a/circuitforge_core/documents/models.py
+++ b/circuitforge_core/documents/models.py
@ -1,53 +0,0 @@
-"""
-circuitforge_core.documents.models — shared document data types.
-
-These are the canonical output types from the document ingestion pipeline.
-All consumers (kiwi, falcon, peregrine, godwit, …) receive a StructuredDocument
-regardless of whether Dolphin-v2 or LLM fallback was used.
-"""
-from __future__ import annotations
-
-from dataclasses import dataclass, field
-from typing import Any
-
-
-@dataclass(frozen=True)
-class Element:
-    """A single logical content unit within a document.
-
-    type: one of heading | paragraph | list | table | figure | formula | code
-    text: extracted plain text (for tables: may be row summary or empty)
-    bbox: normalised [x0, y0, x1, y1] in 0-1 space, None when unavailable
-    """
-    type: str
-    text: str
-    bbox: tuple[float, float, float, float] | None = None
-
-
-@dataclass(frozen=True)
-class ParsedTable:
-    """An extracted table rendered as HTML."""
-    html: str
-    bbox: tuple[float, float, float, float] | None = None
-
-
-@dataclass
-class StructuredDocument:
-    """
-    The canonical result of document ingestion.
-
-    Produced by ingest() for any input image regardless of which backend
-    (cf-docuvision or LLM fallback) processed it.
-    """
-    elements: list[Element] = field(default_factory=list)
-    raw_text: str = ""
-    tables: list[ParsedTable] = field(default_factory=list)
-    metadata: dict[str, Any] = field(default_factory=dict)
-
-    @property
-    def headings(self) -> list[Element]:
-        return [e for e in self.elements if e.type == "heading"]
-
-    @property
-    def paragraphs(self) -> list[Element]:
-        return [e for e in self.elements if e.type == "paragraph"]
--- a/circuitforge_core/documents/pdf.py
+++ b/circuitforge_core/documents/pdf.py
@ -1,133 +0,0 @@
-# circuitforge_core/documents/pdf.py
-"""
-circuitforge_core.documents.pdf — PDF text extraction and page-level chunking.
-
-Primary path: pdfplumber (selectable text layers).
-Fallback: pytesseract OCR (scanned / image-only pages).
-
-Usage::
-
-    from circuitforge_core.documents.pdf import PDFExtractor
-
-    chunks = PDFExtractor().chunk_pages("/path/to/book.pdf")
-    for chunk in chunks:
-        print(f"[p.{chunk.page_number}] ({chunk.source}) {chunk.text[:80]}")
-"""
-
-from __future__ import annotations
-
-import io
-import logging
-from dataclasses import dataclass
-from pathlib import Path
-
-logger = logging.getLogger(__name__)
-
-try:
-    import pdfplumber
-except ImportError:  # pragma: no cover
-    pdfplumber = None  # type: ignore[assignment]
-
-try:
-    import pytesseract
-except ImportError:  # pragma: no cover
-    pytesseract = None  # type: ignore[assignment]
-
-try:
-    from PIL import Image
-except ImportError:  # pragma: no cover
-    Image = None  # type: ignore[assignment]
-
-
-@dataclass(frozen=True)
-class PageChunk:
-    """Text content extracted from a single PDF page."""
-
-    page_number: int  # 1-indexed
-    text: str
-    source: str  # "text_layer" | "ocr"
-    word_count: int
-
-
-class PDFExtractor:
-    """
-    Extract page-level text chunks from PDF files.
-
-    Args:
-        ocr_min_words: Pages with fewer words from the text layer trigger OCR.
-    """
-
-    def __init__(self, ocr_min_words: int = 10) -> None:
-        self.ocr_min_words = ocr_min_words
-
-    def chunk_pages(self, pdf_path: str | Path) -> list[PageChunk]:
-        """
-        Primary entry point. Returns one PageChunk per page.
-
-        Uses text-layer extraction per page; falls back to OCR when text is sparse.
-        Empty PDFs return an empty list.
-        """
-        if pdfplumber is None:
-            raise ImportError(
-                "pdfplumber is required for PDF extraction. "
-                "Install it with: pip install pdfplumber"
-            )
-
-        path = Path(pdf_path)
-        chunks: list[PageChunk] = []
-
-        with pdfplumber.open(path) as pdf:
-            for i, page in enumerate(pdf.pages, start=1):
-                text = page.extract_text() or ""
-                words = text.split()
-
-                if len(words) >= self.ocr_min_words:
-                    chunks.append(
-                        PageChunk(
-                            page_number=i,
-                            text=text.strip(),
-                            source="text_layer",
-                            word_count=len(words),
-                        )
-                    )
-                else:
-                    logger.debug(
-                        "pdf: page %d sparse (%d words), falling back to OCR",
-                        i,
-                        len(words),
-                    )
-                    chunks.append(self._ocr_page(page, i))
-
-        return chunks
-
-    def _ocr_page(self, page: object, page_number: int) -> PageChunk:
-        """Render page to image and extract text via tesseract."""
-        try:
-            rendered = page.to_image(resolution=200).original  # type: ignore[attr-defined]
-            rendered = _ensure_pil_image(rendered)
-            text = pytesseract.image_to_string(rendered)  # type: ignore[union-attr]
-            words = text.split()
-            return PageChunk(
-                page_number=page_number,
-                text=text.strip(),
-                source="ocr",
-                word_count=len(words),
-            )
-        except Exception as exc:
-            logger.warning("pdf: OCR failed for page %d: %s", page_number, exc)
-            return PageChunk(
-                page_number=page_number, text="", source="ocr", word_count=0
-            )
-
-
-def _ensure_pil_image(rendered: object) -> object:
-    """Return *rendered* as a PIL Image, converting from bytes if needed."""
-    if Image is None:
-        return rendered
-    try:
-        if not isinstance(rendered, Image.Image):
-            rendered = Image.open(io.BytesIO(rendered))  # type: ignore[arg-type]
-    except TypeError:
-        # Image may be patched (e.g. in tests); skip the conversion.
-        pass
-    return rendered
--- a/circuitforge_core/hardware/init.py
+++ b/circuitforge_core/hardware/init.py
@ -1,34 +0,0 @@
-# circuitforge_core/hardware/__init__.py
-"""
-Hardware detection and LLM profile generation.
-
-Typical usage::
-
-    from circuitforge_core.hardware import detect_hardware, generate_profile
-    import yaml
-
-    spec = detect_hardware()
-    config = generate_profile(spec)
-    print(yaml.dump(config.to_dict()))
-    print("Recommended profile:", config.profile_name)
-"""
-from .detect import detect_hardware, detect_hardware_json
-from .generator import generate_profile
-from .models import HardwareSpec, LLMBackendConfig, LLMConfig
-from .tiers import VRAM_TIERS, VramTier, select_tier
-from .vram_estimate import ModelVramLookupError, VramEstimate, model_vram_estimate
-
-__all__ = [
-    "detect_hardware",
-    "detect_hardware_json",
-    "generate_profile",
-    "HardwareSpec",
-    "LLMBackendConfig",
-    "LLMConfig",
-    "VRAM_TIERS",
-    "VramTier",
-    "select_tier",
-    "ModelVramLookupError",
-    "VramEstimate",
-    "model_vram_estimate",
-]
--- a/circuitforge_core/hardware/detect.py
+++ b/circuitforge_core/hardware/detect.py
@ -1,196 +0,0 @@
-# circuitforge_core/hardware/detect.py
-"""
-Cross-platform hardware auto-detection.
-
-Reads GPU info from:
-  - nvidia-smi     (NVIDIA, Linux/Windows)
-  - rocm-smi       (AMD, Linux)
-  - system_profiler (Apple Silicon, macOS)
-  - /proc/meminfo  (Linux RAM)
-  - psutil         (cross-platform RAM fallback)
-
-Returns a HardwareSpec. On detection failure, returns a conservative
-CPU-only spec so callers always get a usable result.
-"""
-from __future__ import annotations
-
-import json
-import platform
-import re
-import subprocess
-import sys
-from pathlib import Path
-
-from .models import HardwareSpec
-
-
-def _run(*args: str, timeout: int = 5) -> str:
-    """Run a subprocess and return stdout, or empty string on any error."""
-    try:
-        result = subprocess.run(
-            list(args), capture_output=True, text=True, timeout=timeout
-        )
-        return result.stdout.strip()
-    except Exception:
-        return ""
-
-
-def _ram_mb() -> int:
-    """Return total system RAM in MB."""
-    # psutil is optional but preferred
-    try:
-        import psutil  # type: ignore[import-untyped]
-        return psutil.virtual_memory().total // (1024 * 1024)
-    except ImportError:
-        pass
-
-    # Linux /proc/meminfo fallback
-    mem_info = Path("/proc/meminfo")
-    if mem_info.exists():
-        for line in mem_info.read_text().splitlines():
-            if line.startswith("MemTotal:"):
-                kb = int(line.split()[1])
-                return kb // 1024
-
-    return 0
-
-
-def _detect_nvidia() -> tuple[int, int, str, str, str] | None:
-    """
-    Returns (vram_mb, gpu_count, gpu_name, cuda_version, vendor) or None.
-    Uses nvidia-smi --query-gpu for reliable machine-parseable output.
-    """
-    out = _run(
-        "nvidia-smi",
-        "--query-gpu=name,memory.total",
-        "--format=csv,noheader,nounits",
-    )
-    if not out:
-        return None
-
-    lines = [l.strip() for l in out.splitlines() if l.strip()]
-    if not lines:
-        return None
-
-    gpu_count = len(lines)
-    # Use the first GPU's VRAM as the representative value
-    parts = lines[0].split(",")
-    if len(parts) < 2:
-        return None
-
-    gpu_name = parts[0].strip()
-    try:
-        vram_mb = int(parts[1].strip())
-    except ValueError:
-        return None
-
-    # CUDA version from nvidia-smi header
-    header = _run("nvidia-smi", "--query", "--display=COMPUTE")
-    cuda_match = re.search(r"CUDA Version\s*:\s*([\d.]+)", header)
-    cuda_version = cuda_match.group(1) if cuda_match else ""
-
-    return vram_mb, gpu_count, gpu_name, cuda_version, "nvidia"
-
-
-def _detect_amd() -> tuple[int, int, str, str, str] | None:
-    """Returns (vram_mb, gpu_count, gpu_name, rocm_version, vendor) or None."""
-    out = _run("rocm-smi", "--showmeminfo", "vram", "--json")
-    if not out:
-        return None
-
-    try:
-        data = json.loads(out)
-    except json.JSONDecodeError:
-        return None
-
-    cards = [k for k in data if k.startswith("card")]
-    if not cards:
-        return None
-
-    gpu_count = len(cards)
-    first = data[cards[0]]
-    try:
-        vram_mb = int(first.get("VRAM Total Memory (B)", 0)) // (1024 * 1024)
-    except (ValueError, TypeError):
-        return None
-
-    gpu_name = first.get("Card series", "AMD GPU")
-    rocm_out = _run("rocminfo")
-    rocm_match = re.search(r"ROCm Runtime Version\s*:\s*([\d.]+)", rocm_out)
-    rocm_version = rocm_match.group(1) if rocm_match else ""
-
-    return vram_mb, gpu_count, gpu_name, rocm_version, "amd"
-
-
-def _detect_apple() -> tuple[int, int, str, str, str] | None:
-    """
-    Returns (unified_ram_mb, 1, gpu_name, '', 'apple') or None.
-    Apple Silicon shares RAM between CPU and GPU; we report total RAM as VRAM.
-    """
-    if platform.system() != "Darwin":
-        return None
-
-    # Check for Apple Silicon
-    arm_check = _run("sysctl", "-n", "hw.optional.arm64")
-    if arm_check.strip() != "1":
-        return None
-
-    out = _run("system_profiler", "SPHardwareDataType", "-json")
-    try:
-        data = json.loads(out)
-        hw = data["SPHardwareDataType"][0]
-        chip = hw.get("chip_type", "Apple Silicon")
-        ram_str = hw.get("physical_memory", "0 GB")
-        ram_gb = int(re.search(r"(\d+)", ram_str).group(1))  # type: ignore[union-attr]
-        vram_mb = ram_gb * 1024  # unified memory
-    except Exception:
-        return None
-
-    return vram_mb, 1, chip, "", "apple"
-
-
-def detect_hardware() -> HardwareSpec:
-    """
-    Auto-detect hardware and return a HardwareSpec.
-
-    Detection order: NVIDIA → AMD → Apple → CPU fallback.
-    Never raises — returns a CPU-only spec on any detection failure.
-    """
-    ram_mb = _ram_mb()
-
-    for detector in (_detect_nvidia, _detect_amd, _detect_apple):
-        try:
-            result = detector()
-        except Exception:
-            result = None
-        if result is not None:
-            vram_mb, gpu_count, gpu_name, version, vendor = result
-            return HardwareSpec(
-                vram_mb=vram_mb,
-                ram_mb=ram_mb,
-                gpu_count=gpu_count,
-                gpu_vendor=vendor,
-                gpu_name=gpu_name,
-                cuda_version=version if vendor == "nvidia" else "",
-                rocm_version=version if vendor == "amd" else "",
-            )
-
-    # CPU-only fallback
-    return HardwareSpec(
-        vram_mb=0,
-        ram_mb=ram_mb,
-        gpu_count=0,
-        gpu_vendor="cpu",
-        gpu_name="",
-    )
-
-
-def detect_hardware_json() -> str:
-    """Return detect_hardware() result as a JSON string (for CLI / one-liner use)."""
-    import dataclasses
-    spec = detect_hardware()
-    return json.dumps(dataclasses.asdict(spec), indent=2)
-
-
-if __name__ == "__main__":
-    print(detect_hardware_json())
--- a/circuitforge_core/hardware/generator.py
+++ b/circuitforge_core/hardware/generator.py
@ -1,91 +0,0 @@
-# circuitforge_core/hardware/generator.py
-"""
-Profile generator: HardwareSpec → LLMConfig.
-
-`generate_profile()` is the main entry point. It selects the appropriate
-VRAM tier, builds a complete LLMConfig dict ready to write as llm.yaml,
-and returns the matching public GpuProfile name for orch use.
-"""
-from __future__ import annotations
-
-from .models import HardwareSpec, LLMBackendConfig, LLMConfig
-from .tiers import select_tier
-
-
-# Default backend URLs — overridable for non-standard setups
-_OLLAMA_URL = "http://localhost:11434"
-_VLLM_URL = "http://localhost:8000"
-_VISION_URL = "http://localhost:8002"
-_DOCUVISION_URL = "http://localhost:8003"
-
-
-def generate_profile(
-    spec: HardwareSpec,
-    *,
-    ollama_url: str = _OLLAMA_URL,
-    vllm_url: str = _VLLM_URL,
-    vision_url: str = _VISION_URL,
-    docuvision_url: str = _DOCUVISION_URL,
-) -> LLMConfig:
-    """
-    Map a HardwareSpec to an LLMConfig.
-
-    Returns an LLMConfig whose `profile_name` matches a public GpuProfile YAML
-    in `circuitforge_core/resources/profiles/public/` so the orch can load the
-    correct service allocation profile automatically.
-    """
-    tier = select_tier(spec.vram_mb)
-    has_vllm = "vllm" in tier.services
-    has_vision = "cf-vision" in tier.services
-    has_docuvision = "cf-docuvision" in tier.services
-
-    backends: dict[str, LLMBackendConfig] = {}
-
-    # Ollama is always available (CPU fallback)
-    backends["ollama"] = LLMBackendConfig(
-        enabled=True,
-        url=ollama_url,
-        model=tier.ollama_model,
-    )
-
-    # vllm — only on GPU tiers that can fit a model
-    if has_vllm and tier.vllm_candidates:
-        backends["vllm"] = LLMBackendConfig(
-            enabled=True,
-            url=vllm_url,
-            model_candidates=list(tier.vllm_candidates),
-        )
-
-    # Vision service
-    if has_vision:
-        backends["vision_service"] = LLMBackendConfig(
-            enabled=True,
-            url=vision_url,
-        )
-
-    # Docuvision service
-    if has_docuvision:
-        backends["docuvision_service"] = LLMBackendConfig(
-            enabled=True,
-            url=docuvision_url,
-        )
-
-    # Fallback order: prefer vllm over ollama when available (faster for batch)
-    if has_vllm:
-        fallback = ["vllm", "ollama"]
-        research_fallback = ["vllm", "ollama"]
-    else:
-        fallback = ["ollama"]
-        research_fallback = ["ollama"]
-
-    vision_fallback = (
-        ["vision_service"] if has_vision else []
-    ) + ["ollama"]
-
-    return LLMConfig(
-        profile_name=tier.profile_name,
-        backends=backends,
-        fallback_order=fallback,
-        research_fallback_order=research_fallback,
-        vision_fallback_order=vision_fallback,
-    )
--- a/circuitforge_core/hardware/models.py
+++ b/circuitforge_core/hardware/models.py
@ -1,60 +0,0 @@
-# circuitforge_core/hardware/models.py
-"""Data models for hardware detection and LLM configuration output."""
-from __future__ import annotations
-
-from dataclasses import dataclass, field
-from typing import Any
-
-
-@dataclass(frozen=True)
-class HardwareSpec:
-    """Describes a user's hardware as detected or manually entered."""
-
-    vram_mb: int          # total VRAM per primary GPU (0 = CPU-only)
-    ram_mb: int           # total system RAM
-    gpu_count: int        # number of GPUs
-    gpu_vendor: str       # "nvidia" | "amd" | "apple" | "cpu"
-    gpu_name: str = ""    # human-readable card name, e.g. "RTX 4080"
-    cuda_version: str = ""   # e.g. "12.4" (empty if not CUDA)
-    rocm_version: str = ""   # e.g. "5.7" (empty if not ROCm)
-
-
-@dataclass
-class LLMBackendConfig:
-    """Configuration for a single LLM backend."""
-
-    enabled: bool
-    url: str
-    model: str = ""
-    model_candidates: list[str] = field(default_factory=list)
-
-    def to_dict(self) -> dict[str, Any]:
-        d: dict[str, Any] = {"enabled": self.enabled, "url": self.url}
-        if self.model:
-            d["model"] = self.model
-        if self.model_candidates:
-            d["model_candidates"] = self.model_candidates
-        return d
-
-
-@dataclass
-class LLMConfig:
-    """
-    Ready-to-serialize llm.yaml configuration.
-
-    Matches the schema consumed by LLMRouter in circuitforge products.
-    """
-
-    profile_name: str       # e.g. "single-gpu-8gb" — matches a public GpuProfile
-    backends: dict[str, LLMBackendConfig] = field(default_factory=dict)
-    fallback_order: list[str] = field(default_factory=list)
-    research_fallback_order: list[str] = field(default_factory=list)
-    vision_fallback_order: list[str] = field(default_factory=list)
-
-    def to_dict(self) -> dict[str, Any]:
-        return {
-            "backends": {k: v.to_dict() for k, v in self.backends.items()},
-            "fallback_order": self.fallback_order,
-            "research_fallback_order": self.research_fallback_order,
-            "vision_fallback_order": self.vision_fallback_order,
-        }
--- a/circuitforge_core/hardware/tiers.py
+++ b/circuitforge_core/hardware/tiers.py
@ -1,104 +0,0 @@
-# circuitforge_core/hardware/tiers.py
-"""
-VRAM tier ladder and model catalog.
-
-Tiers map hardware VRAM (per-GPU) to:
-  - profile_name: matching public GpuProfile YAML in profiles/public/
-  - ollama_model:  best default Ollama model for this tier
-  - vllm_candidates: ordered list of HF model dirs to try via cf-orch/vllm
-  - services: which cf-* managed services are available at this tier
-  - llm_max_params: rough upper bound, for human-readable display
-"""
-from __future__ import annotations
-
-from dataclasses import dataclass, field
-
-
-@dataclass(frozen=True)
-class VramTier:
-    vram_min_mb: int        # inclusive lower bound (0 = CPU-only)
-    vram_max_mb: int        # exclusive upper bound (use sys.maxsize for the top tier)
-    profile_name: str       # public GpuProfile YAML stem
-    ollama_model: str       # e.g. "qwen2.5:7b-instruct-q4_k_m"
-    vllm_candidates: list[str] = field(default_factory=list)
-    services: list[str] = field(default_factory=list)
-    llm_max_params: str = ""   # human-readable, e.g. "7b-q4"
-
-
-# Ordered from smallest to largest — first match wins in select_tier().
-VRAM_TIERS: list[VramTier] = [
-    VramTier(
-        vram_min_mb=0,
-        vram_max_mb=1,
-        profile_name="cpu-16gb",
-        ollama_model="qwen2.5:1.5b-instruct-q4_k_m",
-        vllm_candidates=[],
-        services=["ollama", "cf-stt", "cf-tts"],
-        llm_max_params="3b-q4",
-    ),
-    VramTier(
-        vram_min_mb=1,
-        vram_max_mb=3_000,
-        profile_name="single-gpu-2gb",
-        ollama_model="qwen2.5:1.5b-instruct-q4_k_m",
-        vllm_candidates=[],
-        services=["ollama"],
-        llm_max_params="1.5b",
-    ),
-    VramTier(
-        vram_min_mb=3_000,
-        vram_max_mb=5_000,
-        profile_name="single-gpu-4gb",
-        ollama_model="qwen2.5:3b-instruct-q4_k_m",
-        vllm_candidates=[],
-        services=["ollama", "cf-vision", "cf-stt", "cf-tts"],
-        llm_max_params="3b",
-    ),
-    VramTier(
-        vram_min_mb=5_000,
-        vram_max_mb=7_000,
-        profile_name="single-gpu-6gb",
-        ollama_model="qwen2.5:7b-instruct-q4_k_m",
-        vllm_candidates=["Qwen2.5-3B-Instruct", "Phi-4-mini-instruct"],
-        services=["ollama", "vllm", "cf-vision", "cf-docuvision", "cf-stt", "cf-tts"],
-        llm_max_params="7b-q4",
-    ),
-    VramTier(
-        vram_min_mb=7_000,
-        vram_max_mb=12_000,
-        profile_name="single-gpu-8gb",
-        ollama_model="qwen2.5:7b-instruct",
-        vllm_candidates=["Qwen2.5-3B-Instruct", "Phi-4-mini-instruct"],
-        services=["ollama", "vllm", "cf-vision", "cf-docuvision", "cf-stt", "cf-tts", "cf-musicgen"],
-        llm_max_params="8b",
-    ),
-    VramTier(
-        vram_min_mb=12_000,
-        vram_max_mb=20_000,
-        profile_name="single-gpu-16gb",
-        ollama_model="qwen2.5:14b-instruct-q4_k_m",
-        vllm_candidates=["Qwen2.5-14B-Instruct", "Qwen2.5-3B-Instruct", "Phi-4-mini-instruct"],
-        services=["ollama", "vllm", "cf-vision", "cf-docuvision", "cf-stt", "cf-tts",
-                  "cf-musicgen", "cf-embed", "cf-classify"],
-        llm_max_params="14b",
-    ),
-    VramTier(
-        vram_min_mb=20_000,
-        vram_max_mb=10 ** 9,
-        profile_name="single-gpu-24gb",
-        ollama_model="qwen2.5:32b-instruct-q4_k_m",
-        vllm_candidates=["Qwen2.5-14B-Instruct", "Qwen2.5-3B-Instruct", "Phi-4-mini-instruct"],
-        services=["ollama", "vllm", "cf-vision", "cf-docuvision", "cf-stt", "cf-tts",
-                  "cf-musicgen", "cf-embed", "cf-classify", "comfyui"],
-        llm_max_params="32b-q4",
-    ),
-]
-
-
-def select_tier(vram_mb: int) -> VramTier:
-    """Return the best matching tier for the given per-GPU VRAM in MB."""
-    for tier in VRAM_TIERS:
-        if tier.vram_min_mb <= vram_mb < tier.vram_max_mb:
-            return tier
-    # Fallback: return the top tier for unusually large VRAM
-    return VRAM_TIERS[-1]
--- a/circuitforge_core/hardware/vram_estimate.py
+++ b/circuitforge_core/hardware/vram_estimate.py
@ -1,185 +0,0 @@
-# circuitforge_core/hardware/vram_estimate.py
-"""
-Model VRAM fit estimation — cf-core #64.
-
-`cf_core.hardware` can detect available VRAM but has no way to answer "can this
-hardware run model X at quantization level Y?". This module closes that gap by
-querying the HuggingFace Hub API for parameter count and architecture, then
-applying the standard VRAM estimation formula:
-
-    vram_gb = params * bytes_per_param(quant) + kv_cache_gb(ctx_len, arch) + overhead_gb
-
-The formula is the reference algorithm used by LLMcalc
-(https://github.com/Raskoll2/LLMcalc, no license — algorithm reference only,
-not a dependency). No LLMcalc code is copied here.
-"""
-from __future__ import annotations
-
-from dataclasses import dataclass
-
-import requests
-
-_HF_API_MODEL_URL = "https://huggingface.co/api/models/{model_id}"
-_HF_CONFIG_URL = "https://huggingface.co/{model_id}/resolve/main/config.json"
-
-_DEFAULT_OVERHEAD_GB = 0.6  # CUDA context + activation buffers, rough constant
-_KV_CACHE_DTYPE_BYTES = 2  # KV cache is stored fp16 in the common case
-
-# Bits per parameter for common quantization levels (weights-only, excludes KV cache).
-_QUANT_BITS: dict[str, float] = {
-    "fp32": 32.0,
-    "fp16": 16.0,
-    "bf16": 16.0,
-    "int8": 8.0,
-    "q8": 8.0,
-    "q8_0": 8.0,
-    "q6_k": 6.0,
-    "q5_k_m": 5.0,
-    "q5_0": 5.0,
-    "int4": 4.0,
-    "q4": 4.0,
-    "q4_k_m": 4.0,
-    "q4_0": 4.0,
-    "q3_k_m": 3.0,
-    "q2_k": 2.0,
-}
-
-
-class ModelVramLookupError(RuntimeError):
-    """Raised when the HuggingFace Hub API can't supply data needed to estimate VRAM."""
-
-
-@dataclass(frozen=True)
-class VramEstimate:
-    """Result of a `model_vram_estimate()` call."""
-
-    hf_model_id: str
-    quant_level: str
-    params_billions: float
-    weights_gb: float
-    kv_cache_gb: float
-    overhead_gb: float
-    total_vram_gb: float
-    fits: bool | None  # None when available_vram_mb wasn't supplied
-
-
-def _quant_bits(quant_level: str) -> float:
-    key = quant_level.strip().lower()
-    try:
-        return _QUANT_BITS[key]
-    except KeyError:
-        raise ValueError(
-            f"Unknown quant_level {quant_level!r}. Known levels: {sorted(_QUANT_BITS)}"
-        ) from None
-
-
-def _fetch_param_count(hf_model_id: str, *, timeout: float) -> float:
-    """Return total parameter count via the HF Hub API's safetensors metadata."""
-    url = _HF_API_MODEL_URL.format(model_id=hf_model_id)
-    try:
-        resp = requests.get(url, params={"expand": ["safetensors"]}, timeout=timeout)
-    except requests.RequestException as exc:
-        raise ModelVramLookupError(
-            f"HF Hub API request failed for {hf_model_id!r}: {exc}"
-        ) from exc
-
-    if resp.status_code != 200:
-        raise ModelVramLookupError(
-            f"HF Hub API returned {resp.status_code} for {hf_model_id!r}"
-        )
-
-    data = resp.json()
-    total = (data.get("safetensors") or {}).get("total")
-    if not total:
-        raise ModelVramLookupError(
-            f"{hf_model_id!r} has no safetensors parameter metadata on the HF Hub "
-            "(model may not publish safetensors weights)"
-        )
-    return float(total)
-
-
-def _fetch_arch_config(hf_model_id: str, *, timeout: float) -> dict:
-    """Return the model's config.json (architecture fields used for KV cache sizing)."""
-    url = _HF_CONFIG_URL.format(model_id=hf_model_id)
-    try:
-        resp = requests.get(url, timeout=timeout)
-    except requests.RequestException as exc:
-        raise ModelVramLookupError(
-            f"config.json fetch failed for {hf_model_id!r}: {exc}"
-        ) from exc
-
-    if resp.status_code != 200:
-        raise ModelVramLookupError(
-            f"config.json unavailable for {hf_model_id!r} (HTTP {resp.status_code})"
-        )
-    return resp.json()
-
-
-def _kv_cache_gb(config: dict, ctx_len: int) -> float:
-    """Estimate KV cache size in GB from architecture fields, 0.0 if unavailable."""
-    num_layers = config.get("num_hidden_layers")
-    hidden_size = config.get("hidden_size")
-    num_heads = config.get("num_attention_heads")
-    num_kv_heads = config.get("num_key_value_heads", num_heads)
-
-    if not (num_layers and hidden_size and num_heads):
-        # Non-standard config (missing architecture fields) — skip the KV
-        # estimate rather than fail the whole call. Weights dominate VRAM use.
-        return 0.0
-
-    head_dim = hidden_size / num_heads
-    bytes_total = 2 * num_layers * num_kv_heads * head_dim * ctx_len * _KV_CACHE_DTYPE_BYTES
-    return bytes_total / 1e9
-
-
-def model_vram_estimate(
-    hf_model_id: str,
-    quant_level: str,
-    *,
-    ctx_len: int = 4096,
-    available_vram_mb: int | None = None,
-    overhead_gb: float = _DEFAULT_OVERHEAD_GB,
-    timeout: float = 10.0,
-) -> VramEstimate:
-    """
-    Estimate VRAM required to run `hf_model_id` at `quant_level`.
-
-    Args:
-        hf_model_id: HuggingFace model repo ID, e.g. "Qwen/Qwen2.5-7B-Instruct".
-        quant_level: One of the known quant levels (see `_QUANT_BITS`), e.g. "q4_k_m".
-        ctx_len: Context length used for KV cache sizing.
-        available_vram_mb: If given, populates `VramEstimate.fits`.
-        overhead_gb: Fixed overhead for CUDA context / activation buffers.
-        timeout: Per-request timeout in seconds for HF Hub API calls.
-
-    Raises:
-        ModelVramLookupError: HF Hub API request failed or returned unusable data.
-        ValueError: `quant_level` isn't a recognized quantization level.
-    """
-    bits = _quant_bits(quant_level)
-    params = _fetch_param_count(hf_model_id, timeout=timeout)
-    weights_gb = (params * bits / 8) / 1e9
-
-    try:
-        config = _fetch_arch_config(hf_model_id, timeout=timeout)
-        kv_gb = _kv_cache_gb(config, ctx_len)
-    except ModelVramLookupError:
-        # Architecture lookup is best-effort — weights_gb alone is still useful.
-        kv_gb = 0.0
-
-    total_gb = weights_gb + kv_gb + overhead_gb
-
-    fits = None
-    if available_vram_mb is not None:
-        fits = total_gb <= (available_vram_mb / 1024)
-
-    return VramEstimate(
-        hf_model_id=hf_model_id,
-        quant_level=quant_level,
-        params_billions=params / 1e9,
-        weights_gb=weights_gb,
-        kv_cache_gb=kv_gb,
-        overhead_gb=overhead_gb,
-        total_vram_gb=total_gb,
-        fits=fits,
-    )
--- a/circuitforge_core/input/gestures/init.py
+++ b/circuitforge_core/input/gestures/init.py
@ -1,15 +0,0 @@
-"""
-cf_input.gestures — camera capture, hand detection, landmark normalization.
-
-Public API:
-    CameraCapture      — OpenCV frame source
-    HandsDetector      — MediaPipe Hands wrapper
-    HandLandmarks      — immutable detected hand dataclass
-    normalize_hand()   — scale/translation-invariant feature vector
-"""
-
-from circuitforge_core.input.gestures.camera import CameraCapture
-from circuitforge_core.input.gestures.hands import HandLandmarks, HandsDetector
-from circuitforge_core.input.gestures.normalizer import normalize_hand
-
-__all__ = ["CameraCapture", "HandLandmarks", "HandsDetector", "normalize_hand"]
--- a/circuitforge_core/input/gestures/camera.py
+++ b/circuitforge_core/input/gestures/camera.py
@ -1,57 +0,0 @@
-"""
-OpenCV camera capture — context manager wrapping VideoCapture.
-
-Yields BGR frames. Callers convert to RGB before passing to HandsDetector:
-    frame_rgb = frame_bgr[:, :, ::-1]
-"""
-
-from __future__ import annotations
-
-from typing import Iterator
-
-import cv2
-import numpy as np
-
-
-class CameraCapture:
-    """
-    Thin wrapper around cv2.VideoCapture.
-
-    Usage:
-        with CameraCapture(device_index=0) as cam:
-            for frame_bgr in cam.frames():
-                process(frame_bgr)
-    """
-
-    def __init__(
-        self,
-        device_index: int = 0,
-        width: int = 640,
-        height: int = 480,
-        fps: int = 30,
-    ) -> None:
-        self._cap = cv2.VideoCapture(device_index)
-        self._cap.set(cv2.CAP_PROP_FRAME_WIDTH, width)
-        self._cap.set(cv2.CAP_PROP_FRAME_HEIGHT, height)
-        self._cap.set(cv2.CAP_PROP_FPS, fps)
-
-    @property
-    def is_open(self) -> bool:
-        return self._cap.isOpened()
-
-    def frames(self) -> Iterator[np.ndarray]:
-        """Yield BGR uint8 frames until camera fails or caller breaks."""
-        while self._cap.isOpened():
-            ok, frame = self._cap.read()
-            if not ok:
-                break
-            yield frame
-
-    def release(self) -> None:
-        self._cap.release()
-
-    def __enter__(self) -> CameraCapture:
-        return self
-
-    def __exit__(self, *_: object) -> None:
-        self.release()
--- a/circuitforge_core/input/gestures/hands.py
+++ b/circuitforge_core/input/gestures/hands.py
@ -1,91 +0,0 @@
-"""
-MediaPipe Hands wrapper.
-
-Produces immutable HandLandmarks dataclasses from RGB video frames.
-The caller is responsible for BGR→RGB conversion before passing frames.
-"""
-
-from __future__ import annotations
-
-from dataclasses import dataclass
-
-import mediapipe as mp
-import numpy as np
-
-
-@dataclass(frozen=True)
-class HandLandmarks:
-    """Immutable snapshot of one detected hand."""
-
-    points: np.ndarray  # shape (21, 3) — x, y, z in [0,1] normalized image space
-    handedness: str  # 'Left' | 'Right' (mirror of physical hand)
-    confidence: float  # [0.0, 1.0]
-
-
-class HandsDetector:
-    """
-    Thin wrapper around mediapipe.solutions.hands.Hands.
-
-    Usage:
-        detector = HandsDetector()
-        for frame_bgr in camera.frames():
-            frame_rgb = frame_bgr[:, :, ::-1]
-            hands = detector.detect(frame_rgb)
-            for hand in hands:
-                vec = normalize_hand(hand.points)
-                ...
-        detector.close()
-
-    Or use as a context manager:
-        with HandsDetector() as detector:
-            ...
-    """
-
-    def __init__(
-        self,
-        max_hands: int = 2,
-        min_detection_confidence: float = 0.7,
-        min_tracking_confidence: float = 0.5,
-    ) -> None:
-        self._hands = mp.solutions.hands.Hands(
-            static_image_mode=False,
-            max_num_hands=max_hands,
-            min_detection_confidence=min_detection_confidence,
-            min_tracking_confidence=min_tracking_confidence,
-        )
-
-    def detect(self, rgb_frame: np.ndarray) -> list[HandLandmarks]:
-        """
-        Run hand detection on one RGB frame.
-
-        Args:
-            rgb_frame: (H, W, 3) uint8 RGB image.
-
-        Returns:
-            List of HandLandmarks, one per detected hand (up to max_hands).
-            Empty list if no hands detected.
-        """
-        results = self._hands.process(rgb_frame)
-        if not results.multi_hand_landmarks:
-            return []
-        out: list[HandLandmarks] = []
-        for lm, hand in zip(results.multi_hand_landmarks, results.multi_handedness):
-            points = np.array([[p.x, p.y, p.z] for p in lm.landmark], dtype=np.float32)
-            points.flags.writeable = False  # enforce immutability of stored array
-            out.append(
-                HandLandmarks(
-                    points=points,
-                    handedness=hand.classification[0].label,
-                    confidence=float(hand.classification[0].score),
-                )
-            )
-        return out
-
-    def close(self) -> None:
-        self._hands.close()
-
-    def __enter__(self) -> HandsDetector:
-        return self
-
-    def __exit__(self, *_: object) -> None:
-        self.close()
--- a/circuitforge_core/input/gestures/normalizer.py
+++ b/circuitforge_core/input/gestures/normalizer.py
@ -1,33 +0,0 @@
-"""
-Landmark normalization for MediaPipe hand landmarks.
-
-Converts raw (21, 3) landmark array into a 63-element translation- and
-scale-invariant feature vector suitable for gesture classifiers.
-"""
-
-import numpy as np
-
-
-def normalize_hand(points: np.ndarray) -> np.ndarray:
-    """
-    Normalize 21 MediaPipe hand landmarks into a scale/translation-invariant
-    63-element feature vector.
-
-    Steps:
-        1. Translate so wrist (landmark 0) is at origin.
-        2. Scale so distance from wrist to middle-finger MCP (landmark 9) = 1.0.
-           If that distance is near-zero (degenerate hand), return zeros.
-        3. Flatten to shape (63,).
-
-    Args:
-        points: (21, 3) float32 array — raw MediaPipe landmark coords.
-
-    Returns:
-        (63,) float32 feature vector.
-    """
-    pts = points.astype(np.float32).copy()
-    pts -= pts[0]  # translate: wrist → origin
-    scale = float(np.linalg.norm(pts[9]))  # wrist-to-middle-MCP distance
-    if scale > 1e-6:
-        pts /= scale
-    return pts.flatten()
--- a/circuitforge_core/job_quality/init.py
+++ b/circuitforge_core/job_quality/init.py
@ -1,23 +0,0 @@
-"""
-circuitforge_core.job_quality — deterministic trust scorer for job listings.
-
-MIT licensed.
-"""
-
-from circuitforge_core.job_quality.models import (
-    JobEnrichment,
-    JobListing,
-    JobQualityScore,
-    SignalResult,
-)
-from circuitforge_core.job_quality.scorer import score_job
-from circuitforge_core.job_quality.signals import ALL_SIGNALS
-
-__all__ = [
-    "JobEnrichment",
-    "JobListing",
-    "JobQualityScore",
-    "SignalResult",
-    "score_job",
-    "ALL_SIGNALS",
-]
--- a/circuitforge_core/job_quality/models.py
+++ b/circuitforge_core/job_quality/models.py
@ -1,70 +0,0 @@
-"""
-Pydantic models for the job_quality trust scorer.
-
-MIT licensed — no LLM calls, no network calls, no file I/O.
-"""
-
-from __future__ import annotations
-
-from datetime import datetime
-from typing import Any
-
-from pydantic import BaseModel, Field
-
-
-class JobListing(BaseModel):
-    """Input data sourced directly from a job board scraper or ATS export."""
-
-    # Core identity
-    title: str = ""
-    company: str = ""
-    location: str = ""
-    state_code: str = ""  # Two-letter US state code, e.g. "CA"
-
-    # Salary / compensation
-    salary_min: float | None = None
-    salary_max: float | None = None
-    salary_text: str = ""  # Raw salary string from the listing
-
-    # Posting metadata
-    posted_at: datetime | None = None
-    repost_count: int = 0  # Times the same listing has been reposted
-    applicant_count: int | None = None
-    is_staffing_agency: bool = False
-    is_always_open: bool = False  # Evergreen/always-accepting flag
-
-    # Content
-    description: str = ""
-    requirements: list[str] = Field(default_factory=list)
-    ats_url: str = ""  # ATS apply URL (Greenhouse, Lever, Workday, etc.)
-
-    # Signals from scraper enrichment
-    weekend_posted: bool = False  # Posted on Saturday or Sunday
-
-
-class JobEnrichment(BaseModel):
-    """Optional enrichment data gathered outside the listing (news, history, etc.)."""
-
-    has_layoff_news: bool = False  # Recent layoff news for this company
-    avg_response_days: float | None = None  # Average recruiter response time (days)
-    no_response_rate: float | None = None  # Fraction of applicants with no response (0–1)
-
-
-class SignalResult(BaseModel):
-    """Output of a single signal function."""
-
-    name: str
-    triggered: bool
-    weight: float
-    penalty: float  # weight * triggered (0.0 when not triggered)
-    detail: str = ""  # Human-readable explanation
-
-
-class JobQualityScore(BaseModel):
-    """Aggregated trust score for a job listing."""
-
-    trust_score: float  # 0.0 (low trust) – 1.0 (high trust)
-    confidence: float  # 0.0 – 1.0: fraction of signals with available evidence
-    signals: list[SignalResult]
-    raw_penalty: float  # Sum of triggered weights before clamping
-    metadata: dict[str, Any] = Field(default_factory=dict)
--- a/circuitforge_core/job_quality/scorer.py
+++ b/circuitforge_core/job_quality/scorer.py
@@ -1,60 +0,0 @@
-"""
-score_job: aggregate all signals into a JobQualityScore.
-
-MIT licensed — pure function, no I/O.
-"""
-
-from __future__ import annotations
-
-from circuitforge_core.job_quality.models import JobEnrichment, JobListing, JobQualityScore, SignalResult
-from circuitforge_core.job_quality.signals import ALL_SIGNALS
-
-
-def score_job(
-    listing: JobListing,
-    enrichment: JobEnrichment | None = None,
-) -> JobQualityScore:
-    """
-    Score a job listing for trust/quality.
-
-    Each signal produces a penalty in [0, weight].  The raw penalty is the sum of
-    all triggered signal weights.  trust_score = 1 - clamp(raw_penalty, 0, 1).
-
-    confidence reflects what fraction of signals had enough data to evaluate.
-    Signals that return triggered=False with a "not available" detail are counted
-    as unevaluable — they reduce confidence without adding penalty.
-    """
-    results: list[SignalResult] = []
-    evaluable_count = 0
-
-    for fn in ALL_SIGNALS:
-        result = fn(listing, enrichment)
-        results.append(result)
-        # A signal is evaluable when it either triggered or had data to decide it didn't.
-        # Signals that skip due to missing data always set triggered=False AND include
-        # "not available" or "No" in their detail.
-        if result.triggered or _has_data(result):
-            evaluable_count += 1
-
-    raw_penalty = sum(r.penalty for r in results)
-    trust_score = max(0.0, min(1.0, 1.0 - raw_penalty))
-    confidence = evaluable_count / len(ALL_SIGNALS) if ALL_SIGNALS else 0.0
-
-    return JobQualityScore(
-        trust_score=round(trust_score, 4),
-        confidence=round(confidence, 4),
-        signals=results,
-        raw_penalty=round(raw_penalty, 4),
-    )
-
-
-def _has_data(result: SignalResult) -> bool:
-    """Return True when the signal's detail indicates it actually evaluated data."""
-    skip_phrases = (
-        "not available",
-        "No enrichment",
-        "No posted_at",
-        "No response rate",
-        "No salary information",
-    )
-    return not any(phrase.lower() in result.detail.lower() for phrase in skip_phrases)
--- a/circuitforge_core/job_quality/signals.py
+++ b/circuitforge_core/job_quality/signals.py
@@ -1,275 +0,0 @@
-"""
-Individual signal functions for the job_quality trust scorer.
-
-Each function takes a JobListing and optional JobEnrichment and returns a SignalResult.
-All signals are pure functions: no I/O, no LLM calls, no side effects.
-
-MIT licensed.
-"""
-
-from __future__ import annotations
-
-from datetime import datetime, timezone
-
-from circuitforge_core.job_quality.models import JobEnrichment, JobListing, SignalResult
-
-# US states with salary transparency laws (as of 2026)
-_SALARY_TRANSPARENCY_STATES = {"CO", "CA", "NY", "WA", "IL", "MA"}
-
-# ATS providers whose apply URLs are commonly associated with high ghosting rates
-_GHOSTING_ATS_PATTERNS = ("lever.co", "greenhouse.io", "workday.com", "icims.com", "taleo.net")
-
-# Threshold for "always open" detection: repost every N days for M months
-_ALWAYS_OPEN_REPOST_THRESHOLD = 3
-
-# Requirement count above which a listing is considered overloaded
-_REQUIREMENT_OVERLOAD_COUNT = 12
-
-# Vagueness: description length below this suggests bare-minimum content
-_VAGUE_DESCRIPTION_CHARS = 400
-
-# Applicant count above which competition is considered very high
-_HIGH_APPLICANT_THRESHOLD = 200
-
-# Listing age above which staleness is likely
-_STALE_DAYS = 30
-
-# Response rate above which the role is considered a high-ghosting source
-_NO_RESPONSE_RATE_THRESHOLD = 0.60
-
-
-def _now() -> datetime:
-    return datetime.now(tz=timezone.utc)
-
-
-# ---------------------------------------------------------------------------
-# High-weight signals (0.15 – 0.25)
-# ---------------------------------------------------------------------------
-
-
-def listing_age(listing: JobListing, _: JobEnrichment | None = None) -> SignalResult:
-    """Listing older than 30 days is likely stale or already filled."""
-    weight = 0.25
-    if listing.posted_at is None:
-        return SignalResult(name="listing_age", triggered=False, weight=weight, penalty=0.0,
-                            detail="No posted_at date available.")
-    age_days = (_now() - listing.posted_at.astimezone(timezone.utc)).days
-    triggered = age_days > _STALE_DAYS
-    return SignalResult(
-        name="listing_age",
-        triggered=triggered,
-        weight=weight,
-        penalty=weight if triggered else 0.0,
-        detail=f"Listing is {age_days} days old (threshold: {_STALE_DAYS}).",
-    )
-
-
-def repost_detected(listing: JobListing, _: JobEnrichment | None = None) -> SignalResult:
-    """Listing has been reposted multiple times — a strong ghost-job indicator."""
-    weight = 0.25
-    triggered = listing.repost_count >= _ALWAYS_OPEN_REPOST_THRESHOLD
-    return SignalResult(
-        name="repost_detected",
-        triggered=triggered,
-        weight=weight,
-        penalty=weight if triggered else 0.0,
-        detail=f"Repost count: {listing.repost_count} (threshold: {_ALWAYS_OPEN_REPOST_THRESHOLD}).",
-    )
-
-
-def no_salary_transparency(listing: JobListing, _: JobEnrichment | None = None) -> SignalResult:
-    """No salary info despite being in a transparency-law state, or generally absent."""
-    weight = 0.20
-    has_range = listing.salary_min is not None or listing.salary_max is not None
-    has_text = bool(listing.salary_text.strip())
-    has_salary = has_range or has_text
-    in_transparency_state = listing.state_code.upper() in _SALARY_TRANSPARENCY_STATES
-
-    if not has_salary:
-        if in_transparency_state:
-            detail = (f"No salary disclosed despite {listing.state_code} transparency law. "
-                      "Possible compliance violation.")
-        else:
-            detail = "No salary information provided."
-        triggered = True
-    else:
-        triggered = False
-        detail = "Salary information present."
-
-    return SignalResult(
-        name="no_salary_transparency",
-        triggered=triggered,
-        weight=weight,
-        penalty=weight if triggered else 0.0,
-        detail=detail,
-    )
-
-
-def always_open_pattern(listing: JobListing, _: JobEnrichment | None = None) -> SignalResult:
-    """Listing is flagged as always-accepting or evergreen — pipeline filler."""
-    weight = 0.20
-    triggered = listing.is_always_open
-    return SignalResult(
-        name="always_open_pattern",
-        triggered=triggered,
-        weight=weight,
-        penalty=weight if triggered else 0.0,
-        detail="Listing marked as always-open/evergreen." if triggered else "Not always-open.",
-    )
-
-
-def staffing_agency(listing: JobListing, _: JobEnrichment | None = None) -> SignalResult:
-    """Posted by a staffing or recruiting agency rather than the hiring company directly."""
-    weight = 0.15
-    triggered = listing.is_staffing_agency
-    return SignalResult(
-        name="staffing_agency",
-        triggered=triggered,
-        weight=weight,
-        penalty=weight if triggered else 0.0,
-        detail="Listed by a staffing/recruiting agency." if triggered else "Direct employer listing.",
-    )
-
-
-# ---------------------------------------------------------------------------
-# Medium-weight signals (0.08 – 0.12)
-# ---------------------------------------------------------------------------
-
-
-def requirement_overload(listing: JobListing, _: JobEnrichment | None = None) -> SignalResult:
-    """Excessive requirements list suggests a wish-list role or perpetual search."""
-    weight = 0.12
-    count = len(listing.requirements)
-    triggered = count > _REQUIREMENT_OVERLOAD_COUNT
-    return SignalResult(
-        name="requirement_overload",
-        triggered=triggered,
-        weight=weight,
-        penalty=weight if triggered else 0.0,
-        detail=f"{count} requirements listed (threshold: {_REQUIREMENT_OVERLOAD_COUNT}).",
-    )
-
-
-def layoff_news(listing: JobListing, enrichment: JobEnrichment | None = None) -> SignalResult:
-    """Company has recent layoff news — new hires may be at high risk."""
-    weight = 0.12
-    if enrichment is None:
-        return SignalResult(name="layoff_news", triggered=False, weight=weight, penalty=0.0,
-                            detail="No enrichment data available.")
-    triggered = enrichment.has_layoff_news
-    return SignalResult(
-        name="layoff_news",
-        triggered=triggered,
-        weight=weight,
-        penalty=weight if triggered else 0.0,
-        detail="Recent layoff news detected for this company." if triggered else "No layoff news found.",
-    )
-
-
-def jd_vagueness(listing: JobListing, _: JobEnrichment | None = None) -> SignalResult:
-    """Job description is suspiciously short — may not represent a real open role."""
-    weight = 0.10
-    char_count = len(listing.description.strip())
-    triggered = char_count < _VAGUE_DESCRIPTION_CHARS
-    return SignalResult(
-        name="jd_vagueness",
-        triggered=triggered,
-        weight=weight,
-        penalty=weight if triggered else 0.0,
-        detail=f"Description is {char_count} characters (threshold: {_VAGUE_DESCRIPTION_CHARS}).",
-    )
-
-
-def ats_blackhole(listing: JobListing, _: JobEnrichment | None = None) -> SignalResult:
-    """Apply URL routes through a high-volume ATS known for candidate ghosting."""
-    weight = 0.10
-    url_lower = listing.ats_url.lower()
-    matched = next((p for p in _GHOSTING_ATS_PATTERNS if p in url_lower), None)
-    triggered = matched is not None
-    return SignalResult(
-        name="ats_blackhole",
-        triggered=triggered,
-        weight=weight,
-        penalty=weight if triggered else 0.0,
-        detail=f"ATS matches high-ghosting pattern '{matched}'." if triggered else "No high-ghosting ATS detected.",
-    )
-
-
-def high_applicant_count(listing: JobListing, _: JobEnrichment | None = None) -> SignalResult:
-    """Very high applicant count means low odds and possible ghost-collection."""
-    weight = 0.08
-    if listing.applicant_count is None:
-        return SignalResult(name="high_applicant_count", triggered=False, weight=weight, penalty=0.0,
-                            detail="Applicant count not available.")
-    triggered = listing.applicant_count > _HIGH_APPLICANT_THRESHOLD
-    return SignalResult(
-        name="high_applicant_count",
-        triggered=triggered,
-        weight=weight,
-        penalty=weight if triggered else 0.0,
-        detail=f"{listing.applicant_count} applicants (threshold: {_HIGH_APPLICANT_THRESHOLD}).",
-    )
-
-
-# ---------------------------------------------------------------------------
-# Low-weight signals (0.04 – 0.08)
-# ---------------------------------------------------------------------------
-
-
-def weekend_posted(listing: JobListing, _: JobEnrichment | None = None) -> SignalResult:
-    """Posted on a weekend — may indicate bulk/automated ghost-job pipeline posting."""
-    weight = 0.04
-    if listing.posted_at is None and not listing.weekend_posted:
-        return SignalResult(name="weekend_posted", triggered=False, weight=weight, penalty=0.0,
-                            detail="No posted_at date available.")
-    if listing.weekend_posted:
-        triggered = True
-    else:
-        triggered = listing.posted_at.weekday() >= 5  # type: ignore[union-attr]
-    return SignalResult(
-        name="weekend_posted",
-        triggered=triggered,
-        weight=weight,
-        penalty=weight if triggered else 0.0,
-        detail="Posted on a weekend." if triggered else "Posted on a weekday.",
-    )
-
-
-def poor_response_history(listing: JobListing, enrichment: JobEnrichment | None = None) -> SignalResult:
-    """Company/ATS historically does not respond to applicants."""
-    weight = 0.08
-    if enrichment is None:
-        return SignalResult(name="poor_response_history", triggered=False, weight=weight, penalty=0.0,
-                            detail="No enrichment data available.")
-    rate = enrichment.no_response_rate
-    if rate is None:
-        return SignalResult(name="poor_response_history", triggered=False, weight=weight, penalty=0.0,
-                            detail="No response rate data available.")
-    triggered = rate > _NO_RESPONSE_RATE_THRESHOLD
-    return SignalResult(
-        name="poor_response_history",
-        triggered=triggered,
-        weight=weight,
-        penalty=weight if triggered else 0.0,
-        detail=f"No-response rate: {rate:.0%} (threshold: {_NO_RESPONSE_RATE_THRESHOLD:.0%}).",
-    )
-
-
-# ---------------------------------------------------------------------------
-# Signal registry — ordered by weight descending for scorer iteration
-# ---------------------------------------------------------------------------
-
-ALL_SIGNALS = [
-    listing_age,
-    repost_detected,
-    no_salary_transparency,
-    always_open_pattern,
-    staffing_agency,
-    requirement_overload,
-    layoff_news,
-    jd_vagueness,
-    ats_blackhole,
-    high_applicant_count,
-    weekend_posted,
-    poor_response_history,
-]
--- a/circuitforge_core/llm/router.py
+++ b/circuitforge_core/llm/router.py
@@ -1,143 +1,26 @@
 """
 LLM abstraction layer with priority fallback chain.
-
-Reads config from ~/.config/circuitforge/llm.yaml (or the path passed to
-LLMRouter.__init__). Tries backends in fallback_order; skips unreachable or
-disabled entries and falls back to the next until one succeeds.
-
-## Backend types
-
-**openai_compat** — OpenAI-compatible /v1/chat/completions endpoint.
-  Used for: Ollama, vLLM, GitHub Copilot wrapper, Claude Code wrapper,
-  and the cf-orch trunk services (cf-text, cf-voice).
-
-  With a cf_orch block the router first allocates via cf-orch, which
-  starts the service on-demand and returns its URL. Without cf_orch the
-  router does a static reachability check against base_url.
-
-**anthropic** — Direct Anthropic API via the anthropic SDK.
-
-**vision_service** — cf-vision managed service (moondream2 / SigLIP).
-  Posts to /analyze; only used when images= is provided to complete().
-  Supports cf_orch allocation to start cf-vision on-demand.
-
-## Trunk services (The Orchard architecture)
-
-These services live in cf-orch as branches; cf-core wires them as backends.
-Products declare them in llm.yaml using the openai_compat type plus a
-cf_orch block — the router handles allocation and URL injection transparently.
-
-  cf-text   — Local transformer inference (/v1/chat/completions, port 8008).
-               Default model set by default_model in the node's service
-               profile; override via model_candidates in the cf_orch block.
-
-  cf-voice  — STT/TTS pipeline endpoint (/v1/chat/completions, port 8009).
-               Same allocation pattern as cf-text.
-
-  cf-vision — Vision inference (moondream2 / SigLIP), vision_service type.
-               Used via the vision_fallback_order when images are present.
-
-## Config auto-detection (no llm.yaml)
-
-When llm.yaml is absent, the router builds a minimal config from environment
-variables: ANTHROPIC_API_KEY, OPENAI_API_KEY / OPENAI_BASE_URL, OLLAMA_HOST.
-Ollama on localhost:11434 is always included as the lowest-cost local fallback.
+Reads config from ~/.config/circuitforge/llm.yaml.
+Tries backends in order; falls back on any error.
 """
-
-import logging
 import os
 import yaml
 import requests
 from pathlib import Path
 from openai import OpenAI

-logger = logging.getLogger(__name__)
-
 CONFIG_PATH = Path.home() / ".config" / "circuitforge" / "llm.yaml"


 class LLMRouter:
-    def __init__(self, config_path: Path | dict = CONFIG_PATH):
-        self._ollama_tags_cache: dict[str, set[str]] = {}
-        if isinstance(config_path, dict):
-            self.config = config_path
-        elif config_path.exists():
-            with open(config_path) as f:
-                self.config = yaml.safe_load(f)
-        else:
-            env_config = self._auto_config_from_env()
-            if env_config is None:
-                raise FileNotFoundError(
-                    f"{config_path} not found and no LLM env vars detected. "
-                    "Either copy llm.yaml.example to ~/.config/circuitforge/llm.yaml, "
-                    "or set ANTHROPIC_API_KEY, OPENAI_API_KEY, or OLLAMA_HOST."
-                )
-            logger.info(
-                "[LLMRouter] No llm.yaml found — using env-var auto-config "
-                "(backends: %s)",
-                ", ".join(env_config["fallback_order"]),
+    def __init__(self, config_path: Path = CONFIG_PATH):
+        if not config_path.exists():
+            raise FileNotFoundError(
+                f"{config_path} not found. "
+                "Copy the llm.yaml.example to ~/.config/circuitforge/llm.yaml and configure your LLM backends."
            )
-            self.config = env_config
-
-    @staticmethod
-    def _auto_config_from_env() -> dict | None:
-        """Build a minimal LLM config from well-known environment variables.
-
-        Priority order (highest to lowest):
-          1. ANTHROPIC_API_KEY  → anthropic backend
-          2. OPENAI_API_KEY     → openai-compat → api.openai.com (or OPENAI_BASE_URL)
-          3. OLLAMA_HOST        → openai-compat → local Ollama (always included as last resort)
-
-        Returns None only when none of these are set and Ollama is not configured,
-        so the caller can decide whether to raise or surface a user-facing message.
-        """
-        backends: dict = {}
-        fallback_order: list[str] = []
-
-        if os.environ.get("ANTHROPIC_API_KEY"):
-            backends["anthropic"] = {
-                "type": "anthropic",
-                "enabled": True,
-                "model": os.environ.get("ANTHROPIC_MODEL", "claude-haiku-4-5-20251001"),
-                "api_key_env": "ANTHROPIC_API_KEY",
-                "supports_images": True,
-            }
-            fallback_order.append("anthropic")
-
-        if os.environ.get("OPENAI_API_KEY"):
-            backends["openai"] = {
-                "type": "openai_compat",
-                "enabled": True,
-                "base_url": os.environ.get(
-                    "OPENAI_BASE_URL", "https://api.openai.com/v1"
-                ),
-                "model": os.environ.get("OPENAI_MODEL", "gpt-4o-mini"),
-                "api_key": os.environ.get("OPENAI_API_KEY"),
-                "supports_images": True,
-            }
-            fallback_order.append("openai")
-
-        # Ollama — always added when any config exists, as the lowest-cost local fallback.
-        # Unreachable Ollama is harmless — _is_reachable() skips it gracefully.
-        ollama_host = os.environ.get("OLLAMA_HOST", "http://localhost:11434")
-        if not ollama_host.startswith("http"):
-            ollama_host = f"http://{ollama_host}"
-        backends["ollama"] = {
-            "type": "openai_compat",
-            "enabled": True,
-            "base_url": ollama_host.rstrip("/") + "/v1",
-            "model": os.environ.get("OLLAMA_MODEL", "llama3.2:3b"),
-            "api_key": "any",
-            "supports_images": False,
-        }
-        fallback_order.append("ollama")
-
-        # Return None if only ollama is in the list AND no explicit host was set —
-        # that means the user set nothing at all, not even OLLAMA_HOST.
-        if fallback_order == ["ollama"] and "OLLAMA_HOST" not in os.environ:
-            return None
-
-        return {"backends": backends, "fallback_order": fallback_order}
+        with open(config_path) as f:
+            self.config = yaml.safe_load(f)

    def _is_reachable(self, base_url: str) -> bool:
        """Quick health-check ping. Returns True if backend is up."""
@@ -148,37 +31,6 @@ class LLMRouter:
        except Exception:
            return False

-    def _check_ollama_model_pulled(self, base_url: str, model: str) -> None:
-        """Raise RuntimeError with actionable message if model is not pulled in Ollama.
-
-        Silently skips the check if the /api/tags endpoint is unavailable (e.g. vLLM).
-        Results are cached per base_url for the lifetime of this router instance.
-        """
-        tags_url = base_url.rstrip("/").removesuffix("/v1") + "/api/tags"
-        if not hasattr(self, "_ollama_tags_cache"):
-            self._ollama_tags_cache = {}
-        if base_url not in self._ollama_tags_cache:
-            try:
-                resp = requests.get(tags_url, timeout=3)
-                if resp.status_code != 200:
-                    return
-                pulled = {
-                    m["name"].split(":")[0]
-                    for m in resp.json().get("models", [])
-                }
-                self._ollama_tags_cache[base_url] = pulled
-            except Exception:
-                return  # can't verify — let the actual embed call fail naturally
-        pulled_models = self._ollama_tags_cache.get(base_url)
-        if pulled_models is None:
-            return
-        model_base = model.split(":")[0]
-        if model_base not in pulled_models:
-            raise RuntimeError(
-                f'Ollama embedding model "{model}" is not pulled.\n'
-                f"Fix: ollama pull {model}"
-            )
-
    def _resolve_model(self, client: OpenAI, model: str) -> str:
        """Resolve __auto__ to the first model served by vLLM."""
        if model != "__auto__":
@@ -186,71 +38,11 @@ class LLMRouter:
        models = client.models.list()
        return models.data[0].id

-    def _try_cf_orch_alloc(self, backend: dict) -> "tuple | None":
-        """
-        If backend config has a cf_orch block and CF_ORCH_URL is set (env takes
-        precedence over yaml url), allocate via cf-orch and return (ctx, alloc).
-
-        Two allocation modes:
-        - task-based (preferred): cf_orch block has `product` + `task` keys.
-          Calls POST /api/inference/task; coordinator resolves model/node from
-          assignments.yaml. No hardcoded model IDs in product config.
-        - service-based (legacy): cf_orch block has `service` key.
-          Calls allocate(service=...) directly.
-
-        Returns None if not configured or allocation fails.
-        Caller MUST call ctx.__exit__(None, None, None) in a finally block.
-        """
-        import os
-
-        orch_cfg = backend.get("cf_orch")
-        if not orch_cfg:
-            return None
-        orch_url = os.environ.get("CF_ORCH_URL", orch_cfg.get("url", ""))
-        if not orch_url:
-            return None
-        try:
-            from circuitforge_orch.client import CFOrchClient
-
-            client = CFOrchClient(orch_url)
-            ttl_s = float(orch_cfg.get("ttl_s", 3600.0))
-
-            # Task-based allocation: product+task → coordinator resolves model/node.
-            task = orch_cfg.get("task")
-            product = orch_cfg.get("product") or os.environ.get("CF_APP_NAME") or None
-            if task and product:
-                ctx = client.task_allocate(product, task, ttl_s=ttl_s)
-                alloc = ctx.__enter__()
-                return (ctx, alloc)
-
-            # Service-based allocation (legacy path).
-            cf_app = os.environ.get("CF_APP_NAME") or None
-            caller = f"{cf_app}.llm-router" if cf_app else "llm-router"
-            ctx = client.allocate(
-                orch_cfg.get("service", "vllm"),
-                model_candidates=orch_cfg.get("model_candidates", []),
-                ttl_s=ttl_s,
-                caller=caller,
-                pipeline=cf_app,
-            )
-            alloc = ctx.__enter__()
-            return (ctx, alloc)
-        except Exception as exc:
-            logger.warning(
-                "[LLMRouter] cf_orch allocation failed, using base_url directly: %s",
-                exc,
-            )
-            return None
-
-    def complete(
-        self,
-        prompt: str,
-        system: str | None = None,
-        model_override: str | None = None,
-        fallback_order: list[str] | None = None,
-        images: list[str] | None = None,
-        max_tokens: int | None = None,
-    ) -> str:
+    def complete(self, prompt: str, system: str | None = None,
+                 model_override: str | None = None,
+                 fallback_order: list[str] | None = None,
+                 images: list[str] | None = None,
+                 max_tokens: int | None = None) -> str:
        """
        Generate a completion. Tries each backend in fallback_order.

@@ -268,11 +60,7 @@ class LLMRouter:
                "AI inference is disabled in the public demo. "
                "Run your own instance to use AI features."
            )
-        order = (
-            fallback_order
-            if fallback_order is not None
-            else self.config["fallback_order"]
-        )
+        order = fallback_order if fallback_order is not None else self.config["fallback_order"]
        for name in order:
            backend = self.config["backends"][name]

@@ -294,14 +82,7 @@ class LLMRouter:
                continue

            if is_vision_service:
-                # cf_orch: try allocation first (same pattern as openai_compat).
-                # Allocation can start the vision service on-demand on the cluster.
-                orch_ctx = orch_alloc = None
-                orch_result = self._try_cf_orch_alloc(backend)
-                if orch_result is not None:
-                    orch_ctx, orch_alloc = orch_result
-                    backend = {**backend, "base_url": orch_alloc.url}
-                elif not self._is_reachable(backend["base_url"]):
+                if not self._is_reachable(backend["base_url"]):
                    print(f"[LLMRouter] {name}: unreachable, skipping")
                    continue
                try:
@@ -319,21 +100,9 @@ class LLMRouter:
                except Exception as e:
                    print(f"[LLMRouter] {name}: error — {e}, trying next")
                    continue
-                finally:
-                    if orch_ctx is not None:
-                        orch_ctx.__exit__(None, None, None)

            elif backend["type"] == "openai_compat":
-                # cf_orch: try allocation first — this may start the service on-demand.
-                # Do NOT reachability-check before allocating; the service may be stopped
-                # and the allocation is what starts it.
-                orch_ctx = orch_alloc = None
-                orch_result = self._try_cf_orch_alloc(backend)
-                if orch_result is not None:
-                    orch_ctx, orch_alloc = orch_result
-                    backend = {**backend, "base_url": orch_alloc.url + "/v1"}
-                elif not self._is_reachable(backend["base_url"]):
-                    # Static backend (no cf-orch) — skip if not reachable.
+                if not self._is_reachable(backend["base_url"]):
                    print(f"[LLMRouter] {name}: unreachable, skipping")
                    continue
                try:
@@ -349,14 +118,10 @@ class LLMRouter:
                    if images and supports_images:
                        content = [{"type": "text", "text": prompt}]
                        for img in images:
-                            content.append(
-                                {
-                                    "type": "image_url",
-                                    "image_url": {
-                                        "url": f"data:image/png;base64,{img}"
-                                    },
-                                }
-                            )
+                            content.append({
+                                "type": "image_url",
+                                "image_url": {"url": f"data:image/png;base64,{img}"},
+                            })
                        messages.append({"role": "user", "content": content})
                    else:
                        messages.append({"role": "user", "content": prompt})
@@ -371,37 +136,22 @@ class LLMRouter:
                except Exception as e:
                    print(f"[LLMRouter] {name}: error — {e}, trying next")
                    continue
-                finally:
-                    if orch_ctx is not None:
-                        try:
-                            orch_ctx.__exit__(None, None, None)
-                        except Exception:
-                            pass

            elif backend["type"] == "anthropic":
                api_key = os.environ.get(backend["api_key_env"], "")
                if not api_key:
-                    print(
-                        f"[LLMRouter] {name}: {backend['api_key_env']} not set, skipping"
-                    )
+                    print(f"[LLMRouter] {name}: {backend['api_key_env']} not set, skipping")
                    continue
                try:
                    import anthropic as _anthropic
-
                    client = _anthropic.Anthropic(api_key=api_key)
                    if images and supports_images:
                        content = []
                        for img in images:
-                            content.append(
-                                {
-                                    "type": "image",
-                                    "source": {
-                                        "type": "base64",
-                                        "media_type": "image/png",
-                                        "data": img,
-                                    },
-                                }
-                            )
+                            content.append({
+                                "type": "image",
+                                "source": {"type": "base64", "media_type": "image/png", "data": img},
+                            })
                        content.append({"type": "text", "text": prompt})
                    else:
                        content = prompt
@@ -421,84 +171,6 @@ class LLMRouter:

        raise RuntimeError("All LLM backends exhausted")

-    def embed(
-        self,
-        texts: list[str],
-        model_override: str | None = None,
-        fallback_order: list[str] | None = None,
-    ) -> list[list[float]]:
-        """
-        Generate embeddings for a list of texts.
-
-        Only openai_compat backends are tried — Ollama and vLLM expose
-        /v1/embeddings; anthropic and vision_service do not.
-
-        Uses ``embedding_model`` from backend config when present;
-        falls back to ``model`` (the chat model) otherwise.
-
-        Args:
-            texts:          Texts to embed (batched in a single API call).
-            model_override: Override the embedding model for this call.
-            fallback_order: Override the backend fallback order for this call.
-
-        Returns:
-            List of float vectors, one per input text, in input order.
-
-        Raises:
-            RuntimeError: If all eligible backends are exhausted.
-        """
-        if os.environ.get("DEMO_MODE", "").lower() in ("1", "true", "yes"):
-            raise RuntimeError(
-                "AI inference is disabled in the public demo. "
-                "Run your own instance to use AI features."
-            )
-        order = (
-            fallback_order
-            if fallback_order is not None
-            else self.config["fallback_order"]
-        )
-        for name in order:
-            backend = self.config["backends"][name]
-            if not backend.get("enabled", True):
-                continue
-            if backend["type"] != "openai_compat":
-                continue
-
-            orch_ctx = orch_alloc = None
-            orch_result = self._try_cf_orch_alloc(backend)
-            if orch_result is not None:
-                orch_ctx, orch_alloc = orch_result
-                backend = {**backend, "base_url": orch_alloc.url + "/v1"}
-            elif not self._is_reachable(backend["base_url"]):
-                print(f"[LLMRouter] {name}: unreachable, skipping")
-                continue
-
-            embed_model = model_override or backend.get(
-                "embedding_model", backend["model"]
-            )
-            self._check_ollama_model_pulled(backend["base_url"], embed_model)
-
-            try:
-                client = OpenAI(
-                    base_url=backend["base_url"],
-                    api_key=backend.get("api_key") or "any",
-                )
-                model = embed_model
-                resp = client.embeddings.create(model=model, input=texts)
-                print(f"[LLMRouter] embed: used backend {name} ({model})")
-                return [item.embedding for item in resp.data]
-            except Exception as e:
-                print(f"[LLMRouter] {name}: embed error — {e}, trying next")
-                continue
-            finally:
-                if orch_ctx is not None:
-                    try:
-                        orch_ctx.__exit__(None, None, None)
-                    except Exception:
-                        pass
-
-        raise RuntimeError("All LLM backends exhausted for embed()")
-

 # Module-level singleton for convenience
 _router: LLMRouter | None = None
--- a/circuitforge_core/manage/__init__.py
+++ b/circuitforge_core/manage/__init__.py
@@ -1,12 +0,0 @@
-"""circuitforge_core.manage — cross-platform product process manager."""
-from .config import ManageConfig, NativeService
-from .docker_mode import DockerManager, docker_available
-from .native_mode import NativeManager
-
-__all__ = [
-    "ManageConfig",
-    "NativeService",
-    "DockerManager",
-    "docker_available",
-    "NativeManager",
-]
--- a/circuitforge_core/manage/__main__.py
+++ b/circuitforge_core/manage/__main__.py
@ -1,4 +0,0 @@
-"""Entry point for `python -m circuitforge_core.manage`."""
-from .cli import app
-
-app()
--- a/circuitforge_core/manage/cli.py
+++ b/circuitforge_core/manage/cli.py
@ -1,237 +0,0 @@
-"""
-circuitforge_core.manage.cli — cross-platform product manager CLI.
-
-Usage (from any product directory):
-    python -m circuitforge_core.manage start
-    python -m circuitforge_core.manage stop
-    python -m circuitforge_core.manage restart
-    python -m circuitforge_core.manage status
-    python -m circuitforge_core.manage logs [SERVICE]
-    python -m circuitforge_core.manage open
-    python -m circuitforge_core.manage build
-    python -m circuitforge_core.manage install-shims
-
-Products shim into this via a thin manage.sh / manage.ps1 that finds Python
-and delegates: exec python -m circuitforge_core.manage "$@"
-"""
-from __future__ import annotations
-
-import sys
-import webbrowser
-from enum import Enum
-from pathlib import Path
-from typing import Annotated, Optional
-
-import typer
-
-from .config import ManageConfig
-from .docker_mode import DockerManager, docker_available
-from .native_mode import NativeManager
-
-app = typer.Typer(
-    name="manage",
-    help="CircuitForge cross-platform product manager",
-    no_args_is_help=True,
-)
-
-
-class Mode(str, Enum):
-    """Execution mode accepted by each command's ``mode`` parameter."""
-    # "auto" is resolved by _resolve(): Docker when it is usable and the
-    # compose file exists, otherwise native processes.
-    auto = "auto"
-    # Always use DockerManager.
-    docker = "docker"
-    # Always use NativeManager.
-    native = "native"
-
-
-def _resolve(
-    mode: Mode,
-    root: Path,
-    config: ManageConfig,
-) -> tuple[str, DockerManager | NativeManager]:
-    """
-    Choose the manager implementation for this invocation.
-
-    Returns a ``(mode_name, manager)`` pair where ``mode_name`` is either
-    ``"docker"`` or ``"native"``.  An explicit ``Mode.docker`` always selects
-    Docker; ``Mode.auto`` selects Docker only when Docker is reachable and the
-    configured compose file exists under ``root``; everything else is native.
-    """
-    if mode == Mode.docker:
-        return "docker", DockerManager(config, root)
-
-    # Short-circuit order matters: Docker is only probed in auto mode.
-    auto_picks_docker = (
-        mode == Mode.auto
-        and docker_available()
-        and (root / config.docker.compose_file).exists()
-    )
-    if auto_picks_docker:
-        return "docker", DockerManager(config, root)
-
-    return "native", NativeManager(config, root)
-
-
-def _load(root: Path) -> ManageConfig:
-    """Return the ManageConfig for the product rooted at ``root``."""
-    loaded = ManageConfig.from_cwd(root)
-    return loaded
-
-
-# ── commands ──────────────────────────────────────────────────────────────────
-
-@app.command()
-def start(
-    service: Annotated[Optional[str], typer.Argument(help="Service name (omit for all)")] = None,
-    mode: Mode = Mode.auto,
-    root: Path = Path("."),
-) -> None:
-    """Start services."""
-    # The docstring above doubles as the command's help text, so it is kept
-    # short; details live in these comments.
-    #
-    # service: one service to start, or None for every configured service.
-    # mode:    auto / docker / native (see _resolve).
-    # root:    product directory containing manage.toml / the compose file.
-    project_root = root.resolve()
-    config = _load(project_root)
-    mode_name, mgr = _resolve(mode, project_root, config)
-    typer.echo(f"[{config.app_name}] Starting ({mode_name} mode)…")
-
-    if isinstance(mgr, DockerManager):
-        # Docker mode takes "" to mean "all services".
-        mgr.start(service or "")
-        return
-
-    try:
-        started = mgr.start(service)
-    except ValueError as exc:
-        # NativeManager.start raises ValueError for a service name that is not
-        # configured; report it as a CLI error instead of a traceback.
-        typer.echo(f"[{config.app_name}] {exc}", err=True)
-        raise typer.Exit(1) from None
-
-    if started:
-        typer.echo(f"[{config.app_name}] Started: {', '.join(started)}")
-    else:
-        typer.echo(f"[{config.app_name}] All services already running")
-
-
-@app.command()
-def stop(
-    service: Annotated[Optional[str], typer.Argument(help="Service name (omit for all)")] = None,
-    mode: Mode = Mode.auto,
-    root: Path = Path("."),
-) -> None:
-    """Stop services."""
-    # service: one service to stop, or None for every configured service.
-    project_root = root.resolve()
-    config = _load(project_root)
-    mode_name, mgr = _resolve(mode, project_root, config)
-    typer.echo(f"[{config.app_name}] Stopping ({mode_name} mode)…")
-
-    if isinstance(mgr, DockerManager):
-        # Docker mode takes "" to mean "all services".
-        mgr.stop(service or "")
-        return
-
-    stopped = mgr.stop(service)
-    if not stopped:
-        typer.echo(f"[{config.app_name}] No running services to stop")
-        return
-    typer.echo(f"[{config.app_name}] Stopped: {', '.join(stopped)}")
-
-
-@app.command()
-def restart(
-    service: Annotated[Optional[str], typer.Argument(help="Service name (omit for all)")] = None,
-    mode: Mode = Mode.auto,
-    root: Path = Path("."),
-) -> None:
-    """Restart services."""
-    # service: one service to restart, or None for every configured service.
-    project_root = root.resolve()
-    config = _load(project_root)
-    mode_name, mgr = _resolve(mode, project_root, config)
-    typer.echo(f"[{config.app_name}] Restarting ({mode_name} mode)…")
-
-    if isinstance(mgr, DockerManager):
-        mgr.restart(service or "")
-        return
-
-    # Native mode has no restart primitive: stop, then start again.
-    mgr.stop(service)
-    try:
-        mgr.start(service)
-    except ValueError as exc:
-        # Unknown service name: report it as a CLI error instead of a traceback.
-        typer.echo(f"[{config.app_name}] {exc}", err=True)
-        raise typer.Exit(1) from None
-
-
-@app.command()
-def status(
-    mode: Mode = Mode.auto,
-    root: Path = Path("."),
-) -> None:
-    """Show service status."""
-    project_root = root.resolve()
-    config = _load(project_root)
-    _, mgr = _resolve(mode, project_root, config)
-
-    if isinstance(mgr, DockerManager):
-        # Docker mode prints its own table via `compose ps`.
-        mgr.status()
-        return
-
-    rows = mgr.status()
-    if not rows:
-        typer.echo(f"[{config.app_name}] No native services defined in manage.toml")
-        return
-
-    typer.echo(f"\n  {config.app_name} — native services\n")
-    for svc in rows:
-        # Green filled dot = running, red hollow dot = not running.
-        if svc.running:
-            indicator = typer.style("●", fg=typer.colors.GREEN)
-        else:
-            indicator = typer.style("○", fg=typer.colors.RED)
-        pid_str = f"  pid={svc.pid}" if svc.pid else ""
-        port_str = f"  port={svc.port}" if svc.port else ""
-        typer.echo(f"  {indicator} {svc.name:<20}{pid_str}{port_str}")
-    typer.echo("")
-
-
-@app.command()
-def logs(
-    service: Annotated[Optional[str], typer.Argument(help="Service name")] = None,
-    follow: bool = typer.Option(True, "--follow/--no-follow", "-f/-F"),
-    mode: Mode = Mode.auto,
-    root: Path = Path("."),
-) -> None:
-    """Tail service logs."""
-    project_root = root.resolve()
-    config = _load(project_root)
-    _, mgr = _resolve(mode, project_root, config)
-
-    if isinstance(mgr, DockerManager):
-        # Docker mode takes "" to mean "all services".
-        mgr.logs(service or "", follow=follow)
-        return
-
-    # Native mode tails exactly one log file; fall back to the first
-    # configured service when none was named.
-    if not service and not config.services:
-        typer.echo("No native services defined", err=True)
-        raise typer.Exit(1)
-    target_service = service if service else config.services[0].name
-    mgr.logs(target_service, follow=follow)
-
-
-@app.command()
-def build(
-    no_cache: bool = False,
-    mode: Mode = Mode.auto,
-    root: Path = Path("."),
-) -> None:
-    """Build/rebuild service images (Docker mode only)."""
-    project_root = root.resolve()
-    config = _load(project_root)
-    _, mgr = _resolve(mode, project_root, config)
-
-    # There is nothing to build for native processes.
-    if isinstance(mgr, NativeManager):
-        typer.echo("build is only available in Docker mode", err=True)
-        raise typer.Exit(1)
-
-    typer.echo(f"[{config.app_name}] Building images…")
-    mgr.build(no_cache=no_cache)
-
-
-@app.command("open")
-def open_browser(
-    url: Annotated[Optional[str], typer.Option(help="Override URL")] = None,
-    root: Path = Path("."),
-) -> None:
-    """Open the product web UI in the default browser."""
-    config = _load(root.resolve())
-
-    # An explicit --url wins over default_url from manage.toml.
-    target = url if url else config.default_url
-    if target:
-        typer.echo(f"Opening {target}")
-        webbrowser.open(target)
-        return
-
-    typer.echo("No URL configured. Set default_url in manage.toml or pass --url.", err=True)
-    raise typer.Exit(1)
-
-
-@app.command("install-shims")
-def install_shims(
-    root: Path = Path("."),
-    force: bool = typer.Option(False, "--force", help="Overwrite existing shims"),
-) -> None:
-    """
-    Write manage.sh and manage.ps1 shims into the product directory.
-
-    The shims auto-detect the Python environment (conda, venv, or system Python)
-    and delegate all arguments to `python -m circuitforge_core.manage`.
-    """
-    from importlib.resources import files as _res_files
-
-    target = root.resolve()
-    templates_pkg = "circuitforge_core.manage.templates"
-
-    for filename in ("manage.sh", "manage.ps1"):
-        dest = target / filename
-        if dest.exists() and not force:
-            typer.echo(f"  skipped {filename} (already exists — use --force to overwrite)")
-            continue
-        # Copy bytes, not text: text mode would decode with the locale encoding
-        # and, on Windows, rewrite "\n" as "\r\n" — which breaks manage.sh
-        # under bash and can mangle the non-ASCII characters in the templates.
-        dest.write_bytes((_res_files(templates_pkg) / filename).read_bytes())
-        if filename.endswith(".sh"):
-            dest.chmod(dest.stat().st_mode | 0o111)  # make executable
-        typer.echo(f"  wrote {dest}")
-
-    # The example config is never clobbered unless --force is given.
-    toml_example = target / "manage.toml.example"
-    if not toml_example.exists() or force:
-        toml_example.write_bytes(
-            (_res_files(templates_pkg) / "manage.toml.example").read_bytes()
-        )
-        typer.echo(f"  wrote {toml_example}")
-
-    typer.echo("\nDone. Rename manage.toml.example → manage.toml and edit for your services.")
-
-
-if __name__ == "__main__":
-    app()
--- a/circuitforge_core/manage/config.py
+++ b/circuitforge_core/manage/config.py
@ -1,119 +0,0 @@
-"""
-circuitforge_core.manage.config — ManageConfig parsed from manage.toml.
-
-Products drop a manage.toml in their root directory.  The manage CLI
-(`python -m circuitforge_core.manage`) reads it to discover the app name,
-compose file, and native service definitions.
-
-Minimal manage.toml (Docker-only):
----------------------------------------------------------------------
-[app]
-name = "kiwi"
-default_url = "http://localhost:8511"
----------------------------------------------------------------------
-
-Full manage.toml (Docker + native services):
----------------------------------------------------------------------
-[app]
-name = "kiwi"
-default_url = "http://localhost:8511"
-
-[docker]
-compose_file = "compose.yml"     # default
-project = "kiwi"                 # defaults to app.name
-
-[[native.services]]
-name = "api"
-command = "uvicorn app.main:app --host 0.0.0.0 --port 8512"
-port = 8512
-
-[[native.services]]
-name = "frontend"
-command = "npm run preview -- --host --port 8511"
-port = 8511
-cwd = "frontend"
----------------------------------------------------------------------
-"""
-from __future__ import annotations
-
-import sys
-from dataclasses import dataclass, field
-from pathlib import Path
-
-if sys.version_info >= (3, 11):
-    import tomllib
-else:
-    try:
-        import tomllib  # type: ignore[no-redef]
-    except ImportError:
-        import tomli as tomllib  # type: ignore[no-redef]
-
-_DEFAULT_COMPOSE_FILE = "compose.yml"
-
-
-@dataclass
-class NativeService:
-    """One process to manage in native mode (one ``[[native.services]]`` entry)."""
-    # Service name as given in manage.toml.
-    name: str
-    command: str                        # shell command string
-    port: int = 0                       # for status / open URL
-    cwd: str = ""                       # relative to project root; "" = root
-    # Extra environment variables for the process; empty by default.
-    env: dict[str, str] = field(default_factory=dict)
-
-
-@dataclass
-class DockerConfig:
-    """Docker Compose settings (the ``[docker]`` table of manage.toml)."""
-    # Compose file path; DockerManager joins it onto the product root.
-    compose_file: str = _DEFAULT_COMPOSE_FILE
-    project: str = ""                   # docker compose -p; defaults to app name
-
-
-@dataclass
-class ManageConfig:
-    """Product configuration, either parsed from manage.toml or inferred."""
-    # Product name, used for display and as the default compose project name.
-    app_name: str
-    # URL for the `open` command; "" means none configured.
-    default_url: str = ""
-    docker: DockerConfig = field(default_factory=DockerConfig)
-    # Native-mode processes, in the order they appear in manage.toml.
-    services: list[NativeService] = field(default_factory=list)
-
-    @classmethod
-    def load(cls, path: Path) -> "ManageConfig":
-        """
-        Load from a manage.toml file.
-
-        Missing tables and keys fall back to defaults; a missing or empty
-        ``app.name`` falls back to the name of the directory holding the file.
-        Each ``[[native.services]]`` entry must provide ``name`` and
-        ``command`` (KeyError otherwise).
-        """
-        # TOML is UTF-8 by specification; decode explicitly so the platform's
-        # locale encoding (e.g. cp1252 on Windows) is never used.
-        raw = tomllib.loads(path.read_text(encoding="utf-8"))
-        app = raw.get("app", {})
-        name = app.get("name") or path.parent.name  # fallback to directory name
-        default_url = app.get("default_url", "")
-
-        docker_raw = raw.get("docker", {})
-        docker = DockerConfig(
-            compose_file=docker_raw.get("compose_file", _DEFAULT_COMPOSE_FILE),
-            project=docker_raw.get("project", name),
-        )
-
-        services = [
-            NativeService(
-                name=svc["name"],
-                command=svc["command"],
-                port=svc.get("port", 0),
-                cwd=svc.get("cwd", ""),
-                env=svc.get("env", {}),
-            )
-            for svc in raw.get("native", {}).get("services", [])
-        ]
-
-        return cls(
-            app_name=name,
-            default_url=default_url,
-            docker=docker,
-            services=services,
-        )
-
-    @classmethod
-    def from_cwd(cls, cwd: Path | None = None) -> "ManageConfig":
-        """
-        Load from manage.toml in cwd, or return a minimal config derived from
-        the directory name if no manage.toml exists (Docker-only products work
-        without one).
-        """
-        root = cwd or Path.cwd()
-        toml_path = root / "manage.toml"
-        if toml_path.exists():
-            return cls.load(toml_path)
-        # Fallback: only the app name is inferred; everything else keeps its
-        # dataclass default (including the default compose file name).
-        return cls(app_name=root.name)
--- a/circuitforge_core/manage/docker_mode.py
+++ b/circuitforge_core/manage/docker_mode.py
@ -1,115 +0,0 @@
-"""
-circuitforge_core.manage.docker_mode — Docker Compose wrapper.
-
-All commands delegate to `docker compose` (v2 plugin syntax).
-Falls back to `docker-compose` (v1 standalone) if the plugin is unavailable.
-"""
-from __future__ import annotations
-
-import shutil
-import subprocess
-import sys
-from pathlib import Path
-
-from .config import ManageConfig
-
-
-def _compose_plugin_available() -> bool:
-    """Return True if `docker compose version` runs and exits with status 0."""
-    try:
-        probe = subprocess.run(
-            ["docker", "compose", "version"],
-            stdout=subprocess.DEVNULL,
-            stderr=subprocess.DEVNULL,
-            timeout=5,
-        )
-    except Exception:
-        # Missing binary, timeout, permission error…: treat as "no plugin".
-        return False
-    return probe.returncode == 0
-
-
-def _compose_bin() -> list[str]:
-    """
-    Return the docker compose command as a list (handles v1/v2 difference).
-
-    Preference order:
-      1. ``docker compose``  — v2 plugin, when `docker` is on PATH and the
-         plugin actually responds.
-      2. ``docker-compose``  — v1 standalone binary.
-      3. ``docker compose``  — `docker` exists but neither variant was
-         confirmed; returned so the failure message comes from docker itself.
-
-    Raises:
-        RuntimeError: neither `docker` nor `docker-compose` is on PATH.
-    """
-    has_docker = shutil.which("docker") is not None
-    # Having `docker` on PATH does not imply the compose plugin is installed,
-    # so probe it before preferring the v2 syntax.
-    if has_docker and _compose_plugin_available():
-        return ["docker", "compose"]
-    if shutil.which("docker-compose"):
-        return ["docker-compose"]
-    if has_docker:
-        return ["docker", "compose"]
-    raise RuntimeError("Neither 'docker' nor 'docker-compose' found on PATH")
-
-
-def docker_available() -> bool:
-    """
-    Return True if Docker is reachable (docker info succeeds).
-
-    "Succeeds" means the command ran and exited with status 0 within five
-    seconds.  A missing binary, a timeout, or a non-zero exit status all
-    yield False.
-    """
-    try:
-        result = subprocess.run(
-            ["docker", "info"],
-            stdout=subprocess.DEVNULL,
-            stderr=subprocess.DEVNULL,
-            timeout=5,
-        )
-    except Exception:
-        # Best-effort probe: any failure to run the command means "no Docker".
-        return False
-    # subprocess.run does not raise on a non-zero exit unless check=True, so
-    # the exit status has to be inspected explicitly.
-    return result.returncode == 0
-
-
-class DockerManager:
-    """
-    Thin wrapper that runs compose subcommands for one product directory.
-
-    Args:
-        config:   ManageConfig for the current product.
-        root:     Product root directory (where compose file lives).
-    """
-
-    def __init__(self, config: ManageConfig, root: Path) -> None:
-        self.config = config
-        self.root = root
-        self._compose_file = root / config.docker.compose_file
-
-    def _command(self, *args: str) -> list[str]:
-        """Build the full compose argv: binary, -f <file>, -p <project>, then args."""
-        project = self.config.docker.project or self.config.app_name
-        return [
-            *_compose_bin(),
-            "-f", str(self._compose_file),
-            "-p", project,
-            *args,
-        ]
-
-    def _run(self, *args: str, check: bool = True) -> subprocess.CompletedProcess:  # type: ignore[type-arg]
-        """Run a compose command in the product root and wait for it to finish."""
-        return subprocess.run(self._command(*args), cwd=self.root, check=check)
-
-    def _stream(self, *args: str) -> None:
-        """Run a compose command, streaming output directly to the terminal."""
-        with subprocess.Popen(self._command(*args), cwd=self.root) as proc:
-            try:
-                proc.wait()
-            except KeyboardInterrupt:
-                # Ctrl-C ends the stream; ask the child to exit as well.
-                proc.terminate()
-
-    def compose_file_exists(self) -> bool:
-        """Return True if the configured compose file is present."""
-        return self._compose_file.exists()
-
-    def start(self, service: str = "") -> None:
-        """Run `up -d --build` for one service, or for all when ``service`` is empty."""
-        selected = [service] if service else []
-        self._run("up", "-d", "--build", *selected)
-
-    def stop(self, service: str = "") -> None:
-        """Run `stop <service>` for a single service, or `down` for the whole project."""
-        if not service:
-            self._run("down")
-            return
-        self._run("stop", service)
-
-    def restart(self, service: str = "") -> None:
-        """Run `restart` for one service, or for all when ``service`` is empty."""
-        selected = [service] if service else []
-        self._run("restart", *selected)
-
-    def status(self) -> None:
-        """Run `ps`; a non-zero exit status is tolerated (check=False)."""
-        self._run("ps", check=False)
-
-    def logs(self, service: str = "", follow: bool = True) -> None:
-        """Stream `logs`, with `-f` when ``follow`` is set, optionally for one service."""
-        extra: list[str] = []
-        if follow:
-            extra.append("-f")
-        if service:
-            extra.append(service)
-        self._stream("logs", *extra)
-
-    def build(self, no_cache: bool = False) -> None:
-        """Run `build`, adding `--no-cache` when requested."""
-        flags = ["--no-cache"] if no_cache else []
-        self._run("build", *flags)
--- a/circuitforge_core/manage/native_mode.py
+++ b/circuitforge_core/manage/native_mode.py
@ -1,217 +0,0 @@
-"""
-circuitforge_core.manage.native_mode — PID-file process manager.
-
-Manages processes directly without Docker.  Designed for Windows (no WSL2,
-no Docker), but works identically on Linux/macOS.
-
-Platform conventions (via platformdirs):
-  PID files : user_runtime_dir(app_name) / <service>.pid
-  Log files : user_log_dir(app_name)     / <service>.log
-
-PID file format (one line each):
-  <pid>
-  <command_fingerprint>   (first 80 chars of command — recorded so a PID can
-                           be sanity-checked against our process rather than a
-                           recycled one; currently written but not verified
-                           when the PID file is read back)
-"""
-from __future__ import annotations
-
-import os
-import platform
-import shlex
-import subprocess
-import sys
-import time
-from dataclasses import dataclass
-from pathlib import Path
-
-from platformdirs import user_log_dir, user_runtime_dir
-
-from .config import ManageConfig, NativeService
-
-_IS_WINDOWS = platform.system() == "Windows"
-_LOG_TAIL_LINES = 50
-_FOLLOW_POLL_S = 0.25
-
-
-@dataclass
-class ServiceStatus:
-    """Snapshot of one native service, as produced by NativeManager.status()."""
-    name: str
-    # True when a PID file exists and that PID is alive.
-    running: bool
-    # PID of the running process; None when the service is not running.
-    pid: int | None
-    # Port copied from the service definition (0 when not configured).
-    port: int
-    # Where the service's stdout/stderr are appended.
-    log_path: Path
-
-
-class NativeManager:
-    """
-    Start, stop, and monitor native processes for a product.
-
-    State is kept on disk: one PID file and one log file per service, in
-    the platformdirs runtime and log directories for the app name.
-
-    Args:
-        config: ManageConfig for the current product.
-        root:   Product root directory.
-    """
-
-    def __init__(self, config: ManageConfig, root: Path) -> None:
-        self.config = config
-        self.root = root
-        self._pid_dir = Path(user_runtime_dir(config.app_name, ensure_exists=True))
-        self._log_dir = Path(user_log_dir(config.app_name, ensure_exists=True))
-
-    # ── helpers ───────────────────────────────────────────────────────────────
-
-    def _pid_path(self, name: str) -> Path:
-        """Path of the PID file for service ``name``."""
-        return self._pid_dir / f"{name}.pid"
-
-    def _log_path(self, name: str) -> Path:
-        """Path of the log file for service ``name``."""
-        return self._log_dir / f"{name}.log"
-
-    def _write_pid(self, name: str, pid: int, command: str) -> None:
-        """Write the PID file: the PID on line 1, the first 80 chars of the command on line 2."""
-        self._pid_path(name).write_text(f"{pid}\n{command[:80]}\n")
-
-    def _read_pid(self, name: str) -> int | None:
-        """Return the PID recorded for ``name``, or None if missing or unparsable."""
-        p = self._pid_path(name)
-        if not p.exists():
-            return None
-        try:
-            # Only the first line is read; the fingerprint line is ignored.
-            return int(p.read_text().splitlines()[0].strip())
-        except (ValueError, IndexError):
-            return None
-
-    def _pid_alive(self, pid: int) -> bool:
-        """Return True if a process with this PID is currently running."""
-        if _IS_WINDOWS:
-            try:
-                result = subprocess.run(
-                    ["tasklist", "/FI", f"PID eq {pid}", "/NH"],
-                    capture_output=True, text=True,
-                )
-                return str(pid) in result.stdout
-            except Exception:
-                return False
-        else:
-            try:
-                os.kill(pid, 0)   # signal 0 = existence check only
-                return True
-            except (OSError, ProcessLookupError):
-                return False
-
-    def _kill(self, pid: int) -> None:
-        """Terminate a process gracefully, then force-kill if needed."""
-        if _IS_WINDOWS:
-            # Windows path goes straight to a forced kill.
-            subprocess.run(["taskkill", "/F", "/PID", str(pid)],
-                           capture_output=True)
-        else:
-            import signal
-            try:
-                os.kill(pid, signal.SIGTERM)
-                for _ in range(30):          # wait up to 3 s
-                    time.sleep(0.1)
-                    if not self._pid_alive(pid):
-                        return
-                os.kill(pid, signal.SIGKILL)
-            except (OSError, ProcessLookupError):
-                # Process already gone (or not ours to signal): nothing to do.
-                pass
-
-    def _svc(self, name: str) -> NativeService | None:
-        """Return the configured service called ``name``, or None."""
-        return next((s for s in self.config.services if s.name == name), None)
-
-    # ── public API ────────────────────────────────────────────────────────────
-
-    def is_running(self, name: str) -> bool:
-        """Return True if ``name`` has a PID file whose PID is alive."""
-        pid = self._read_pid(name)
-        return pid is not None and self._pid_alive(pid)
-
-    def status(self) -> list[ServiceStatus]:
-        """Return one ServiceStatus per configured service, in config order."""
-        result = []
-        for svc in self.config.services:
-            pid = self._read_pid(svc.name)
-            running = pid is not None and self._pid_alive(pid)
-            result.append(ServiceStatus(
-                name=svc.name,
-                running=running,
-                pid=pid if running else None,   # hide stale PIDs
-                port=svc.port,
-                log_path=self._log_path(svc.name),
-            ))
-        return result
-
-    def start(self, name: str | None = None) -> list[str]:
-        """
-        Start one or all services. Returns list of started service names.
-
-        Services that are already running are skipped and not reported.
-
-        Raises:
-            ValueError: ``name`` does not match any configured service.
-        """
-        targets = [self._svc(name)] if name else self.config.services
-        started: list[str] = []
-        for svc in targets:
-            if svc is None:
-                raise ValueError(f"Unknown service: {name!r}")
-            if self.is_running(svc.name):
-                continue
-            cwd = (self.root / svc.cwd) if svc.cwd else self.root
-            env = {**os.environ, **svc.env}
-            if _IS_WINDOWS:
-                cmd = svc.command          # Windows: pass as string to shell
-                shell = True
-            else:
-                cmd = shlex.split(svc.command)
-                shell = False
-            # The child gets its own copy of the log file descriptor, so the
-            # parent's handle is closed as soon as the process is spawned
-            # instead of being leaked for every started service.
-            with open(self._log_path(svc.name), "a") as log_file:
-                proc = subprocess.Popen(
-                    cmd,
-                    cwd=cwd,
-                    env=env,
-                    shell=shell,
-                    stdout=log_file,
-                    stderr=log_file,
-                    start_new_session=True,    # detach from terminal (Unix)
-                )
-            self._write_pid(svc.name, proc.pid, svc.command)
-            started.append(svc.name)
-        return started
-
-    def stop(self, name: str | None = None) -> list[str]:
-        """
-        Stop one or all services. Returns list of stopped service names.
-
-        The PID file is removed whether or not the process was still alive,
-        which also cleans up stale files.
-        """
-        names = [name] if name else [s.name for s in self.config.services]
-        stopped: list[str] = []
-        for n in names:
-            pid = self._read_pid(n)
-            if pid and self._pid_alive(pid):
-                self._kill(pid)
-                stopped.append(n)
-            pid_path = self._pid_path(n)
-            if pid_path.exists():
-                pid_path.unlink()
-        return stopped
-
-    def logs(self, name: str, follow: bool = True, lines: int = _LOG_TAIL_LINES) -> None:
-        """
-        Print the last N lines of a service log, then optionally follow.
-
-        Uses polling rather than `tail -f` so it works on Windows.  Following
-        runs until interrupted with Ctrl-C.
-        """
-        log_path = self._log_path(name)
-        if not log_path.exists():
-            print(f"[{name}] No log file found at {log_path}", file=sys.stderr)
-            return
-
-        # Print last N lines
-        content = log_path.read_bytes()
-        lines_data = content.splitlines()[-lines:]
-        for line in lines_data:
-            print(line.decode("utf-8", errors="replace"))
-
-        if not follow:
-            return
-
-        # Poll for new content
-        offset = len(content)
-        try:
-            while True:
-                time.sleep(_FOLLOW_POLL_S)
-                new_size = log_path.stat().st_size
-                if new_size < offset:
-                    # File was truncated or replaced: start again from the top
-                    # rather than waiting for it to outgrow the old offset.
-                    offset = 0
-                if new_size > offset:
-                    with open(log_path, "rb") as f:
-                        f.seek(offset)
-                        chunk = f.read()
-                    offset = new_size
-                    for line in chunk.splitlines():
-                        print(line.decode("utf-8", errors="replace"))
-        except KeyboardInterrupt:
-            pass
--- a/circuitforge_core/manage/templates/manage.ps1
+++ b/circuitforge_core/manage/templates/manage.ps1
@ -1,30 +0,0 @@
-# manage.ps1 — CircuitForge cross-platform product manager shim (Windows)
-#
-# Auto-detects the Python environment and delegates to
-# `python -m circuitforge_core.manage`.
-#
-# Generated by: python -m circuitforge_core.manage install-shims
-# Do not edit the logic here; edit manage.toml for product configuration.
-
-# ── Python detection ──────────────────────────────────────────────────────────
-# Order of preference: .venv, venv, active conda env, python, python3.
-# The venv paths are relative, so they are looked up in the current directory.
-$Python = $null
-
-if (Test-Path ".venv\Scripts\python.exe") {
-    $Python = ".venv\Scripts\python.exe"
-} elseif (Test-Path "venv\Scripts\python.exe") {
-    $Python = "venv\Scripts\python.exe"
-} elseif ($env:CONDA_DEFAULT_ENV -and (Get-Command conda -ErrorAction SilentlyContinue)) {
-    # Conda: run via `conda run` so the env is activated correctly
-    # This branch invokes the CLI itself and exits with its exit code.
-    & conda run -n $env:CONDA_DEFAULT_ENV python -m circuitforge_core.manage @args
-    exit $LASTEXITCODE
-} elseif (Get-Command python -ErrorAction SilentlyContinue) {
-    $Python = "python"
-} elseif (Get-Command python3 -ErrorAction SilentlyContinue) {
-    $Python = "python3"
-} else {
-    Write-Error "No Python interpreter found. Install Python 3.11+, activate a venv, or activate a conda environment."
-    exit 1
-}
-
-# Forward every argument unchanged and propagate the CLI's exit code.
-& $Python -m circuitforge_core.manage @args
-exit $LASTEXITCODE
--- a/circuitforge_core/manage/templates/manage.sh
+++ b/circuitforge_core/manage/templates/manage.sh
@ -1,28 +0,0 @@
-#!/usr/bin/env bash
-# manage.sh — CircuitForge cross-platform product manager shim
-#
-# Auto-detects the Python environment and delegates to
-# `python -m circuitforge_core.manage`.
-#
-# Generated by: python -m circuitforge_core.manage install-shims
-# Do not edit the logic here; edit manage.toml for product configuration.
-set -euo pipefail
-
-# ── Python detection ──────────────────────────────────────────────────────────
-# Order of preference: .venv, venv, active conda env, python3, python.
-# PYTHON is an array so the multi-word conda launcher is passed as separate
-# arguments without relying on unquoted word splitting (which would also
-# glob-expand and would break on an environment name containing spaces).
-if [ -f ".venv/bin/python" ]; then
-    PYTHON=(".venv/bin/python")
-elif [ -f "venv/bin/python" ]; then
-    PYTHON=("venv/bin/python")
-elif command -v conda &>/dev/null && [ -n "${CONDA_DEFAULT_ENV:-}" ]; then
-    PYTHON=(conda run -n "${CONDA_DEFAULT_ENV}" python)
-elif command -v python3 &>/dev/null; then
-    PYTHON=(python3)
-elif command -v python &>/dev/null; then
-    PYTHON=(python)
-else
-    echo "ERROR: No Python interpreter found." >&2
-    echo "Install Python 3.11+, activate a venv, or activate a conda environment." >&2
-    exit 1
-fi
-
-# Replace this shell with the CLI, forwarding every argument unchanged.
-exec "${PYTHON[@]}" -m circuitforge_core.manage "$@"
--- a/circuitforge_core/manage/templates/manage.toml.example
+++ b/circuitforge_core/manage/templates/manage.toml.example
@ -1,38 +0,0 @@
-# manage.toml — CircuitForge product manager configuration
-#
-# Drop this file (renamed from manage.toml.example) in your product root.
-# Docker-only products only need [app]; native services require [[native.services]].
-
-[app]
-# Product name — used for log/PID directory names and display.
-name = "myproduct"
-
-# URL opened by the `open` command (e.g. `./manage.sh open`). Typically the frontend port.
-default_url = "http://localhost:8511"
-
-[docker]
-# Path to the Docker Compose file, relative to this directory.
-compose_file = "compose.yml"
-
-# Docker Compose project name (defaults to app.name).
-# project = "myproduct"
-
-# ── Native mode services ───────────────────────────────────────────────────────
-# Define one [[native.services]] block per process.
-# Used when Docker is unavailable (Windows without Docker, or --mode native).
-
-[[native.services]]
-name = "api"
-# Full shell command to launch the backend.
-command = "uvicorn app.main:app --host 0.0.0.0 --port 8512 --reload"
-port = 8512
-# cwd is relative to the project root. Leave empty for the project root itself.
-cwd = ""
-# Optional extra environment variables.
-# env = { PYTHONPATH = ".", DEBUG = "1" }
-
-[[native.services]]
-name = "frontend"
-command = "npm run preview -- --host 0.0.0.0 --port 8511"
-port = 8511
-cwd = "frontend"
--- a/circuitforge_core/memory/__init__.py
+++ b/circuitforge_core/memory/__init__.py
@ -1,54 +0,0 @@
-"""circuitforge_core.memory — persistent knowledge graph via mnemo sidecar.
-
-MIT licensed.
-
-Requires the mnemo sidecar to be running (https://github.com/zaydmulani09/mnemo).
-If the sidecar is not available, all operations silently no-op so products
-can call memory methods unconditionally.
-
-Quick start (in a FastAPI lifespan)::
-
-    from circuitforge_core.memory import MemoryClient, MemoryConfig
-
-    memory = MemoryClient(MemoryConfig.from_env())
-
-    @asynccontextmanager
-    async def lifespan(app):
-        await memory.connect()
-        yield
-        await memory.close()
-
-    # In a route:
-    await memory.remember("User avoids shellfish", source="dietary-prefs")
-    context = await memory.recall("What are this user's food restrictions?")
-
-Docker Compose setup::
-
-    services:
-      mnemo:
-        image: ghcr.io/zaydmulani09/mnemo:latest
-        ports: ["8080:8080"]
-        environment:
-          MNEMO_LLM_PROVIDER: ollama
-          MNEMO_LLM_BASE_URL: http://ollama:11434/v1
-          MNEMO_LLM_MODEL: llama3
-        volumes:
-          - mnemo-data:/data
-
-Environment variables (for MemoryConfig.from_env())::
-
-    MNEMO_HOST     — default: localhost
-    MNEMO_PORT     — default: 8080
-    MNEMO_TIMEOUT  — default: 10.0
-"""
-
-from circuitforge_core.memory.client import MemoryClient, MemoryUnavailableError
-from circuitforge_core.memory.models import MemoryConfig, MemoryEntity, MemoryStats
-
-__all__ = [
-    "MemoryClient",
-    "MemoryConfig",
-    "MemoryEntity",
-    "MemoryStats",
-    "MemoryUnavailableError",
-]
--- a/circuitforge_core/memory/client.py
+++ b/circuitforge_core/memory/client.py
@ -1,317 +0,0 @@
-"""MemoryClient — async wrapper around the mnemo persistent knowledge graph.
-
-mnemo is an optional sidecar (https://github.com/zaydmulani09/mnemo).
-When the sidecar is not running, all operations silently no-op so products
-can call memory methods unconditionally without try/except.
-
-MIT licensed.
-"""
-from __future__ import annotations
-
-import logging
-import time
-from typing import Any
-
-from circuitforge_core.memory.models import MemoryConfig, MemoryEntity, MemoryStats
-
-logger = logging.getLogger(__name__)
-
-# Backoff schedule: 5 * 2^(failure-1), capped at _MAX_BACKOFF seconds.
-# failure 1 →  5s, 2 → 10s, 3 → 20s, 4 → 40s, 5+ → 60s
-_MAX_FAILURES: int = 3
-_MAX_BACKOFF: float = 60.0
-
-
-class MemoryUnavailableError(RuntimeError):
-    """Raised only when strict=True and mnemo is not reachable."""
-
-
-class MemoryClient:
-    """Async interface to the mnemo knowledge graph sidecar.
-
-    Resilience model:
-    - If the sidecar is unreachable at connect(), logs once and enters no-op mode.
-    - If a live call fails, the failure is counted. Each failure schedules an
-      exponentially increasing cooldown before the next reconnect attempt.
-    - After _MAX_FAILURES consecutive failures the client is marked unavailable;
-      all calls no-op until the cooldown elapses and a reconnect succeeds.
-    - Any successful call resets the failure counter.
-
-    Usage (in a FastAPI lifespan)::
-
-        from circuitforge_core.memory import MemoryClient, MemoryConfig
-
-        memory = MemoryClient(MemoryConfig.from_env())
-
-        @asynccontextmanager
-        async def lifespan(app):
-            await memory.connect()
-            yield
-            await memory.close()
-
-    Then in handlers::
-
-        await memory.remember("User prefers dark mode", source="settings")
-        context = await memory.recall("What are the user's UI preferences?")
-    """
-
-    def __init__(self, config: MemoryConfig | None = None, *, strict: bool = False) -> None:
-        """
-        Args:
-            config: connection settings; defaults to MemoryConfig.from_env()
-            strict: if True, MemoryUnavailableError is raised on connect failure
-                or after _MAX_FAILURES consecutive call failures
-        """
-        self._config = config or MemoryConfig.from_env()
-        self._strict = strict
-        self._available = False
-        self._client: Any = None       # mnemo AsyncMnemoClient, set in connect()
-        self._failure_count: int = 0
-        self._retry_at: float | None = None  # monotonic timestamp; None = no retry pending
-
-    @property
-    def available(self) -> bool:
-        """True if the mnemo sidecar was reachable at last health check."""
-        return self._available
-
-    @property
-    def failure_count(self) -> int:
-        """Consecutive call failures since the last success."""
-        return self._failure_count
-
-    # ── Lifecycle ─────────────────────────────────────────────────────────────
-
-    async def connect(self) -> None:
-        """Attempt to connect to the mnemo sidecar and run a health check.
-
-        Safe to call multiple times (used internally for reconnect). If the
-        mnemo SDK is not installed the method returns quietly with the
-        client marked unavailable. If the sidecar is unreachable or reports
-        a health status other than "ok", the failure is routed through
-        _handle_unavailable(), which logs a warning and enters no-op mode.
-
-        Raises:
-            MemoryUnavailableError: only when strict=True and the sidecar is
-                unreachable or unhealthy. The error is raised once, with a
-                single (non-nested) message.
-        """
-        try:
-            from mnemo import AsyncMnemoClient
-        except ImportError:
-            logger.debug(
-                "mnemo-sdk not installed — memory module disabled. "
-                "Install with: pip install circuitforge-core[memory]"
-            )
-            self._available = False
-            return
-
-        self._client = AsyncMnemoClient(
-            base_url=self._config.base_url,
-            timeout=self._config.timeout,
-        )
-        try:
-            health = await self._client.health()
-            if health.status == "ok":
-                self._available = True
-                self._on_call_success()
-                logger.info(
-                    "mnemo memory sidecar connected at %s (LLM: %s/%s)",
-                    self._config.base_url,
-                    health.provider_type,
-                    health.provider_model,
-                )
-            else:
-                self._handle_unavailable("connect", reason=f"health status={health.status!r}")
-        except MemoryUnavailableError:
-            # strict mode: _handle_unavailable already raised with the final
-            # message. Without this clause the broad handler below would catch
-            # it and wrap the message inside a second, identical prefix.
-            raise
-        except Exception as exc:
-            self._handle_unavailable("connect", reason=str(exc))
-
-    async def close(self) -> None:
-        """Close the underlying HTTP client and reset availability state.
-
-        Shutdown is best-effort: an error raised while closing the client is
-        logged at debug level and otherwise ignored, so close() itself never
-        raises. Afterwards the client reference is dropped, the sidecar is
-        marked unavailable and any pending reconnect is cancelled.
-        """
-        if self._client is not None:
-            try:
-                await self._client.__aexit__(None, None, None)
-            except Exception as exc:
-                # Deliberately not re-raised (teardown must not fail), but
-                # leave a trace rather than swallowing the error silently.
-                logger.debug("mnemo: error while closing client (ignored): %s", exc)
-            self._client = None
-        self._available = False
-        self._retry_at = None
-
-    # ── Core API ──────────────────────────────────────────────────────────────
-
-    async def remember(
-        self,
-        text: str,
-        *,
-        source: str = "cf-core",
-        session_id: str | None = None,
-    ) -> bool:
-        """Ingest one text fragment into the mnemo knowledge graph.
-
-        The text is forwarded to the sidecar in a single ingest call, so
-        callers with large inputs should split them up beforehand.
-
-        Args:
-            text: content to store (conversation turn, fact, note, ...)
-            source: origin label, e.g. "chat", "settings", "search"
-            session_id: optional session key used to group related turns
-
-        Returns:
-            True when the sidecar accepted the text; False when the sidecar
-            is unavailable or the call failed.
-        """
-        sidecar_ready = await self._maybe_reconnect()
-        if not sidecar_ready:
-            return False
-
-        try:
-            await self._client.ingest(content=text, source=source, session_id=session_id)
-        except Exception as exc:
-            self._on_call_error("remember", exc)
-            return False
-
-        self._on_call_success()
-        return True
-
-    async def recall(
-        self,
-        query: str,
-        *,
-        session_id: str | None = None,
-    ) -> str:
-        """Retrieve a formatted context block relevant to query.
-
-        Returns a prompt-ready string (or empty string if unavailable).
-        Inject the result directly into a system prompt::
-
-            context = await memory.recall("user dietary restrictions")
-            system = f"You are a helpful assistant.\\n\\n{context}"
-
-        Args:
-            query: natural language question or topic to retrieve context for
-            session_id: restrict retrieval to a specific session (optional)
-
-        Returns:
-            Formatted context string, or "" if the sidecar is unavailable or
-            the call failed.
-        """
-        if not await self._maybe_reconnect():
-            return ""
-        try:
-            result = await self._client.get_context(text=query, session_id=session_id)
-            # Go through the shared success hook like every other public
-            # method, so the pending retry timestamp is cleared together with
-            # the failure counter instead of being left stale.
-            self._on_call_success()
-            return result
-        except Exception as exc:
-            self._on_call_error("recall", exc)
-            return ""
-
-    async def entities(self, *, limit: int = 50) -> list[MemoryEntity]:
-        """List named entities held in the knowledge graph.
-
-        Args:
-            limit: upper bound on the number of entities requested from the
-                sidecar (default 50)
-
-        Returns:
-            MemoryEntity objects converted from the sidecar's response, or []
-            when the sidecar is unavailable or the call/conversion failed.
-        """
-        reachable = await self._maybe_reconnect()
-        if not reachable:
-            return []
-
-        try:
-            records = await self._client.list_entities(limit=limit)
-            self._on_call_success()
-            # Conversion stays inside the try block: a malformed record is
-            # reported through _on_call_error just like a transport failure.
-            converted = list(map(MemoryEntity.from_mnemo, records))
-        except Exception as exc:
-            self._on_call_error("entities", exc)
-            return []
-        return converted
-
-    async def stats(self) -> MemoryStats | None:
-        """Fetch knowledge graph statistics from the sidecar.
-
-        Returns:
-            A MemoryStats snapshot (with available=True), or None when the
-            sidecar is unavailable or the call failed.
-        """
-        reachable = await self._maybe_reconnect()
-        if not reachable:
-            return None
-
-        try:
-            remote = await self._client.stats()
-            self._on_call_success()
-            snapshot = MemoryStats(
-                entity_count=remote.entity_count,
-                chunk_count=remote.chunk_count,
-                node_count=remote.node_count,
-                edge_count=remote.edge_count,
-                uptime_seconds=remote.uptime_seconds,
-                available=True,
-            )
-        except Exception as exc:
-            self._on_call_error("stats", exc)
-            return None
-        return snapshot
-
-    async def wipe(self) -> bool:
-        """Erase everything stored in the sidecar. This cannot be undone.
-
-        Returns:
-            True once the sidecar confirmed the wipe; False when the sidecar
-            is unavailable or the call failed.
-        """
-        reachable = await self._maybe_reconnect()
-        if not reachable:
-            return False
-
-        try:
-            await self._client.wipe()
-            self._on_call_success()
-            logger.warning("mnemo memory wiped — all entities and chunks deleted")
-        except Exception as exc:
-            self._on_call_error("wipe", exc)
-            return False
-        return True
-
-    # ── Internal ──────────────────────────────────────────────────────────────
-
-    async def _maybe_reconnect(self) -> bool:
-        """Return True if the client is available (or just became available).
-
-        Called at the top of every public method. If the client is unavailable
-        but the retry cooldown has elapsed, attempts a reconnect before
-        answering. No-ops immediately if still within the cooldown window or
-        if no retry is pending.
-
-        A failed reconnect counts as one more consecutive failure and
-        schedules the next attempt using the same 5 * 2^(failure-1) backoff
-        (capped at _MAX_BACKOFF) used for failed calls. Without this, a single
-        failed reconnect would leave no retry pending and the client would
-        stay disabled for the rest of the process lifetime.
-
-        Raises:
-            MemoryUnavailableError: propagated from connect() when
-                strict=True and the reconnect fails; the next retry is still
-                scheduled before the error escapes.
-        """
-        if self._available:
-            return True
-        if self._retry_at is not None and time.monotonic() >= self._retry_at:
-            logger.info(
-                "mnemo: cooldown elapsed after %d failure(s) — attempting reconnect",
-                self._failure_count,
-            )
-            # close() releases the stale client instead of merely dropping the
-            # reference, and clears _retry_at / _available as a side effect.
-            await self.close()
-            try:
-                await self.connect()
-            finally:
-                if not self._available:
-                    self._failure_count += 1
-                    # Clamp the exponent: the counter keeps growing while the
-                    # sidecar stays down, and an unbounded 2**n eventually
-                    # cannot be converted to float.
-                    exponent = min(self._failure_count - 1, 10)
-                    backoff = min(5.0 * (2 ** exponent), _MAX_BACKOFF)
-                    self._retry_at = time.monotonic() + backoff
-        return self._available
-
-    def _on_call_success(self) -> None:
-        """Reset failure state after a successful call."""
-        self._failure_count = 0
-        self._retry_at = None
-
-    def _handle_unavailable(self, operation: str, reason: str = "") -> None:
-        """Called when the sidecar is unreachable at connect() time."""
-        self._available = False
-        msg = f"mnemo memory sidecar unavailable (operation={operation!r})"
-        if reason:
-            msg += f": {reason}"
-        if self._strict:
-            raise MemoryUnavailableError(msg)
-        logger.warning("%s — memory features disabled", msg)
-
-    def _on_call_error(self, operation: str, exc: Exception) -> None:
-        """Count consecutive failures and schedule exponential backoff retry.
-
-        Backoff: 5 * 2^(failure-1) seconds, capped at 60s.
-            failure 1 →  5s
-            failure 2 → 10s
-            failure 3 → 20s  ← _MAX_FAILURES default; client disabled here
-            failure 4 → 40s
-            failure 5+ → 60s
-
-        After _MAX_FAILURES, _available is set to False and all calls no-op
-        until _maybe_reconnect() fires after the cooldown elapses.
-        """
-        self._failure_count += 1
-        backoff = min(5.0 * (2 ** (self._failure_count - 1)), _MAX_BACKOFF)
-        self._retry_at = time.monotonic() + backoff
-
-        if self._failure_count >= _MAX_FAILURES:
-            self._available = False
-            logger.warning(
-                "mnemo %r failed %d consecutive times (%s) — disabled, reconnect in %.0fs",
-                operation, self._failure_count, exc, backoff,
-            )
-            if self._strict:
-                raise MemoryUnavailableError(
-                    f"mnemo {operation!r} failed {self._failure_count} consecutive times: {exc}"
-                )
-        else:
-            logger.warning(
-                "mnemo %r failed (%d/%d): %s — retry in %.0fs",
-                operation, self._failure_count, _MAX_FAILURES, exc, backoff,
-            )
--- a/circuitforge_core/memory/models.py
+++ b/circuitforge_core/memory/models.py
@ -1,73 +0,0 @@
-"""Data models for the cf-core memory module.
-
-MIT licensed.
-"""
-from __future__ import annotations
-
-import os
-from dataclasses import dataclass, field
-from datetime import datetime
-
-
-@dataclass(frozen=True)
-class MemoryConfig:
-    """Immutable connection settings for a mnemo sidecar."""
-
-    host: str = "localhost"
-    port: int = 8080
-    timeout: float = 10.0
-
-    @classmethod
-    def from_env(cls) -> MemoryConfig:
-        """Build a config from the process environment.
-
-        Variables (each falls back to its default when unset):
-            MNEMO_HOST    — default: localhost
-            MNEMO_PORT    — default: 8080, parsed with int()
-            MNEMO_TIMEOUT — default: 10.0, parsed with float()
-
-        Raises:
-            ValueError: if MNEMO_PORT or MNEMO_TIMEOUT is set to a value
-                that int() / float() cannot parse.
-        """
-        env = os.environ
-        raw_host = env.get("MNEMO_HOST", "localhost")
-        raw_port = env.get("MNEMO_PORT", "8080")
-        raw_timeout = env.get("MNEMO_TIMEOUT", "10.0")
-        return cls(host=raw_host, port=int(raw_port), timeout=float(raw_timeout))
-
-    @property
-    def base_url(self) -> str:
-        """Plain-HTTP base URL of the sidecar, e.g. http://localhost:8080."""
-        return "http://{}:{}".format(self.host, self.port)
-
-
-@dataclass(frozen=True)
-class MemoryEntity:
-    """A named entity extracted and stored by the mnemo knowledge graph."""
-
-    entity_id: str
-    name: str
-    entity_type: str
-    aliases: list[str] = field(default_factory=list)
-    confidence: float = 1.0
-    source_count: int = 1
-
-    @classmethod
-    def from_mnemo(cls, obj) -> MemoryEntity:
-        """Convert a mnemo-sdk Entity object to MemoryEntity.
-
-        Reads ``id``, ``name``, ``entity_type``, ``aliases``, ``confidence``
-        and ``source_count`` from ``obj``. Missing (None) aliases become an
-        empty list; missing confidence / source_count fall back to the
-        dataclass defaults (1.0 and 1).
-
-        Only None triggers a fallback: a reported confidence of 0.0 or a
-        source_count of 0 is a real value and is preserved, rather than being
-        silently promoted to the default as a truthiness test would do.
-        """
-        raw_confidence = obj.confidence
-        raw_source_count = obj.source_count
-        return cls(
-            entity_id=str(obj.id),
-            name=obj.name,
-            entity_type=obj.entity_type,
-            aliases=list(obj.aliases or []),
-            confidence=1.0 if raw_confidence is None else float(raw_confidence),
-            source_count=1 if raw_source_count is None else int(raw_source_count),
-        )
-
-
-@dataclass(frozen=True)
-class MemoryStats:
-    """Immutable snapshot of the mnemo knowledge graph state.
-
-    MemoryClient.stats() builds one of these by copying the same-named
-    attributes off the sidecar's stats response.
-    """
-
-    # Counters and uptime, copied verbatim from the sidecar response.
-    entity_count: int
-    chunk_count: int
-    node_count: int
-    edge_count: int
-    uptime_seconds: float
-    # MemoryClient.stats() always passes True here; when the sidecar is
-    # unavailable it returns None instead of a MemoryStats.
-    available: bool
--- a/circuitforge_core/mqtt/init.py
+++ b/circuitforge_core/mqtt/init.py
@ -1,42 +0,0 @@
-"""circuitforge_core.mqtt — async MQTT client with topic routing and
-Meshtastic adapter support.
-
-MIT licensed.
-
-Quick start::
-
-    from circuitforge_core.mqtt import MQTTClient, MQTTConfig
-
-    cfg = MQTTConfig(host="localhost")
-    client = MQTTClient(cfg)
-
-    @client.on("sensors/#")
-    async def handle(msg):
-        print(msg.topic, msg.text())
-
-    await client.run()
-
-For Meshtastic::
-
-    from circuitforge_core.mqtt.meshtastic import make_backend
-
-    backend = make_backend({
-        "backend": "mqtt",
-        "broker_host": "mqtt.example.com",
-        "topic_prefix": "msh/#",
-    })
-    async for pkt in backend.packets():
-        print(pkt.summary())
-"""
-
-from circuitforge_core.mqtt.client import MQTTClient
-from circuitforge_core.mqtt.models import MQTTConfig, MQTTMessage
-from circuitforge_core.mqtt.router import TopicRouter, matches
-
-__all__ = [
-    "MQTTClient",
-    "MQTTConfig",
-    "MQTTMessage",
-    "TopicRouter",
-    "matches",
-]
--- a/circuitforge_core/mqtt/client.py
+++ b/circuitforge_core/mqtt/client.py
@ -1,152 +0,0 @@
-"""Async MQTT client wrapper around aiomqtt.
-
-MIT licensed.
-"""
-from __future__ import annotations
-
-import asyncio
-import logging
-from collections.abc import AsyncIterator
-from contextlib import asynccontextmanager
-from datetime import datetime, timezone
-from typing import Any
-
-from circuitforge_core.mqtt.models import MQTTConfig, MQTTMessage
-from circuitforge_core.mqtt.router import TopicRouter
-
-logger = logging.getLogger(__name__)
-
-
-class MQTTClient:
-    """Async MQTT client that subscribes to topics and dispatches messages.
-
-    Usage (with a router)::
-
-        cfg = MQTTConfig(host="localhost")
-        client = MQTTClient(cfg)
-
-        @client.on("msh/#")
-        async def handle_mesh(msg: MQTTMessage):
-            print(msg.topic, msg.text())
-
-        await client.run()
-
-    Usage (iterate raw messages) — note that the context manager is the
-    ``connect()`` method, not the client object itself::
-
-        client = MQTTClient(cfg)
-        async with client.connect() as messages:
-            async for msg in messages:
-                print(msg.topic)
-    """
-
-    def __init__(self, config: MQTTConfig, router: TopicRouter | None = None) -> None:
-        """
-        Args:
-            config: broker connection settings
-            router: topic router to dispatch through; a fresh TopicRouter is
-                created when omitted
-        """
-        self._config = config
-        self._router = router or TopicRouter()
-
-    def on(self, pattern: str):
-        """Shorthand decorator — forwards to the internal router."""
-        return self._router.on(pattern)
-
-    def _client_kwargs(self, aiomqtt: Any) -> dict[str, Any]:
-        """Translate the MQTTConfig into keyword arguments for aiomqtt.Client.
-
-        The already-imported ``aiomqtt`` module is passed in because the
-        dependency is optional and only imported lazily by the callers.
-        Optional settings (client id, username, password) are only included
-        when configured.
-        """
-        cfg = self._config
-        kwargs: dict[str, Any] = {
-            "hostname": cfg.host,
-            "port": cfg.port,
-            "keepalive": cfg.keepalive,
-            "tls_params": aiomqtt.TLSParameters() if cfg.tls else None,
-        }
-        if cfg.client_id:
-            kwargs["identifier"] = cfg.client_id
-        if cfg.username is not None:
-            kwargs["username"] = cfg.username
-        if cfg.password is not None:
-            kwargs["password"] = cfg.password
-        return kwargs
-
-    @staticmethod
-    def _to_message(raw: Any) -> MQTTMessage:
-        """Wrap a raw aiomqtt message in an MQTTMessage stamped with now (UTC)."""
-        payload = raw.payload
-        if isinstance(payload, (bytes, bytearray)):
-            # bytes() keeps bytes as-is and copies a bytearray; str() on a
-            # bytearray would encode its repr ("bytearray(b'...')") instead.
-            payload = bytes(payload)
-        else:
-            payload = str(payload).encode()
-        return MQTTMessage(
-            topic=str(raw.topic),
-            payload=payload,
-            qos=raw.qos,
-            retain=raw.retain,
-            received_at=datetime.now(tz=timezone.utc),
-        )
-
-    async def run(self) -> None:
-        """Subscribe to all registered patterns and dispatch until cancelled.
-
-        Reconnects automatically: any exception other than cancellation
-        (including one raised by a handler during dispatch) is logged, then
-        the loop sleeps for ``reconnect_interval`` seconds and reconnects.
-
-        Raises:
-            ImportError: if the optional aiomqtt dependency is missing.
-            asyncio.CancelledError: re-raised when the task is cancelled.
-        """
-        try:
-            import aiomqtt
-        except ImportError as exc:
-            raise ImportError(
-                "aiomqtt is required for MQTTClient. "
-                "Install with: pip install circuitforge-core[mqtt]"
-            ) from exc
-
-        cfg = self._config
-        while True:
-            try:
-                async with aiomqtt.Client(**self._client_kwargs(aiomqtt)) as ac:
-                    patterns = self._router.patterns
-                    if not patterns:
-                        logger.warning("MQTTClient started with no subscriptions")
-                    for p in patterns:
-                        await ac.subscribe(p)
-                        logger.debug("Subscribed to %r on %s:%d", p, cfg.host, cfg.port)
-                    logger.info("MQTT connected to %s:%d", cfg.host, cfg.port)
-
-                    async for raw in ac.messages:
-                        await self._router.dispatch(self._to_message(raw))
-
-            except asyncio.CancelledError:
-                logger.info("MQTTClient cancelled")
-                raise
-            except Exception as exc:
-                logger.warning(
-                    "MQTT connection to %s:%d failed (%s), retrying in %.0fs",
-                    cfg.host, cfg.port, exc, cfg.reconnect_interval,
-                )
-                await asyncio.sleep(cfg.reconnect_interval)
-
-    @asynccontextmanager
-    async def connect(self) -> AsyncIterator[AsyncIterator[MQTTMessage]]:
-        """Context manager that yields an async iterator of raw messages.
-
-        Connects once (no automatic reconnect), subscribes to every pattern
-        registered on the router, and yields messages without dispatching
-        them. Useful when the caller wants to do its own routing::
-
-            async with client.connect() as messages:
-                async for msg in messages:
-                    ...
-
-        Raises:
-            ImportError: if the optional aiomqtt dependency is missing.
-        """
-        try:
-            import aiomqtt
-        except ImportError as exc:
-            raise ImportError(
-                "aiomqtt is required. Install with: pip install circuitforge-core[mqtt]"
-            ) from exc
-
-        async with aiomqtt.Client(**self._client_kwargs(aiomqtt)) as ac:
-            for p in self._router.patterns:
-                await ac.subscribe(p)
-
-            async def _iter() -> AsyncIterator[MQTTMessage]:
-                async for raw in ac.messages:
-                    yield self._to_message(raw)
-
-            yield _iter()
--- a/circuitforge_core/mqtt/meshtastic/init.py
+++ b/circuitforge_core/mqtt/meshtastic/init.py
@ -1,76 +0,0 @@
-"""Meshtastic adapter for circuitforge-core.
-
-Two backends are available:
-
- ``MQTTMeshtasticBackend``  — subscribes to a Meshtastic MQTT bridge
- ``SerialMeshtasticBackend`` — direct serial/TCP connection via the
-  ``meshtastic`` Python library
-
-Use ``make_backend()`` for config-driven selection.
-
-MIT licensed.
-"""
-from __future__ import annotations
-
-from circuitforge_core.mqtt.meshtastic.interface import MeshtasticInterface
-from circuitforge_core.mqtt.meshtastic.models import (
-    MeshtasticPacket,
-    MeshtasticPosition,
-    MeshtasticTelemetry,
-)
-from circuitforge_core.mqtt.meshtastic.mqtt_backend import MQTTMeshtasticBackend
-from circuitforge_core.mqtt.meshtastic.serial_backend import SerialMeshtasticBackend
-from circuitforge_core.mqtt.models import MQTTConfig
-
-
-def make_backend(config: dict) -> MeshtasticInterface:
-    """Build the Meshtastic backend selected by a config dict.
-
-    Config keys:
-        backend (str): ``"mqtt"`` or ``"serial"``, case-insensitive
-            (``"mqtt"`` when the key is absent)
-
-        ``"mqtt"`` backend:
-            broker_host (str): MQTT broker hostname (required)
-            broker_port (int): MQTT broker port (default 1883)
-            broker_username (str|None): optional
-            broker_password (str|None): optional
-            topic_prefix (str): topic to subscribe to (default ``msh/#``)
-
-        ``"serial"`` backend:
-            dev_path (str|None): serial device, e.g. ``/dev/ttyUSB0``
-            tcp_host (str|None): TCP hostname for TCP mode
-            tcp_port (int): TCP port (default 4403)
-
-    Raises:
-        ValueError: if ``backend`` names anything other than the two above.
-        KeyError: if the mqtt backend is selected without ``broker_host``.
-    """
-    kind = config.get("backend", "mqtt").lower()
-
-    if kind not in ("mqtt", "serial"):
-        raise ValueError(f"Unknown Meshtastic backend: {kind!r}. Must be 'mqtt' or 'serial'.")
-
-    if kind == "serial":
-        port = int(config.get("tcp_port", 4403))
-        return SerialMeshtasticBackend(
-            dev_path=config.get("dev_path"),
-            tcp_host=config.get("tcp_host"),
-            tcp_port=port,
-        )
-
-    # Only "mqtt" is left at this point.
-    broker = MQTTConfig(
-        host=config["broker_host"],
-        port=int(config.get("broker_port", 1883)),
-        username=config.get("broker_username"),
-        password=config.get("broker_password"),
-    )
-    topic = config.get("topic_prefix", "msh/#")
-    return MQTTMeshtasticBackend(mqtt_config=broker, topic_prefix=topic)
-
-
-__all__ = [
-    "MeshtasticInterface",
-    "MeshtasticPacket",
-    "MeshtasticPosition",
-    "MeshtasticTelemetry",
-    "MQTTMeshtasticBackend",
-    "SerialMeshtasticBackend",
-    "make_backend",
-]
--- a/circuitforge_core/mqtt/meshtastic/interface.py
+++ b/circuitforge_core/mqtt/meshtastic/interface.py
@ -1,36 +0,0 @@
-"""Abstract interface for Meshtastic backends.
-
-MIT licensed.
-"""
-from __future__ import annotations
-
-from abc import ABC, abstractmethod
-from collections.abc import AsyncIterator
-
-
-class MeshtasticInterface(ABC):
-    """Async interface for receiving and sending Meshtastic packets.
-
-    Two concrete backends exist:
-
-    - MQTTMeshtasticBackend  — subscribes to a Meshtastic MQTT bridge
-    - SerialMeshtasticBackend — connects directly via the meshtastic Python library
-
-    Both methods are abstract; instantiate one of the backends (or use
-    ``make_backend()``) rather than this class.
-    """
-
-    @abstractmethod
-    def packets(self) -> AsyncIterator:
-        """Async generator of MeshtasticPacket objects.
-
-        Yields packets as they arrive. Runs until cancelled.
-        Concrete types are ``MeshtasticPacket`` from
-        ``circuitforge_core.mqtt.meshtastic.models``.
-
-        Declared as a plain ``def`` returning an AsyncIterator so that
-        calling it yields something usable directly in ``async for``.
-        """
-
-    @abstractmethod
-    async def send_text(
-        self,
-        text: str,
-        dest_id: int = 0xFFFFFFFF,
-        channel: int = 0,
-    ) -> None:
-        """Send a text message to dest_id (default: broadcast).
-
-        Args:
-            text: message body
-            dest_id: numeric destination node ID; 0xFFFFFFFF is the
-                broadcast address
-            channel: channel index (default 0)
-        """
--- a/circuitforge_core/mqtt/meshtastic/models.py
+++ b/circuitforge_core/mqtt/meshtastic/models.py
@ -1,83 +0,0 @@
-"""Data models for Meshtastic packets.
-
-MIT licensed.
-"""
-from __future__ import annotations
-
-from dataclasses import dataclass, field
-from datetime import datetime, timezone
-from typing import Literal
-
-# Meshtastic portnum → our label
-PacketType = Literal[
-    "text",
-    "position",
-    "nodeinfo",
-    "telemetry",
-    "routing",
-    "admin",
-    "unknown",
-]
-
-
-@dataclass(frozen=True)
-class MeshtasticPosition:
-    latitude: float | None = None
-    longitude: float | None = None
-    altitude_m: int | None = None
-    timestamp: datetime | None = None
-
-
-@dataclass(frozen=True)
-class MeshtasticTelemetry:
-    battery_level: int | None = None     # 0-100 %
-    voltage: float | None = None         # volts
-    channel_util: float | None = None    # 0-100 %
-    air_util_tx: float | None = None     # 0-100 %
-
-
-@dataclass(frozen=True)
-class MeshtasticPacket:
-    """Normalized Meshtastic packet from any backend."""
-
-    packet_type: PacketType
-    from_id: str                          # hex node ID, e.g. "!deadbeef"
-    from_num: int                         # numeric node ID
-    to_num: int                           # 0xffffffff = broadcast
-    channel: int
-    received_at: datetime = field(default_factory=lambda: datetime.now(tz=timezone.utc))
-
-    # Type-specific payloads (only one is populated per packet type)
-    text: str | None = None
-    position: MeshtasticPosition | None = None
-    telemetry: MeshtasticTelemetry | None = None
-    node_longname: str | None = None
-    node_shortname: str | None = None
-    hardware: int | None = None
-
-    # Original raw payload dict for downstream consumers that need all fields
-    raw: dict = field(default_factory=dict, compare=False, hash=False)
-
-    @property
-    def is_broadcast(self) -> bool:
-        """True when the packet is addressed to the broadcast ID 0xFFFFFFFF."""
-        return self.to_num == 0xFFFFFFFF
-
-    def summary(self) -> str:
-        """One-line human-readable description.
-
-        The source is ``from_id`` when set, otherwise ``from_num`` rendered
-        as ``!xxxxxxxx``. Packets that carry no usable type-specific payload
-        (including a position whose latitude or longitude is None) fall back
-        to the generic ``"[src] <packet_type> packet"`` form.
-        """
-        src = self.from_id or f"!{self.from_num:08x}"
-        if self.packet_type == "text":
-            return f"[{src}] {self.text}"
-        if self.packet_type == "position" and self.position:
-            p = self.position
-            # Both coordinates are optional; formatting None with ":.5f"
-            # raises TypeError, so only render them when both are present.
-            if p.latitude is not None and p.longitude is not None:
-                return f"[{src}] position {p.latitude:.5f},{p.longitude:.5f}"
-        if self.packet_type == "nodeinfo":
-            return f"[{src}] node info: {self.node_longname!r} ({self.node_shortname})"
-        if self.packet_type == "telemetry" and self.telemetry:
-            t = self.telemetry
-            parts = []
-            if t.battery_level is not None:
-                parts.append(f"batt={t.battery_level}%")
-            if t.voltage is not None:
-                parts.append(f"v={t.voltage:.2f}V")
-            return f"[{src}] telemetry {' '.join(parts)}"
-        return f"[{src}] {self.packet_type} packet"
--- a/circuitforge_core/mqtt/meshtastic/mqtt_backend.py
+++ b/circuitforge_core/mqtt/meshtastic/mqtt_backend.py
@ -1,214 +0,0 @@
-"""Meshtastic MQTT bridge backend.
-
-Subscribes to the JSON MQTT topics that Meshtastic firmware publishes when
-the MQTT uplink is enabled on a node.
-
-Topic schema (Meshtastic firmware >=2.1):
-    msh/{region}/{gateway}/2/json/{portnum}/{fromId}
-
-The payload is a JSON object. Examples by type:
-
-Text message:
-    {"channel":0,"from":123456789,"id":987,"payload":{"text":"hello"},
-     "sender":"!07558d85","timestamp":1716200000,"to":4294967295,"type":"sendtext"}
-
-Position:
-    {"channel":0,"from":123456789,"payload":{"altitude":50,
-     "latitude_i":374208130,"longitude_i":-1220848320,"time":1716200000},
-     "type":"position"}
-
-Node info:
-    {"channel":0,"from":123456789,"payload":{"hardware":43,
-     "id":"!07558d85","longname":"Alan Node","shortname":"AN"},
-     "type":"nodeinfo"}
-
-Telemetry:
-    {"channel":0,"from":123456789,"payload":{"battery_level":82,
-     "voltage":4.09,"channel_utilization":0.5,"air_util_tx":0.01,
-     "time":1716200000},"type":"telemetry"}
-
-MIT licensed.
-"""
-from __future__ import annotations
-
-import asyncio
-import json
-import logging
-from collections.abc import AsyncIterator
-from datetime import datetime, timezone
-
-from circuitforge_core.mqtt.client import MQTTClient
-from circuitforge_core.mqtt.meshtastic.interface import MeshtasticInterface
-from circuitforge_core.mqtt.meshtastic.models import (
-    MeshtasticPacket,
-    MeshtasticPosition,
-    MeshtasticTelemetry,
-)
-from circuitforge_core.mqtt.models import MQTTConfig, MQTTMessage
-
-logger = logging.getLogger(__name__)
-
-# latitude_i / longitude_i are stored as integer × 1e7 in Meshtastic protobuf.
-_COORD_SCALE = 1e-7
-
-
-def _parse_packet(raw_json: str | bytes, topic: str) -> MeshtasticPacket | None:
-    """Parse a Meshtastic MQTT JSON payload into a MeshtasticPacket.
-
-    The broker is an untrusted input source, so this function never raises
-    on malformed data: an exception here would propagate through the router
-    into MQTTClient.run() and be treated as a connection failure.
-
-    Args:
-        raw_json: the MQTT message payload
-        topic: the topic it arrived on (used for debug logging only)
-
-    Returns:
-        A MeshtasticPacket, or None when the payload
-        - is not valid JSON (including bytes that cannot be decoded),
-        - is valid JSON but not an object,
-        - is an encrypted packet ("payload" is a base64 string, not a dict),
-        - has a non-integer "from" field.
-        Packet types other than text/position/nodeinfo/telemetry are
-        returned with packet_type="unknown".
-    """
-    try:
-        obj = json.loads(raw_json)
-    except ValueError:
-        # json.JSONDecodeError and UnicodeDecodeError (raised for bytes that
-        # are not valid UTF-8/16/32) are both ValueError subclasses.
-        logger.debug("Non-JSON Meshtastic payload on topic %r", topic)
-        return None
-
-    if not isinstance(obj, dict):
-        # Valid JSON, but a list/number/string has no packet fields to read.
-        logger.debug("Non-object Meshtastic payload on topic %r", topic)
-        return None
-
-    payload = obj.get("payload")
-    if not isinstance(payload, dict):
-        # Encrypted packet — payload is a base64 string; skip.
-        return None
-
-    from_num = obj.get("from", 0)
-    if not isinstance(from_num, int):
-        # The fallback sender ID below formats from_num as hex.
-        logger.debug("Meshtastic payload with non-integer 'from' on topic %r", topic)
-        return None
-
-    raw_ts = payload.get("time") or obj.get("timestamp")
-    received_at = None
-    if raw_ts:
-        try:
-            received_at = datetime.fromtimestamp(raw_ts, tz=timezone.utc)
-        except (TypeError, ValueError, OverflowError, OSError):
-            # Non-numeric or out-of-range timestamp: fall back to arrival time.
-            received_at = None
-    if received_at is None:
-        received_at = datetime.now(tz=timezone.utc)
-
-    raw_type = obj.get("type", "unknown")
-    ptype = raw_type.lower() if isinstance(raw_type, str) else "unknown"
-
-    # Fields shared by every packet type.
-    common = {
-        "from_id": obj.get("sender", f"!{from_num:08x}"),
-        "from_num": from_num,
-        "to_num": obj.get("to", 0xFFFFFFFF),
-        "channel": obj.get("channel", 0),
-        "received_at": received_at,
-        "raw": obj,
-    }
-
-    if ptype in ("sendtext", "text"):
-        return MeshtasticPacket(
-            packet_type="text",
-            text=payload.get("text", ""),
-            **common,
-        )
-
-    if ptype == "position":
-        lat_i = payload.get("latitude_i")
-        lon_i = payload.get("longitude_i")
-        return MeshtasticPacket(
-            packet_type="position",
-            position=MeshtasticPosition(
-                # Integer degrees × 1e7 on the wire; anything non-numeric is
-                # treated as "no coordinate" rather than multiplied.
-                latitude=lat_i * _COORD_SCALE if isinstance(lat_i, (int, float)) else None,
-                longitude=lon_i * _COORD_SCALE if isinstance(lon_i, (int, float)) else None,
-                altitude_m=payload.get("altitude"),
-                timestamp=received_at,
-            ),
-            **common,
-        )
-
-    if ptype == "nodeinfo":
-        return MeshtasticPacket(
-            packet_type="nodeinfo",
-            node_longname=payload.get("longname"),
-            node_shortname=payload.get("shortname"),
-            hardware=payload.get("hardware"),
-            **common,
-        )
-
-    if ptype == "telemetry":
-        return MeshtasticPacket(
-            packet_type="telemetry",
-            telemetry=MeshtasticTelemetry(
-                battery_level=payload.get("battery_level"),
-                voltage=payload.get("voltage"),
-                channel_util=payload.get("channel_utilization"),
-                air_util_tx=payload.get("air_util_tx"),
-            ),
-            **common,
-        )
-
-    # Routing, admin, and other packet types — return minimal packet.
-    return MeshtasticPacket(packet_type="unknown", **common)
-
-
-class MQTTMeshtasticBackend(MeshtasticInterface):
-    """Receive Meshtastic packets via a Meshtastic MQTT bridge.
-
-    Requires a Meshtastic node with the MQTT uplink enabled, publishing to
-    the configured broker. Set ``topic_prefix`` to match the region prefix
-    configured on the node (default ``msh/#`` matches all regions).
-
-    Args:
-        mqtt_config: broker connection settings
-        topic_prefix: MQTT topic pattern to subscribe to (default ``msh/#``)
-    """
-
-    def __init__(
-        self,
-        mqtt_config: MQTTConfig,
-        topic_prefix: str = "msh/#",
-    ) -> None:
-        self._mqtt_config = mqtt_config
-        self._topic_prefix = topic_prefix
-
-    async def packets(self) -> AsyncIterator[MeshtasticPacket]:
-        """Yield parsed packets from the broker until cancelled or closed.
-
-        A background task runs an MQTTClient whose handler parses each
-        message and queues the resulting packet; unparseable and encrypted
-        messages are dropped. The task is cancelled when the generator is
-        closed.
-
-        If the background task stops on its own — e.g. ImportError because
-        the optional aiomqtt dependency is missing — its exception is
-        re-raised here instead of leaving the consumer blocked forever on an
-        empty queue.
-        """
-        client = MQTTClient(self._mqtt_config)
-
-        queue: asyncio.Queue[MeshtasticPacket | object] = asyncio.Queue()
-        # Sentinel queued by the done-callback below; compared by identity.
-        runner_exited = object()
-
-        @client.on(self._topic_prefix)
-        async def _handle(msg: MQTTMessage) -> None:
-            pkt = _parse_packet(msg.payload, msg.topic)
-            if pkt is not None:
-                await queue.put(pkt)
-
-        runner = asyncio.create_task(client.run())
-        # The queue is unbounded, so put_nowait cannot raise QueueFull.
-        runner.add_done_callback(lambda _task: queue.put_nowait(runner_exited))
-        try:
-            while True:
-                item = await queue.get()
-                if item is runner_exited:
-                    # Re-raises whatever ended the task (or CancelledError).
-                    runner.result()
-                    return
-                yield item
-        finally:
-            if not runner.done():
-                runner.cancel()
-                try:
-                    await runner
-                except asyncio.CancelledError:
-                    pass
-
-    async def send_text(
-        self,
-        text: str,
-        dest_id: int = 0xFFFFFFFF,
-        channel: int = 0,
-    ) -> None:
-        """Publishing back to MQTT is not supported by this backend.
-
-        Meshtastic nodes consume from MQTT in a different topic namespace;
-        use the serial backend or a direct Meshtastic MQTT channel config
-        for two-way messaging.
-
-        Raises:
-            NotImplementedError: always.
-        """
-        raise NotImplementedError(
-            "MQTTMeshtasticBackend is receive-only. "
-            "Use SerialMeshtasticBackend for send support."
-        )
--- a/circuitforge_core/mqtt/meshtastic/serial_backend.py
+++ b/circuitforge_core/mqtt/meshtastic/serial_backend.py
@ -1,210 +0,0 @@
-"""Meshtastic serial/TCP backend using the meshtastic Python library.
-
-Connects directly to a Meshtastic node over serial port or TCP (e.g.
-when a node exposes Meshtastic's native TCP API on port 4403).
-
-The ``meshtastic`` library is synchronous and uses threading + PyPubSub
-for callbacks. This backend bridges into asyncio via an asyncio.Queue:
-the sync callback puts packets on the queue, and ``packets()`` awaits
-items from it.
-
-MIT licensed.
-"""
-from __future__ import annotations
-
-import asyncio
-import logging
-from collections.abc import AsyncIterator
-from datetime import datetime, timezone
-
-from circuitforge_core.mqtt.meshtastic.interface import MeshtasticInterface
-from circuitforge_core.mqtt.meshtastic.models import (
-    MeshtasticPacket,
-    MeshtasticPosition,
-    MeshtasticTelemetry,
-)
-
-logger = logging.getLogger(__name__)
-
-_COORD_SCALE = 1e-7
-
-
-def _packet_from_decoded(decoded: dict, from_id: int) -> MeshtasticPacket:
-    """Convert a meshtastic-library decoded packet dict to MeshtasticPacket."""
-    portnum: str = decoded.get("portnum", "UNKNOWN_APP")
-    sender = f"!{from_id:08x}"
-    to_num: int = decoded.get("to", 0xFFFFFFFF)
-    channel: int = decoded.get("channel", 0)
-    now = datetime.now(tz=timezone.utc)
-
-    if portnum == "TEXT_MESSAGE_APP":
-        return MeshtasticPacket(
-            packet_type="text",
-            from_id=sender,
-            from_num=from_id,
-            to_num=to_num,
-            channel=channel,
-            received_at=now,
-            text=decoded.get("decoded", {}).get("text", ""),
-            raw=decoded,
-        )
-
-    if portnum == "POSITION_APP":
-        pos = decoded.get("decoded", {}).get("position", {})
-        lat_i = pos.get("latitudeI")
-        lon_i = pos.get("longitudeI")
-        alt = pos.get("altitude")
-        return MeshtasticPacket(
-            packet_type="position",
-            from_id=sender,
-            from_num=from_id,
-            to_num=to_num,
-            channel=channel,
-            received_at=now,
-            position=MeshtasticPosition(
-                latitude=lat_i * _COORD_SCALE if lat_i is not None else None,
-                longitude=lon_i * _COORD_SCALE if lon_i is not None else None,
-                altitude_m=alt,
-                timestamp=now,
-            ),
-            raw=decoded,
-        )
-
-    if portnum == "NODEINFO_APP":
-        info = decoded.get("decoded", {}).get("user", {})
-        return MeshtasticPacket(
-            packet_type="nodeinfo",
-            from_id=sender,
-            from_num=from_id,
-            to_num=to_num,
-            channel=channel,
-            received_at=now,
-            node_longname=info.get("longName"),
-            node_shortname=info.get("shortName"),
-            hardware=info.get("hwModel"),
-            raw=decoded,
-        )
-
-    if portnum == "TELEMETRY_APP":
-        telem = decoded.get("decoded", {}).get("telemetry", {})
-        dev = telem.get("deviceMetrics", {})
-        return MeshtasticPacket(
-            packet_type="telemetry",
-            from_id=sender,
-            from_num=from_id,
-            to_num=to_num,
-            channel=channel,
-            received_at=now,
-            telemetry=MeshtasticTelemetry(
-                battery_level=dev.get("batteryLevel"),
-                voltage=dev.get("voltage"),
-                channel_util=dev.get("channelUtilization"),
-                air_util_tx=dev.get("airUtilTx"),
-            ),
-            raw=decoded,
-        )
-
-    return MeshtasticPacket(
-        packet_type="unknown",
-        from_id=sender,
-        from_num=from_id,
-        to_num=to_num,
-        channel=channel,
-        received_at=now,
-        raw=decoded,
-    )
-
-
-class SerialMeshtasticBackend(MeshtasticInterface):
-    """Receive and send Meshtastic packets via serial port or TCP.
-
-    Args:
-        dev_path: serial device path (e.g. ``/dev/ttyUSB0``) or ``None``
-            to auto-detect the first connected Meshtastic device.
-        tcp_host: hostname for TCP connection. If set, ``dev_path`` is ignored
-            and a TCP connection to port 4403 is used.
-        tcp_port: TCP port (default 4403).
-    """
-
-    def __init__(
-        self,
-        dev_path: str | None = None,
-        tcp_host: str | None = None,
-        tcp_port: int = 4403,
-    ) -> None:
-        self._dev_path = dev_path
-        self._tcp_host = tcp_host
-        self._tcp_port = tcp_port
-
-    def _make_interface(self):
-        try:
-            import meshtastic.serial_interface
-            import meshtastic.tcp_interface
-        except ImportError as exc:
-            raise ImportError(
-                "meshtastic is required for SerialMeshtasticBackend. "
-                "Install with: pip install circuitforge-core[meshtastic-serial]"
-            ) from exc
-
-        if self._tcp_host:
-            return meshtastic.tcp_interface.TCPInterface(
-                hostname=self._tcp_host,
-                portNumber=self._tcp_port,
-            )
-        return meshtastic.serial_interface.SerialInterface(devPath=self._dev_path)
-
-    async def packets(self) -> AsyncIterator[MeshtasticPacket]:
-        loop = asyncio.get_running_loop()
-        queue: asyncio.Queue[MeshtasticPacket | None] = asyncio.Queue()
-
-        def _on_receive(packet: dict, interface) -> None:
-            try:
-                from_id: int = packet.get("from", 0)
-                pkt = _packet_from_decoded(packet, from_id)
-                loop.call_soon_threadsafe(queue.put_nowait, pkt)
-            except Exception:
-                logger.exception("Error decoding Meshtastic serial packet")
-
-        def _on_connection_closed(interface) -> None:
-            logger.warning("Meshtastic serial connection closed")
-            loop.call_soon_threadsafe(queue.put_nowait, None)
-
-        iface = await loop.run_in_executor(None, self._make_interface)
-
-        try:
-            from pubsub import pub
-            pub.subscribe(_on_receive, "meshtastic.receive")
-            pub.subscribe(_on_connection_closed, "meshtastic.connection.lost")
-        except ImportError:
-            await loop.run_in_executor(None, iface.close)
-            raise ImportError(
-                "pypubsub is required for SerialMeshtasticBackend. "
-                "Install with: pip install circuitforge-core[meshtastic-serial]"
-            )
-
-        try:
-            while True:
-                pkt = await queue.get()
-                if pkt is None:
-                    break
-                yield pkt
-        finally:
-            pub.unsubscribe(_on_receive, "meshtastic.receive")
-            pub.unsubscribe(_on_connection_closed, "meshtastic.connection.lost")
-            await loop.run_in_executor(None, iface.close)
-
-    async def send_text(
-        self,
-        text: str,
-        dest_id: int = 0xFFFFFFFF,
-        channel: int = 0,
-    ) -> None:
-        loop = asyncio.get_running_loop()
-        iface = await loop.run_in_executor(None, self._make_interface)
-        try:
-            await loop.run_in_executor(
-                None,
-                lambda: iface.sendText(text, destinationId=dest_id, channelIndex=channel),
-            )
-        finally:
-            await loop.run_in_executor(None, iface.close)
--- a/circuitforge_core/mqtt/models.py
+++ b/circuitforge_core/mqtt/models.py
@ -1,44 +0,0 @@
-"""Data models for the MQTT client module.
-
-MIT licensed.
-"""
-from __future__ import annotations
-
-import json
-from dataclasses import dataclass, field
-from datetime import datetime, timezone
-
-
-@dataclass(frozen=True)
-class MQTTConfig:
-    """Connection config for an MQTT broker."""
-
-    host: str
-    port: int = 1883
-    username: str | None = None
-    password: str | None = None
-    client_id: str = ""
-    keepalive: int = 60
-    tls: bool = False
-    reconnect_interval: float = 5.0
-
-
-@dataclass(frozen=True)
-class MQTTMessage:
-    """A single received MQTT message."""
-
-    topic: str
-    payload: bytes
-    qos: int = 0
-    retain: bool = False
-    received_at: datetime = field(default_factory=lambda: datetime.now(tz=timezone.utc))
-
-    def text(self, encoding: str = "utf-8") -> str:
-        return self.payload.decode(encoding, errors="replace")
-
-    def json(self) -> dict:
-        return json.loads(self.payload)
-
-    @property
-    def topic_parts(self) -> list[str]:
-        return self.topic.split("/")
--- a/circuitforge_core/mqtt/router.py
+++ b/circuitforge_core/mqtt/router.py
@ -1,74 +0,0 @@
-"""MQTT topic router with wildcard pattern matching.
-
-MIT licensed.
-"""
-from __future__ import annotations
-
-import asyncio
-import inspect
-import logging
-from collections.abc import Callable, Coroutine
-from typing import Any
-
-from circuitforge_core.mqtt.models import MQTTMessage
-
-logger = logging.getLogger(__name__)
-
-Handler = Callable[[MQTTMessage], Coroutine[Any, Any, None]]
-
-
-def matches(pattern: str, topic: str) -> bool:
-    """Return True if topic matches the MQTT wildcard pattern.
-
-    MQTT wildcard rules:
-    - '+' matches exactly one topic level (segment between '/' separators)
-    - '#' matches zero or more levels and MUST appear at the end of the pattern
-    - All other characters match literally
-
-    Examples:
-        matches("sensor/+/temp", "sensor/room1/temp")       → True
-        matches("sensor/+/temp", "sensor/a/b/temp")         → False
-        matches("sensor/#", "sensor/room1/temp")            → True
-        matches("sensor/#", "sensor")                       → True  (# = zero levels)
-        matches("#", "any/topic/here")                      → True
-        matches("a/b/c", "a/b/c")                          → True
-    """
-    # TODO: implement wildcard matching
-    # Hint: split both pattern and topic on '/' and walk them in parallel.
-    # Handle '#' early (if it appears, everything past that point in topic matches).
-    # '+' must cover exactly one (non-empty) level.
-    raise NotImplementedError("matches() is not yet implemented")
-
-
-class TopicRouter:
-    """Register async handlers for MQTT topic patterns and dispatch messages."""
-
-    def __init__(self) -> None:
-        self._routes: list[tuple[str, Handler]] = []
-
-    @property
-    def patterns(self) -> list[str]:
-        return [p for p, _ in self._routes]
-
-    def register(self, pattern: str, handler: Handler) -> None:
-        """Add a handler for the given topic pattern."""
-        self._routes.append((pattern, handler))
-
-    def on(self, pattern: str) -> Callable[[Handler], Handler]:
-        """Decorator: @router.on("sensor/#") async def handle(msg): ..."""
-        def decorator(fn: Handler) -> Handler:
-            self.register(pattern, fn)
-            return fn
-        return decorator
-
-    async def dispatch(self, message: MQTTMessage) -> None:
-        """Call all handlers whose pattern matches message.topic."""
-        for pattern, handler in self._routes:
-            try:
-                if matches(pattern, message.topic):
-                    if inspect.iscoroutinefunction(handler):
-                        await handler(message)
-                    else:
-                        handler(message)
-            except Exception:
-                logger.exception("Handler for %r raised on topic %r", pattern, message.topic)
--- a/circuitforge_core/musicgen/init.py
+++ b/circuitforge_core/musicgen/init.py
@ -1 +0,0 @@
-"""circuitforge_core.musicgen — music continuation service (BSL 1.1)."""
--- a/circuitforge_core/musicgen/app.py
+++ b/circuitforge_core/musicgen/app.py
@ -1,138 +0,0 @@
-"""
-cf-musicgen FastAPI service — managed by cf-orch.
-
-Endpoints:
-  GET  /health     -> {"status": "ok", "model": str, "vram_mb": int}
-  POST /continue   -> audio bytes (Content-Type: audio/wav or audio/mpeg)
-
-Usage:
-    python -m circuitforge_core.musicgen.app \
-        --model facebook/musicgen-melody \
-        --port 8006 \
-        --gpu-id 0
-
-The service streams back raw audio bytes. Headers include:
-  X-Duration-S      generated duration in seconds
-  X-Prompt-Duration-S   how many seconds of the input were used as prompt
-  X-Model           model name
-  X-Sample-Rate     output sample rate (32000 for all MusicGen variants)
-
-Model weights are cached at /Library/Assets/LLM/musicgen/.
-"""
-from __future__ import annotations
-
-import argparse
-import logging
-import os
-from typing import Annotated
-
-from fastapi import FastAPI, File, Form, HTTPException, UploadFile
-from fastapi.responses import Response
-
-from circuitforge_core.musicgen.backends.base import (
-    MODEL_MELODY,
-    MODEL_SMALL,
-    AudioFormat,
-    MusicGenBackend,
-    make_musicgen_backend,
-)
-
-_CONTENT_TYPES: dict[str, str] = {
-    "wav": "audio/wav",
-    "mp3": "audio/mpeg",
-}
-
-app = FastAPI(title="cf-musicgen", version="0.1.0")
-_backend: MusicGenBackend | None = None
-
-
-@app.get("/health")
-def health() -> dict:
-    if _backend is None:
-        raise HTTPException(503, detail="backend not initialised")
-    return {
-        "status": "ok",
-        "model": _backend.model_name,
-        "vram_mb": _backend.vram_mb,
-    }
-
-
-@app.post("/continue")
-async def continue_audio(
-    audio: UploadFile = File(..., description="Audio file (WAV, MP3, FLAC, OGG, ...)"),
-    description: Annotated[str | None, Form()] = None,
-    duration_s: Annotated[float, Form()] = 15.0,
-    prompt_duration_s: Annotated[float, Form()] = 10.0,
-    format: Annotated[AudioFormat, Form()] = "wav",
-) -> Response:
-    if _backend is None:
-        raise HTTPException(503, detail="backend not initialised")
-    if duration_s <= 0 or duration_s > 60:
-        raise HTTPException(422, detail="duration_s must be between 0 and 60")
-    if prompt_duration_s <= 0 or prompt_duration_s > 30:
-        raise HTTPException(422, detail="prompt_duration_s must be between 0 and 30")
-
-    audio_bytes = await audio.read()
-    if not audio_bytes:
-        raise HTTPException(400, detail="Empty audio file")
-
-    try:
-        result = _backend.continue_audio(
-            audio_bytes,
-            description=description or None,
-            duration_s=duration_s,
-            prompt_duration_s=prompt_duration_s,
-            format=format,
-        )
-    except Exception as exc:
-        logging.exception("Music continuation failed")
-        raise HTTPException(500, detail=str(exc)) from exc
-
-    return Response(
-        content=result.audio_bytes,
-        media_type=_CONTENT_TYPES.get(result.format, "audio/wav"),
-        headers={
-            "X-Duration-S": str(round(result.duration_s, 3)),
-            "X-Prompt-Duration-S": str(round(result.prompt_duration_s, 3)),
-            "X-Model": result.model,
-            "X-Sample-Rate": str(result.sample_rate),
-        },
-    )
-
-
-def _parse_args() -> argparse.Namespace:
-    p = argparse.ArgumentParser(description="cf-musicgen service")
-    p.add_argument(
-        "--model",
-        default=MODEL_MELODY,
-        choices=[MODEL_MELODY, MODEL_SMALL, "facebook/musicgen-medium", "facebook/musicgen-large"],
-        help="MusicGen model variant",
-    )
-    p.add_argument("--port", type=int, default=8006)
-    p.add_argument("--host", default="0.0.0.0")
-    p.add_argument("--gpu-id", type=int, default=0,
-                   help="CUDA device index (sets CUDA_VISIBLE_DEVICES)")
-    p.add_argument("--device", default="cuda", choices=["cuda", "cpu"])
-    p.add_argument("--mock", action="store_true",
-                   help="Run with mock backend (no GPU, for testing)")
-    return p.parse_args()
-
-
-if __name__ == "__main__":
-    import uvicorn
-
-    logging.basicConfig(
-        level=logging.INFO,
-        format="%(asctime)s %(levelname)s %(name)s  %(message)s",
-    )
-    args = _parse_args()
-
-    if args.device == "cuda" and not args.mock:
-        os.environ.setdefault("CUDA_VISIBLE_DEVICES", str(args.gpu_id))
-
-    mock = args.mock or args.model == "mock"
-    device = "cpu" if mock else args.device
-
-    _backend = make_musicgen_backend(model_name=args.model, mock=mock, device=device)
-
-    uvicorn.run(app, host=args.host, port=args.port, log_level="info")
--- a/circuitforge_core/musicgen/backends/init.py
+++ b/circuitforge_core/musicgen/backends/init.py
@ -1 +0,0 @@
-"""MusicGen backend implementations."""
--- a/circuitforge_core/musicgen/backends/audiocraft.py
+++ b/circuitforge_core/musicgen/backends/audiocraft.py
@ -1,128 +0,0 @@
-"""
-AudioCraft MusicGen backend — music continuation via Meta's MusicGen.
-
-Models are downloaded to /Library/Assets/LLM/musicgen/ (HF hub cache).
-The melody model (~8 GB VRAM) is the default; small (~1.5 GB) is available
-for lower-VRAM nodes.
-
-Continuation workflow:
-  1. Decode input audio with torchaudio (any format ffmpeg understands)
-  2. Trim to the last `prompt_duration_s` seconds — this anchors the generation
-  3. Call model.generate_continuation(prompt_waveform, prompt_sample_rate, ...)
-  4. Output tensor is the NEW audio only (not prompt + continuation)
-  5. Encode to the requested format and return
-"""
-from __future__ import annotations
-
-import logging
-import os
-
-from circuitforge_core.musicgen.backends.base import (
-    AudioFormat,
-    MusicContinueResult,
-    decode_audio,
-    encode_audio,
-)
-
-# All MusicGen/AudioCraft weights land here — consistent with other CF model dirs.
-_MUSICGEN_CACHE = "/Library/Assets/LLM/musicgen"
-
-# VRAM estimates (MB) per model variant
-_VRAM_MB: dict[str, int] = {
-    "facebook/musicgen-small": 1500,
-    "facebook/musicgen-medium": 4500,
-    "facebook/musicgen-melody": 8000,
-    "facebook/musicgen-large": 8500,
-}
-
-logger = logging.getLogger(__name__)
-
-
-class AudioCraftBackend:
-    """MusicGen backend using Meta's AudioCraft library."""
-
-    def __init__(self, model_name: str = "facebook/musicgen-melody", device: str = "cuda") -> None:
-        # Redirect HF hub cache before the first import so weights go to /Library/Assets
-        os.environ.setdefault("HF_HOME", _MUSICGEN_CACHE)
-        os.makedirs(_MUSICGEN_CACHE, exist_ok=True)
-
-        from audiocraft.models import MusicGen  # noqa: PLC0415
-
-        logger.info("Loading MusicGen model: %s on %s", model_name, device)
-        self._model = MusicGen.get_pretrained(model_name, device=device)
-        self._model_name = model_name
-        self._device = device
-        logger.info("MusicGen ready: %s", model_name)
-
-    @property
-    def model_name(self) -> str:
-        return self._model_name
-
-    @property
-    def vram_mb(self) -> int:
-        return _VRAM_MB.get(self._model_name, 8000)
-
-    def continue_audio(
-        self,
-        audio_bytes: bytes,
-        *,
-        description: str | None = None,
-        duration_s: float = 15.0,
-        prompt_duration_s: float = 10.0,
-        format: AudioFormat = "wav",
-    ) -> MusicContinueResult:
-        import torch
-
-        # Decode input audio -> [C, T] tensor
-        wav, sr = decode_audio(audio_bytes)
-
-        # Trim to the last `prompt_duration_s` seconds to form the conditioning prompt.
-        # Using the end of the track (not the beginning) gives the model the musical
-        # context closest to where we want to continue.
-        max_prompt_samples = int(prompt_duration_s * sr)
-        if wav.shape[-1] > max_prompt_samples:
-            wav = wav[..., -max_prompt_samples:]
-
-        # MusicGen expects [batch, channels, time]
-        prompt_tensor = wav.unsqueeze(0).to(self._device)
-
-        # Build descriptions list — one entry per batch item (batch=1 here)
-        descriptions = [description] if description else [None]
-
-        self._model.set_generation_params(
-            duration=duration_s,
-            top_k=250,
-            temperature=1.0,
-            cfg_coef=3.0,
-        )
-
-        logger.info(
-            "Generating %.1fs continuation (prompt=%.1fs) model=%s",
-            duration_s,
-            prompt_duration_s,
-            self._model_name,
-        )
-
-        with torch.no_grad():
-            output = self._model.generate_continuation(
-                prompt=prompt_tensor,
-                prompt_sample_rate=sr,
-                descriptions=descriptions,
-                progress=True,
-            )
-
-        # output: [batch, channels, time] at model sample rate (32 kHz)
-        output_wav = output[0]  # [C, T]
-        model_sr = self._model.sample_rate
-
-        actual_duration_s = output_wav.shape[-1] / model_sr
-        audio_bytes_out = encode_audio(output_wav, model_sr, format)
-
-        return MusicContinueResult(
-            audio_bytes=audio_bytes_out,
-            sample_rate=model_sr,
-            duration_s=actual_duration_s,
-            format=format,
-            model=self._model_name,
-            prompt_duration_s=prompt_duration_s,
-        )
--- a/circuitforge_core/musicgen/backends/base.py
+++ b/circuitforge_core/musicgen/backends/base.py
@ -1,97 +0,0 @@
-"""
-MusicGenBackend Protocol — backend-agnostic music continuation interface.
-
-All backends accept an audio prompt (raw bytes, any ffmpeg-readable format) and
-return MusicContinueResult with the generated continuation as audio bytes.
-
-The continuation is the *new* audio only (not prompt + continuation). Callers
-that want a seamless joined file can concatenate the original + result themselves.
-"""
-from __future__ import annotations
-
-import io
-from dataclasses import dataclass
-from typing import Literal, Protocol, runtime_checkable
-
-AudioFormat = Literal["wav", "mp3"]
-
-MODEL_SMALL = "facebook/musicgen-small"
-MODEL_MELODY = "facebook/musicgen-melody"
-
-
-@dataclass(frozen=True)
-class MusicContinueResult:
-    audio_bytes: bytes
-    sample_rate: int
-    duration_s: float
-    format: AudioFormat
-    model: str
-    prompt_duration_s: float
-
-
-@runtime_checkable
-class MusicGenBackend(Protocol):
-    def continue_audio(
-        self,
-        audio_bytes: bytes,
-        *,
-        description: str | None = None,
-        duration_s: float = 15.0,
-        prompt_duration_s: float = 10.0,
-        format: AudioFormat = "wav",
-    ) -> MusicContinueResult: ...
-
-    @property
-    def model_name(self) -> str: ...
-
-    @property
-    def vram_mb(self) -> int: ...
-
-
-def encode_audio(wav_tensor, sample_rate: int, format: AudioFormat) -> bytes:
-    """Encode a [C, T] or [1, C, T] torch tensor to audio bytes."""
-    import io
-    import torch
-    import torchaudio
-
-    wav = wav_tensor
-    if wav.dim() == 3:
-        wav = wav.squeeze(0)          # [1, C, T] -> [C, T]
-    if wav.dim() == 1:
-        wav = wav.unsqueeze(0)        # [T] -> [1, T]
-    wav = wav.to(torch.float32).cpu()
-
-    buf = io.BytesIO()
-    if format == "wav":
-        torchaudio.save(buf, wav, sample_rate, format="wav")
-    elif format == "mp3":
-        try:
-            torchaudio.save(buf, wav, sample_rate, format="mp3")
-        except Exception:
-            # ffmpeg backend not available; fall back to wav
-            buf = io.BytesIO()
-            torchaudio.save(buf, wav, sample_rate, format="wav")
-    return buf.getvalue()
-
-
-def decode_audio(audio_bytes: bytes) -> tuple:
-    """Decode arbitrary audio bytes to (waveform [C, T], sample_rate)."""
-    import io
-    import torchaudio
-
-    buf = io.BytesIO(audio_bytes)
-    wav, sr = torchaudio.load(buf)
-    return wav, sr
-
-
-def make_musicgen_backend(
-    model_name: str = MODEL_MELODY,
-    *,
-    mock: bool = False,
-    device: str = "cuda",
-) -> MusicGenBackend:
-    if mock:
-        from circuitforge_core.musicgen.backends.mock import MockMusicGenBackend
-        return MockMusicGenBackend()
-    from circuitforge_core.musicgen.backends.audiocraft import AudioCraftBackend
-    return AudioCraftBackend(model_name=model_name, device=device)
--- a/circuitforge_core/musicgen/backends/mock.py
+++ b/circuitforge_core/musicgen/backends/mock.py
@ -1,53 +0,0 @@
-"""
-Mock MusicGenBackend — returns silent WAV audio; no GPU required.
-
-Used in unit tests and CI where GPU is unavailable.
-"""
-from __future__ import annotations
-
-import io
-import struct
-import wave
-
-from circuitforge_core.musicgen.backends.base import AudioFormat, MusicContinueResult
-
-
-class MockMusicGenBackend:
-    """Returns a silent WAV file of the requested duration."""
-
-    @property
-    def model_name(self) -> str:
-        return "mock"
-
-    @property
-    def vram_mb(self) -> int:
-        return 0
-
-    def continue_audio(
-        self,
-        audio_bytes: bytes,
-        *,
-        description: str | None = None,
-        duration_s: float = 15.0,
-        prompt_duration_s: float = 10.0,
-        format: AudioFormat = "wav",
-    ) -> MusicContinueResult:
-        sample_rate = 32000
-        n_samples = int(duration_s * sample_rate)
-        silent_samples = b"\x00\x00" * n_samples  # 16-bit PCM silence
-
-        buf = io.BytesIO()
-        with wave.open(buf, "wb") as wf:
-            wf.setnchannels(1)
-            wf.setsampwidth(2)
-            wf.setframerate(sample_rate)
-            wf.writeframes(silent_samples)
-
-        return MusicContinueResult(
-            audio_bytes=buf.getvalue(),
-            sample_rate=sample_rate,
-            duration_s=duration_s,
-            format="wav",
-            model="mock",
-            prompt_duration_s=prompt_duration_s,
-        )
--- a/circuitforge_core/pipeline/init.py
+++ b/circuitforge_core/pipeline/init.py
@ -1,43 +1,3 @@
-# circuitforge_core/pipeline — FPGA→ASIC crystallization engine
-#
-# Public API: call pipeline.run() from product code instead of llm.router directly.
-# The module transparently checks for crystallized workflows first, falls back
-# to LLM when none match, and records each run for future crystallization.
-from __future__ import annotations
-
-from typing import Any, Callable
-
-from .crystallizer import CrystallizerConfig, crystallize, evaluate_new_run, should_crystallize
-from .executor import ExecutionResult, Executor, StepResult
-from .models import CrystallizedWorkflow, PipelineRun, Step, hash_input
-from .multimodal import MultimodalConfig, MultimodalPipeline, PageResult
-from .recorder import Recorder
-from .registry import Registry
 from .staging import StagingDB

-__all__ = [
-    # models
-    "PipelineRun",
-    "CrystallizedWorkflow",
-    "Step",
-    "hash_input",
-    # recorder
-    "Recorder",
-    # crystallizer
-    "CrystallizerConfig",
-    "crystallize",
-    "evaluate_new_run",
-    "should_crystallize",
-    # registry
-    "Registry",
-    # executor
-    "Executor",
-    "ExecutionResult",
-    "StepResult",
-    # multimodal
-    "MultimodalPipeline",
-    "MultimodalConfig",
-    "PageResult",
-    # legacy stub
-    "StagingDB",
-]
+__all__ = ["StagingDB"]
--- a/circuitforge_core/pipeline/crystallizer.py
+++ b/circuitforge_core/pipeline/crystallizer.py
@ -1,177 +0,0 @@
-# circuitforge_core/pipeline/crystallizer.py — promote approved runs → workflows
-#
-# MIT — pure logic, no inference backends.
-from __future__ import annotations
-
-import logging
-import warnings
-from collections import Counter
-from dataclasses import dataclass, field
-from datetime import datetime, timezone
-from typing import Literal
-
-from .models import CrystallizedWorkflow, PipelineRun, Step
-from .recorder import Recorder
-
-log = logging.getLogger(__name__)
-
-# Minimum milliseconds of review that counts as "genuine".
-# Runs shorter than this are accepted but trigger a warning.
-_RUBBER_STAMP_THRESHOLD_MS = 5_000
-
-
-@dataclass
-class CrystallizerConfig:
-    """Tuning knobs for one product/task-type pair.
-
-    threshold:
-        Minimum number of approved runs required before crystallization.
-        Osprey sets this to 1 (first successful IVR navigation is enough);
-        Peregrine uses 3+ for cover-letter templates.
-    min_review_ms:
-        Approved runs with review_duration_ms below this value generate a
-        warning.  Set to 0 to silence the check (tests, automated approvals).
-    strategy:
-        ``"most_recent"`` — use the latest approved run's steps verbatim.
-        ``"majority"`` — pick each step by majority vote across runs (requires
-        runs to have the same step count; falls back to most_recent otherwise).
-    """
-    threshold: int = 3
-    min_review_ms: int = _RUBBER_STAMP_THRESHOLD_MS
-    strategy: Literal["most_recent", "majority"] = "most_recent"
-
-
-# ── Helpers ───────────────────────────────────────────────────────────────────
-
-def _majority_steps(runs: list[PipelineRun]) -> list[Step] | None:
-    """Return majority-voted steps, or None if run lengths differ."""
-    lengths = {len(r.steps) for r in runs}
-    if len(lengths) != 1:
-        return None
-    n = lengths.pop()
-    result: list[Step] = []
-    for i in range(n):
-        counter: Counter[str] = Counter()
-        step_by_action: dict[str, Step] = {}
-        for r in runs:
-            s = r.steps[i]
-            counter[s.action] += 1
-            step_by_action[s.action] = s
-        winner = counter.most_common(1)[0][0]
-        result.append(step_by_action[winner])
-    return result
-
-
-def _check_review_quality(runs: list[PipelineRun],
-                          min_review_ms: int) -> None:
-    """Warn if any run has a suspiciously short review duration."""
-    if min_review_ms <= 0:
-        return
-    flagged = [r for r in runs if r.review_duration_ms < min_review_ms]
-    if flagged:
-        ids = ", ".join(r.run_id for r in flagged)
-        warnings.warn(
-            f"Crystallizing from {len(flagged)} run(s) with review_duration_ms "
-            f"< {min_review_ms} ms — possible rubber-stamp approval: [{ids}]. "
-            "Verify these were genuinely human-reviewed before deployment.",
-            stacklevel=3,
-        )
-
-
-# ── Public API ────────────────────────────────────────────────────────────────
-
-def should_crystallize(runs: list[PipelineRun],
-                       config: CrystallizerConfig) -> bool:
-    """Return True if *runs* meet the threshold for crystallization."""
-    approved = [r for r in runs if r.approved]
-    return len(approved) >= config.threshold
-
-
-def crystallize(runs: list[PipelineRun],
-                config: CrystallizerConfig,
-                existing_version: int = 0) -> CrystallizedWorkflow:
-    """Promote *runs* into a CrystallizedWorkflow.
-
-    Raises
-    ------
-    ValueError
-        If fewer approved runs than ``config.threshold``, or if the runs
-        span more than one (product, task_type, input_hash) triple.
-    """
-    approved = [r for r in runs if r.approved]
-    if len(approved) < config.threshold:
-        raise ValueError(
-            f"Need {config.threshold} approved runs, got {len(approved)}."
-        )
-
-    # Validate homogeneity
-    products = {r.product for r in approved}
-    task_types = {r.task_type for r in approved}
-    hashes = {r.input_hash for r in approved}
-    if len(products) != 1 or len(task_types) != 1 or len(hashes) != 1:
-        raise ValueError(
-            "All runs must share the same product, task_type, and input_hash. "
-            f"Got products={products}, task_types={task_types}, hashes={hashes}."
-        )
-
-    product = products.pop()
-    task_type = task_types.pop()
-    input_hash = hashes.pop()
-
-    _check_review_quality(approved, config.min_review_ms)
-
-    # Pick canonical steps
-    if config.strategy == "majority":
-        steps = _majority_steps(approved) or approved[-1].steps
-    else:
-        steps = sorted(approved, key=lambda r: r.timestamp)[-1].steps
-
-    avg_ms = sum(r.review_duration_ms for r in approved) // len(approved)
-    all_unmodified = all(not r.output_modified for r in approved)
-
-    workflow_id = f"{product}:{task_type}:{input_hash[:12]}"
-    return CrystallizedWorkflow(
-        workflow_id=workflow_id,
-        product=product,
-        task_type=task_type,
-        input_hash=input_hash,
-        steps=steps,
-        crystallized_at=datetime.now(timezone.utc).isoformat(),
-        run_ids=[r.run_id for r in approved],
-        approval_count=len(approved),
-        avg_review_duration_ms=avg_ms,
-        all_output_unmodified=all_unmodified,
-        version=existing_version + 1,
-    )
-
-
-def evaluate_new_run(
-    run: PipelineRun,
-    recorder: Recorder,
-    config: CrystallizerConfig,
-    existing_version: int = 0,
-) -> CrystallizedWorkflow | None:
-    """Record *run* and return a new workflow if the threshold is now met.
-
-    Products call this after each human-approved execution.  Returns a
-    ``CrystallizedWorkflow`` if crystallization was triggered, ``None``
-    otherwise.
-    """
-    recorder.record(run)
-    if not run.approved:
-        return None
-
-    all_runs = recorder.load_approved(run.product, run.task_type, run.input_hash)
-    if not should_crystallize(all_runs, config):
-        log.debug(
-            "pipeline: %d/%d approved runs for %s:%s — not yet crystallizing",
-            len(all_runs), config.threshold, run.product, run.task_type,
-        )
-        return None
-
-    workflow = crystallize(all_runs, config, existing_version=existing_version)
-    log.info(
-        "pipeline: crystallized %s after %d approvals",
-        workflow.workflow_id, workflow.approval_count,
-    )
-    return workflow
--- a/circuitforge_core/pipeline/executor.py
+++ b/circuitforge_core/pipeline/executor.py
@ -1,157 +0,0 @@
-# circuitforge_core/pipeline/executor.py — deterministic execution with LLM fallback
-#
-# MIT — orchestration logic only; calls product-supplied callables.
-from __future__ import annotations
-
-import logging
-from dataclasses import dataclass, field
-from typing import Any, Callable
-
-from .models import CrystallizedWorkflow, Step
-
-log = logging.getLogger(__name__)
-
-
-@dataclass
-class StepResult:
-    step: Step
-    success: bool
-    output: Any = None
-    error: str | None = None
-
-
-@dataclass
-class ExecutionResult:
-    """Result of running a workflow (deterministic or LLM-assisted).
-
-    Attributes
-    ----------
-    success:
-        True if all steps completed without error.
-    used_deterministic:
-        True if a crystallized workflow was used; False if LLM was called.
-    step_results:
-        Per-step outcomes from the deterministic path.
-    llm_output:
-        Raw output from the LLM fallback path, if used.
-    workflow_id:
-        ID of the workflow used, or None for LLM path.
-    error:
-        Error message if the run failed entirely.
-    """
-    success: bool
-    used_deterministic: bool
-    step_results: list[StepResult] = field(default_factory=list)
-    llm_output: Any = None
-    workflow_id: str | None = None
-    error: str | None = None
-
-
-# ── Executor ──────────────────────────────────────────────────────────────────
-
-class Executor:
-    """Runs crystallized workflows with transparent LLM fallback.
-
-    Parameters
-    ----------
-    step_fn:
-        Called for each Step: ``step_fn(step) -> (success, output)``.
-        The product supplies this — it knows how to turn a Step into a real
-        action (DTMF dial, HTTP call, form field write, etc.).
-    llm_fn:
-        Called when no workflow matches or a step fails: ``llm_fn() -> output``.
-        Products wire this to ``cf_core.llm.router`` or equivalent.
-    llm_fallback:
-        If False, raise RuntimeError instead of calling llm_fn on miss.
-    """
-
-    def __init__(
-        self,
-        step_fn: Callable[[Step], tuple[bool, Any]],
-        llm_fn: Callable[[], Any],
-        llm_fallback: bool = True,
-    ) -> None:
-        self._step_fn = step_fn
-        self._llm_fn = llm_fn
-        self._llm_fallback = llm_fallback
-
-    def execute(
-        self,
-        workflow: CrystallizedWorkflow,
-    ) -> ExecutionResult:
-        """Run *workflow* deterministically.
-
-        If a step fails, falls back to LLM (if ``llm_fallback`` is enabled).
-        """
-        step_results: list[StepResult] = []
-        for step in workflow.steps:
-            try:
-                success, output = self._step_fn(step)
-            except Exception as exc:
-                log.warning("step %s raised: %s", step.action, exc)
-                success, output = False, None
-                error_str = str(exc)
-            else:
-                error_str = None if success else "step_fn returned success=False"
-
-            step_results.append(StepResult(step=step, success=success,
-                                           output=output, error=error_str))
-            if not success:
-                log.info(
-                    "workflow %s: step %s failed — triggering LLM fallback",
-                    workflow.workflow_id, step.action,
-                )
-                return self._llm_fallback_result(
-                    step_results, workflow.workflow_id
-                )
-
-        log.info("workflow %s: all %d steps succeeded",
-                 workflow.workflow_id, len(workflow.steps))
-        return ExecutionResult(
-            success=True,
-            used_deterministic=True,
-            step_results=step_results,
-            workflow_id=workflow.workflow_id,
-        )
-
-    def run_with_fallback(
-        self,
-        workflow: CrystallizedWorkflow | None,
-    ) -> ExecutionResult:
-        """Run *workflow* if provided; otherwise call the LLM directly."""
-        if workflow is None:
-            return self._llm_fallback_result([], workflow_id=None)
-        return self.execute(workflow)
-
-    # ── Internal ──────────────────────────────────────────────────────────────
-
-    def _llm_fallback_result(
-        self,
-        partial_steps: list[StepResult],
-        workflow_id: str | None,
-    ) -> ExecutionResult:
-        if not self._llm_fallback:
-            return ExecutionResult(
-                success=False,
-                used_deterministic=True,
-                step_results=partial_steps,
-                workflow_id=workflow_id,
-                error="LLM fallback disabled and deterministic path failed.",
-            )
-        try:
-            llm_output = self._llm_fn()
-        except Exception as exc:
-            return ExecutionResult(
-                success=False,
-                used_deterministic=False,
-                step_results=partial_steps,
-                workflow_id=workflow_id,
-                error=f"LLM fallback raised: {exc}",
-            )
-        return ExecutionResult(
-            success=True,
-            used_deterministic=False,
-            step_results=partial_steps,
-            llm_output=llm_output,
-            workflow_id=workflow_id,
-        )
--- a/circuitforge_core/pipeline/models.py
+++ b/circuitforge_core/pipeline/models.py
@ -1,216 +0,0 @@
-# circuitforge_core/pipeline/models.py — crystallization data models
-#
-# MIT — protocol and model types only; no inference backends.
-from __future__ import annotations
-
-import hashlib
-import json
-from dataclasses import dataclass, field
-from datetime import datetime, timezone
-from typing import Any
-
-
-# ── Utilities ─────────────────────────────────────────────────────────────────
-
-def hash_input(features: dict[str, Any]) -> str:
-    """Return a stable SHA-256 hex digest of *features*.
-
-    Sorts keys before serialising so insertion order doesn't affect the hash.
-    Only call this on already-normalised, PII-free feature dicts — the hash is
-    opaque but the source dict should never contain raw user data.
-    """
-    canonical = json.dumps(features, sort_keys=True, ensure_ascii=True)
-    return hashlib.sha256(canonical.encode()).hexdigest()
-
-
-# ── Step ──────────────────────────────────────────────────────────────────────
-
-@dataclass
-class Step:
-    """One atomic action in a deterministic workflow.
-
-    The ``action`` string is product-defined (e.g. ``"dtmf"``, ``"field_fill"``,
-    ``"api_call"``).  ``params`` carries action-specific values; ``description``
-    is a plain-English summary for the approval UI.
-    """
-    action: str
-    params: dict[str, Any]
-    description: str = ""
-
-    def to_dict(self) -> dict[str, Any]:
-        return {"action": self.action, "params": self.params,
-                "description": self.description}
-
-    @classmethod
-    def from_dict(cls, d: dict[str, Any]) -> "Step":
-        return cls(action=d["action"], params=d.get("params", {}),
-                   description=d.get("description", ""))
-
-
-# ── PipelineRun ───────────────────────────────────────────────────────────────
-
-@dataclass
-class PipelineRun:
-    """Record of one LLM-assisted execution — the raw material for crystallization.
-
-    Fields
-    ------
-    run_id:
-        UUID or unique string identifying this run.
-    product:
-        CF product code (``"osprey"``, ``"falcon"``, ``"peregrine"`` …).
-    task_type:
-        Product-defined task category (``"ivr_navigate"``, ``"form_fill"`` …).
-    input_hash:
-        SHA-256 of normalised, PII-free input features.  Never store raw input.
-    steps:
-        Ordered list of Steps the LLM proposed.
-    approved:
-        True if a human approved this run before execution.
-    review_duration_ms:
-        Wall-clock milliseconds between displaying the proposal and the approval
-        click.  Values under ~5 000 ms indicate a rubber-stamp — the
-        crystallizer may reject runs with suspiciously short reviews.
-    output_modified:
-        True if the user edited any step before approving.  Modifications suggest
-        the LLM proposal was imperfect; too-easy crystallization from unmodified
-        runs may mean the task is already deterministic and the LLM is just
-        echoing a fixed pattern.
-    timestamp:
-        ISO 8601 UTC creation time.
-    llm_model:
-        Model ID that generated the steps, e.g. ``"llama3:8b-instruct"``.
-    metadata:
-        Freeform dict for product-specific extra fields.
-    """
-
-    run_id: str
-    product: str
-    task_type: str
-    input_hash: str
-    steps: list[Step]
-    approved: bool
-    review_duration_ms: int
-    output_modified: bool
-    timestamp: str = field(default_factory=lambda: datetime.now(timezone.utc).isoformat())
-    llm_model: str | None = None
-    metadata: dict[str, Any] = field(default_factory=dict)
-
-    def to_dict(self) -> dict[str, Any]:
-        return {
-            "run_id": self.run_id,
-            "product": self.product,
-            "task_type": self.task_type,
-            "input_hash": self.input_hash,
-            "steps": [s.to_dict() for s in self.steps],
-            "approved": self.approved,
-            "review_duration_ms": self.review_duration_ms,
-            "output_modified": self.output_modified,
-            "timestamp": self.timestamp,
-            "llm_model": self.llm_model,
-            "metadata": self.metadata,
-        }
-
-    @classmethod
-    def from_dict(cls, d: dict[str, Any]) -> "PipelineRun":
-        return cls(
-            run_id=d["run_id"],
-            product=d["product"],
-            task_type=d["task_type"],
-            input_hash=d["input_hash"],
-            steps=[Step.from_dict(s) for s in d.get("steps", [])],
-            approved=d["approved"],
-            review_duration_ms=d["review_duration_ms"],
-            output_modified=d.get("output_modified", False),
-            timestamp=d.get("timestamp", ""),
-            llm_model=d.get("llm_model"),
-            metadata=d.get("metadata", {}),
-        )
-
-
-# ── CrystallizedWorkflow ──────────────────────────────────────────────────────
-
-@dataclass
-class CrystallizedWorkflow:
-    """A deterministic workflow promoted from N approved PipelineRuns.
-
-    Once crystallized, the executor runs ``steps`` directly — no LLM required
-    unless an edge case is encountered.
-
-    Fields
-    ------
-    workflow_id:
-        Unique identifier (typically ``{product}:{task_type}:{input_hash[:12]}``).
-    product / task_type / input_hash:
-        Same semantics as PipelineRun; the hash is the lookup key.
-    steps:
-        Canonical deterministic step sequence (majority-voted or most-recent,
-        per CrystallizerConfig.strategy).
-    crystallized_at:
-        ISO 8601 UTC timestamp.
-    run_ids:
-        IDs of the source PipelineRuns that contributed to this workflow.
-    approval_count:
-        Number of approved runs that went into crystallization.
-    avg_review_duration_ms:
-        Mean review_duration_ms across all source runs — low values are a
-        warning sign that approvals may not have been genuine.
-    all_output_unmodified:
-        True if every contributing run had output_modified=False.  Combined with
-        a very short avg_review_duration_ms this can flag workflows that may
-        have crystallized from rubber-stamp approvals.
-    active:
-        Whether this workflow is in use.  Set to False to disable without
-        deleting the record.
-    version:
-        Increments each time the workflow is re-crystallized from new runs.
-    """
-
-    workflow_id: str
-    product: str
-    task_type: str
-    input_hash: str
-    steps: list[Step]
-    crystallized_at: str
-    run_ids: list[str]
-    approval_count: int
-    avg_review_duration_ms: int
-    all_output_unmodified: bool
-    active: bool = True
-    version: int = 1
-    metadata: dict[str, Any] = field(default_factory=dict)
-
-    def to_dict(self) -> dict[str, Any]:
-        return {
-            "workflow_id": self.workflow_id,
-            "product": self.product,
-            "task_type": self.task_type,
-            "input_hash": self.input_hash,
-            "steps": [s.to_dict() for s in self.steps],
-            "crystallized_at": self.crystallized_at,
-            "run_ids": self.run_ids,
-            "approval_count": self.approval_count,
-            "avg_review_duration_ms": self.avg_review_duration_ms,
-            "all_output_unmodified": self.all_output_unmodified,
-            "active": self.active,
-            "version": self.version,
-            "metadata": self.metadata,
-        }
-
-    @classmethod
-    def from_dict(cls, d: dict[str, Any]) -> "CrystallizedWorkflow":
-        return cls(
-            workflow_id=d["workflow_id"],
-            product=d["product"],
-            task_type=d["task_type"],
-            input_hash=d["input_hash"],
-            steps=[Step.from_dict(s) for s in d.get("steps", [])],
-            crystallized_at=d["crystallized_at"],
-            run_ids=d.get("run_ids", []),
-            approval_count=d["approval_count"],
-            avg_review_duration_ms=d["avg_review_duration_ms"],
-            all_output_unmodified=d.get("all_output_unmodified", True),
-            active=d.get("active", True),
-            version=d.get("version", 1),
-            metadata=d.get("metadata", {}),
-        )
--- a/circuitforge_core/pipeline/multimodal.py
+++ b/circuitforge_core/pipeline/multimodal.py
@ -1,234 +0,0 @@
-# circuitforge_core/pipeline/multimodal.py — cf-docuvision + cf-text pipeline
-#
-# MIT — orchestration only; vision and text inference stay in their own modules.
-#
-# Usage (minimal):
-#
-#   from circuitforge_core.pipeline.multimodal import MultimodalPipeline, MultimodalConfig
-#
-#   pipe = MultimodalPipeline(MultimodalConfig())
-#   for result in pipe.run(page_bytes_list):
-#       print(f"Page {result.page_idx}: {result.generated[:80]}")
-#
-# Streaming (token-by-token):
-#
-#   for page_idx, token in pipe.stream(page_bytes_list):
-#       ui.append(page_idx, token)
-#
-from __future__ import annotations
-
-import logging
-from collections.abc import Callable, Iterable, Iterator
-from dataclasses import dataclass, field
-from typing import Any
-
-from circuitforge_core.documents.client import DocuvisionClient
-from circuitforge_core.documents.models import StructuredDocument
-
-log = logging.getLogger(__name__)
-
-
-# ── Config ────────────────────────────────────────────────────────────────────
-
-def _default_prompt(page_idx: int, doc: StructuredDocument) -> str:
-    """Build a generation prompt from a StructuredDocument."""
-    header = f"[Page {page_idx + 1}]\n" if page_idx > 0 else ""
-    return header + doc.raw_text
-
-
-@dataclass
-class MultimodalConfig:
-    """Configuration for MultimodalPipeline.
-
-    vision_url:
-        Base URL of the cf-docuvision service.
-    hint:
-        Docuvision extraction hint — ``"auto"`` | ``"document"`` | ``"form"``
-        | ``"table"`` | ``"figure"``.
-    max_tokens:
-        Passed to cf-text generate per page.
-    temperature:
-        Sampling temperature for text generation.
-    vram_serialise:
-        When True, ``swap_fn`` is called between the vision and text steps
-        on each page.  Use this on 8GB GPUs where Dolphin-v2 and the text
-        model cannot be resident simultaneously.
-    prompt_fn:
-        Callable ``(page_idx, StructuredDocument) -> str`` that builds the
-        generation prompt.  Defaults to using ``doc.raw_text`` directly.
-        Products override this to add system context, few-shot examples, etc.
-    vision_timeout:
-        HTTP timeout in seconds for each cf-docuvision request.
-    """
-    vision_url: str = "http://localhost:8003"
-    hint: str = "auto"
-    max_tokens: int = 512
-    temperature: float = 0.7
-    vram_serialise: bool = False
-    prompt_fn: Callable[[int, StructuredDocument], str] = field(
-        default_factory=lambda: _default_prompt
-    )
-    vision_timeout: int = 60
-
-
-# ── Results ───────────────────────────────────────────────────────────────────
-
-@dataclass
-class PageResult:
-    """Result of processing one page through the vision + text pipeline.
-
-    page_idx:
-        Zero-based page index.
-    doc:
-        StructuredDocument from cf-docuvision.
-    generated:
-        Full text output from cf-text for this page.
-    error:
-        Non-None if extraction or generation failed for this page.
-    """
-    page_idx: int
-    doc: StructuredDocument | None
-    generated: str
-    error: str | None = None
-
-
-# ── Pipeline ──────────────────────────────────────────────────────────────────
-
-class MultimodalPipeline:
-    """Chunk a multi-page document through vision extraction + text generation.
-
-    Parameters
-    ----------
-    config:
-        Pipeline configuration.
-    swap_fn:
-        Optional callable with no arguments, called between the vision and text
-        steps on each page when ``config.vram_serialise=True``.  Products using
-        cf-orch wire this to the VRAM budget API so Dolphin-v2 can offload
-        before the text model loads.  A no-op lambda works for testing.
-    generate_fn:
-        Text generation callable: ``(prompt, max_tokens, temperature) -> str``.
-        Defaults to ``circuitforge_core.text.generate``.  Override in tests or
-        when the product manages its own text backend.
-    stream_fn:
-        Streaming text callable: ``(prompt, max_tokens, temperature) -> Iterator[str]``.
-        Defaults to ``circuitforge_core.text.generate`` with ``stream=True``.
-    """
-
-    def __init__(
-        self,
-        config: MultimodalConfig | None = None,
-        *,
-        swap_fn: Callable[[], None] | None = None,
-        generate_fn: Callable[..., str] | None = None,
-        stream_fn: Callable[..., Iterator[str]] | None = None,
-    ) -> None:
-        self._cfg = config or MultimodalConfig()
-        self._vision = DocuvisionClient(
-            base_url=self._cfg.vision_url,
-            timeout=self._cfg.vision_timeout,
-        )
-        self._swap_fn = swap_fn
-        self._generate_fn = generate_fn
-        self._stream_fn = stream_fn
-
-    # ── Public ────────────────────────────────────────────────────────────────
-
-    def run(self, pages: Iterable[bytes]) -> Iterator[PageResult]:
-        """Process each page and yield a PageResult as soon as it is ready.
-
-        Callers receive pages one at a time — the UI can begin rendering
-        page 0 while pages 1..N are still being extracted and generated.
-        """
-        for page_idx, page_bytes in enumerate(pages):
-            yield self._process_page(page_idx, page_bytes)
-
-    def stream(self, pages: Iterable[bytes]) -> Iterator[tuple[int, str]]:
-        """Yield ``(page_idx, token)`` tuples for token-level progressive rendering.
-
-        Each page is fully extracted before text generation begins, but tokens
-        are yielded as the text model produces them rather than waiting for the
-        full page output.
-        """
-        for page_idx, page_bytes in enumerate(pages):
-            doc, err = self._extract(page_idx, page_bytes)
-            if err:
-                yield (page_idx, f"[extraction error: {err}]")
-                continue
-
-            self._maybe_swap()
-
-            prompt = self._cfg.prompt_fn(page_idx, doc)
-            try:
-                for token in self._stream_tokens(prompt):
-                    yield (page_idx, token)
-            except Exception as exc:
-                log.error("page %d text streaming failed: %s", page_idx, exc)
-                yield (page_idx, f"[generation error: {exc}]")
-
-    # ── Internal ──────────────────────────────────────────────────────────────
-
-    def _process_page(self, page_idx: int, page_bytes: bytes) -> PageResult:
-        doc, err = self._extract(page_idx, page_bytes)
-        if err:
-            return PageResult(page_idx=page_idx, doc=None, generated="", error=err)
-
-        self._maybe_swap()
-
-        prompt = self._cfg.prompt_fn(page_idx, doc)
-        try:
-            text = self._generate(prompt)
-        except Exception as exc:
-            log.error("page %d generation failed: %s", page_idx, exc)
-            return PageResult(page_idx=page_idx, doc=doc, generated="",
-                              error=str(exc))
-
-        return PageResult(page_idx=page_idx, doc=doc, generated=text)
-
-    def _extract(
-        self, page_idx: int, page_bytes: bytes
-    ) -> tuple[StructuredDocument | None, str | None]:
-        try:
-            doc = self._vision.extract(page_bytes, hint=self._cfg.hint)
-            log.debug("page %d extracted: %d chars", page_idx, len(doc.raw_text))
-            return doc, None
-        except Exception as exc:
-            log.error("page %d vision extraction failed: %s", page_idx, exc)
-            return None, str(exc)
-
-    def _maybe_swap(self) -> None:
-        if self._cfg.vram_serialise and self._swap_fn is not None:
-            log.debug("vram_serialise: calling swap_fn")
-            self._swap_fn()
-
-    def _generate(self, prompt: str) -> str:
-        if self._generate_fn is not None:
-            return self._generate_fn(
-                prompt,
-                max_tokens=self._cfg.max_tokens,
-                temperature=self._cfg.temperature,
-            )
-        from circuitforge_core.text import generate
-        result = generate(
-            prompt,
-            max_tokens=self._cfg.max_tokens,
-            temperature=self._cfg.temperature,
-        )
-        return result.text
-
-    def _stream_tokens(self, prompt: str) -> Iterator[str]:
-        if self._stream_fn is not None:
-            yield from self._stream_fn(
-                prompt,
-                max_tokens=self._cfg.max_tokens,
-                temperature=self._cfg.temperature,
-            )
-            return
-        from circuitforge_core.text import generate
-        tokens = generate(
-            prompt,
-            max_tokens=self._cfg.max_tokens,
-            temperature=self._cfg.temperature,
-            stream=True,
-        )
-        yield from tokens
--- a/circuitforge_core/pipeline/recorder.py
+++ b/circuitforge_core/pipeline/recorder.py
@ -1,70 +0,0 @@
-# circuitforge_core/pipeline/recorder.py — write and load PipelineRun records
-#
-# MIT — local file I/O only; no inference.
-from __future__ import annotations
-
-import json
-import logging
-from pathlib import Path
-from typing import Iterable
-
-from .models import PipelineRun
-
-log = logging.getLogger(__name__)
-
-_DEFAULT_ROOT = Path.home() / ".config" / "circuitforge" / "pipeline" / "runs"
-
-
-class Recorder:
-    """Writes PipelineRun JSON records to a local directory tree.
-
-    Layout::
-
-        {root}/{product}/{task_type}/{run_id}.json
-
-    The recorder is intentionally append-only — it never deletes or modifies
-    existing records.  Old runs accumulate as an audit trail; products that
-    want retention limits should prune the directory themselves.
-    """
-
-    def __init__(self, root: Path | None = None) -> None:
-        self._root = Path(root) if root else _DEFAULT_ROOT
-
-    # ── Write ─────────────────────────────────────────────────────────────────
-
-    def record(self, run: PipelineRun) -> Path:
-        """Persist *run* to disk and return the file path written."""
-        dest = self._path_for(run.product, run.task_type, run.run_id)
-        dest.parent.mkdir(parents=True, exist_ok=True)
-        dest.write_text(json.dumps(run.to_dict(), indent=2), encoding="utf-8")
-        log.debug("recorded pipeline run %s → %s", run.run_id, dest)
-        return dest
-
-    # ── Read ──────────────────────────────────────────────────────────────────
-
-    def load_runs(self, product: str, task_type: str) -> list[PipelineRun]:
-        """Return all runs for *(product, task_type)*, newest-first."""
-        directory = self._root / product / task_type
-        if not directory.is_dir():
-            return []
-        runs: list[PipelineRun] = []
-        for p in directory.glob("*.json"):
-            try:
-                runs.append(PipelineRun.from_dict(json.loads(p.read_text())))
-            except Exception:
-                log.warning("skipping unreadable run file %s", p)
-        runs.sort(key=lambda r: r.timestamp, reverse=True)
-        return runs
-
-    def load_approved(self, product: str, task_type: str,
-                      input_hash: str) -> list[PipelineRun]:
-        """Return approved runs that match *input_hash*, newest-first."""
-        return [
-            r for r in self.load_runs(product, task_type)
-            if r.approved and r.input_hash == input_hash
-        ]
-
-    # ── Internal ──────────────────────────────────────────────────────────────
-
-    def _path_for(self, product: str, task_type: str, run_id: str) -> Path:
-        return self._root / product / task_type / f"{run_id}.json"
--- a/circuitforge_core/pipeline/registry.py
+++ b/circuitforge_core/pipeline/registry.py
@ -1,134 +0,0 @@
-# circuitforge_core/pipeline/registry.py — workflow lookup
-#
-# MIT — file I/O and matching logic only.
-from __future__ import annotations
-
-import json
-import logging
-from pathlib import Path
-from typing import Callable
-
-from .models import CrystallizedWorkflow
-
-log = logging.getLogger(__name__)
-
-_DEFAULT_ROOT = Path.home() / ".config" / "circuitforge" / "pipeline" / "workflows"
-
-
-class Registry:
-    """Loads and matches CrystallizedWorkflows from the local filesystem.
-
-    Layout::
-
-        {root}/{product}/{task_type}/{workflow_id}.json
-
-    Exact matching is always available.  Products that need fuzzy/semantic
-    matching can supply a ``similarity_fn`` — a callable that takes two input
-    hashes and returns a float in [0, 1].  The registry returns the first
-    active workflow whose similarity score meets ``fuzzy_threshold``.
-    """
-
-    def __init__(
-        self,
-        root: Path | None = None,
-        similarity_fn: Callable[[str, str], float] | None = None,
-        fuzzy_threshold: float = 0.8,
-    ) -> None:
-        self._root = Path(root) if root else _DEFAULT_ROOT
-        self._similarity_fn = similarity_fn
-        self._fuzzy_threshold = fuzzy_threshold
-
-    # ── Write ─────────────────────────────────────────────────────────────────
-
-    def register(self, workflow: CrystallizedWorkflow) -> Path:
-        """Persist *workflow* and return the path written."""
-        dest = self._path_for(workflow.product, workflow.task_type,
-                              workflow.workflow_id)
-        dest.parent.mkdir(parents=True, exist_ok=True)
-        dest.write_text(json.dumps(workflow.to_dict(), indent=2), encoding="utf-8")
-        log.info("registered workflow %s (v%d)", workflow.workflow_id,
-                 workflow.version)
-        return dest
-
-    def deactivate(self, workflow_id: str, product: str,
-                   task_type: str) -> bool:
-        """Set ``active=False`` on a stored workflow.  Returns True if found."""
-        path = self._path_for(product, task_type, workflow_id)
-        if not path.exists():
-            return False
-        data = json.loads(path.read_text())
-        data["active"] = False
-        path.write_text(json.dumps(data, indent=2), encoding="utf-8")
-        log.info("deactivated workflow %s", workflow_id)
-        return True
-
-    # ── Read ──────────────────────────────────────────────────────────────────
-
-    def load_all(self, product: str, task_type: str) -> list[CrystallizedWorkflow]:
-        """Return all (including inactive) workflows for *(product, task_type)*."""
-        directory = self._root / product / task_type
-        if not directory.is_dir():
-            return []
-        workflows: list[CrystallizedWorkflow] = []
-        for p in directory.glob("*.json"):
-            try:
-                workflows.append(
-                    CrystallizedWorkflow.from_dict(json.loads(p.read_text()))
-                )
-            except Exception:
-                log.warning("skipping unreadable workflow file %s", p)
-        return workflows
-
-    # ── Match ─────────────────────────────────────────────────────────────────
-
-    def match(self, product: str, task_type: str,
-              input_hash: str) -> CrystallizedWorkflow | None:
-        """Return the active workflow for an exact input_hash match, or None."""
-        for wf in self.load_all(product, task_type):
-            if wf.active and wf.input_hash == input_hash:
-                log.debug("registry exact match: %s", wf.workflow_id)
-                return wf
-        return None
-
-    def fuzzy_match(self, product: str, task_type: str,
-                    input_hash: str) -> CrystallizedWorkflow | None:
-        """Return a workflow above the similarity threshold, or None.
-
-        Requires a ``similarity_fn`` to have been supplied at construction.
-        If none was provided, raises ``RuntimeError``.
-        """
-        if self._similarity_fn is None:
-            raise RuntimeError(
-                "fuzzy_match() requires a similarity_fn — none was supplied "
-                "to Registry.__init__()."
-            )
-        best: CrystallizedWorkflow | None = None
-        best_score = 0.0
-        for wf in self.load_all(product, task_type):
-            if not wf.active:
-                continue
-            score = self._similarity_fn(wf.input_hash, input_hash)
-            if score >= self._fuzzy_threshold and score > best_score:
-                best = wf
-                best_score = score
-        if best:
-            log.debug("registry fuzzy match: %s (score=%.2f)", best.workflow_id,
-                      best_score)
-        return best
-
-    def find(self, product: str, task_type: str,
-             input_hash: str) -> CrystallizedWorkflow | None:
-        """Exact match first; fuzzy match second (if similarity_fn is set)."""
-        exact = self.match(product, task_type, input_hash)
-        if exact:
-            return exact
-        if self._similarity_fn is not None:
-            return self.fuzzy_match(product, task_type, input_hash)
-        return None
-
-    # ── Internal ──────────────────────────────────────────────────────────────
-
-    def _path_for(self, product: str, task_type: str,
-                  workflow_id: str) -> Path:
-        safe_id = workflow_id.replace(":", "_")
-        return self._root / product / task_type / f"{safe_id}.json"
--- a/Show more
+++ b/Show more
				`@ -1 +0,0 @@`
				`"""circuitforge_core.musicgen — music continuation service (BSL 1.1)."""`