From ae0ac19505b8b32fd5c3257c8fb70667348dc5e6 Mon Sep 17 00:00:00 2001
From: pyr0ball <pyroballpcs@gmail.com>
Date: Wed, 8 Apr 2026 06:18:12 -0700
Subject: [PATCH] chore: retire Streamlit app, scaffold sft branch
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Delete app/label_tool.py (Streamlit UI retired; Vue SPA is sole UI)
- Extract _strip_html and _extract_body into app/utils.py (stdlib-only, reusable)
- Update tests/test_label_tool.py import to app.utils
- Rename start-api/stop-api/restart-api/open-api → start/stop/restart/open in manage.sh
- Remove STREAMLIT variable and all Streamlit-specific case blocks from manage.sh
- Update manage.sh usage section to reflect Vue+FastAPI-only commands
- Add data/sft_candidates.jsonl and data/sft_approved.jsonl to .gitignore
- Add sft.bench_results_dir key to config/label_tool.yaml.example
---
 .gitignore                     |    2 +
 app/label_tool.py              | 1186 --------------------------------
 app/utils.py                   |   85 +++
 config/label_tool.yaml.example |    5 +
 manage.sh                      |  200 ++----
 tests/test_label_tool.py       |    2 +-
 6 files changed, 135 insertions(+), 1345 deletions(-)
 delete mode 100644 app/label_tool.py
 create mode 100644 app/utils.py

diff --git a/.gitignore b/.gitignore
index 06104ed..fc48446 100644
--- a/.gitignore
+++ b/.gitignore
@@ -11,6 +11,8 @@ config/label_tool.yaml
 data/email_score.jsonl
 data/email_label_queue.jsonl
 data/email_compare_sample.jsonl
+data/sft_candidates.jsonl
+data/sft_approved.jsonl
 
 # Conda/pip artifacts
 .env
diff --git a/app/label_tool.py b/app/label_tool.py
deleted file mode 100644
index c86d09b..0000000
--- a/app/label_tool.py
+++ /dev/null
@@ -1,1186 +0,0 @@
-"""Email Label Tool — card-stack UI for building classifier benchmark data.
-
-Philosophy: Scrape → Store → Process
-  Fetch (IMAP, wide search, multi-account) → data/email_label_queue.jsonl
-  Label (card stack)                       → data/email_score.jsonl
-
-Run:
-    conda run -n job-seeker streamlit run app/label_tool.py --server.port 8503
-
-Config: config/label_tool.yaml  (gitignored — see config/label_tool.yaml.example)
-"""
-from __future__ import annotations
-
-import email as _email_lib
-import hashlib
-import html as _html
-from html.parser import HTMLParser
-import imaplib
-import json
-import re
-import sys
-from datetime import datetime, timedelta
-from email.header import decode_header as _raw_decode
-from pathlib import Path
-from typing import Any
-
-import os
-import subprocess
-
-import streamlit as st
-import yaml
-
-# ── Path setup ─────────────────────────────────────────────────────────────
-_ROOT = Path(__file__).parent.parent
-sys.path.insert(0, str(_ROOT))
-
-_QUEUE_FILE = _ROOT / "data" / "email_label_queue.jsonl"
-_SCORE_FILE = _ROOT / "data" / "email_score.jsonl"
-_CFG_FILE   = _ROOT / "config" / "label_tool.yaml"
-
-# ── Labels ─────────────────────────────────────────────────────────────────
-LABELS = [
-    "interview_scheduled",
-    "offer_received",
-    "rejected",
-    "positive_response",
-    "survey_received",
-    "neutral",
-    "event_rescheduled",
-    "digest",
-    "new_lead",
-    "hired",
-]
-
-_LABEL_META: dict[str, dict] = {
-    "interview_scheduled": {"emoji": "🗓️", "color": "#4CAF50", "key": "1"},
-    "offer_received":      {"emoji": "🎉", "color": "#2196F3", "key": "2"},
-    "rejected":            {"emoji": "❌", "color": "#F44336", "key": "3"},
-    "positive_response":   {"emoji": "👍", "color": "#FF9800", "key": "4"},
-    "survey_received":     {"emoji": "📋", "color": "#9C27B0", "key": "5"},
-    "neutral":             {"emoji": "⬜", "color": "#607D8B", "key": "6"},
-    "event_rescheduled":   {"emoji": "🔄", "color": "#FF5722", "key": "7"},
-    "digest":              {"emoji": "📰", "color": "#00BCD4", "key": "8"},
-    "new_lead":            {"emoji": "🤝", "color": "#009688", "key": "9"},
-    "hired":               {"emoji": "🎊", "color": "#FFC107", "key": "h"},
-}
-
-# ── HTML sanitiser ───────────────────────────────────────────────────────────
-# Valid chars per XML 1.0 §2.2 (same set HTML5 innerHTML enforces):
-#   #x9 | #xA | #xD | [#x20–#xD7FF] | [#xE000–#xFFFD] | [#x10000–#x10FFFF]
-# Anything outside this range causes InvalidCharacterError in the browser.
-_INVALID_XML_CHARS = re.compile(
-    r"[^\x09\x0A\x0D\x20-\uD7FF\uE000-\uFFFD\U00010000-\U0010FFFF]"
-)
-
-def _to_html(text: str, newlines_to_br: bool = False) -> str:
-    """Strip invalid XML chars, HTML-escape the result, optionally convert \\n → <br>."""
-    if not text:
-        return ""
-    cleaned = _INVALID_XML_CHARS.sub("", text)
-    escaped = _html.escape(cleaned)
-    if newlines_to_br:
-        escaped = escaped.replace("\n", "<br>")
-    return escaped
-
-
-# ── HTML → plain-text extractor ─────────────────────────────────────────────
-
-class _TextExtractor(HTMLParser):
-    """Extract visible text from an HTML email body, preserving line breaks."""
-    _BLOCK = {"p","div","br","li","tr","h1","h2","h3","h4","h5","h6","blockquote"}
-    _SKIP  = {"script","style","head","noscript"}
-
-    def __init__(self):
-        super().__init__(convert_charrefs=True)
-        self._parts: list[str] = []
-        self._depth_skip = 0
-
-    def handle_starttag(self, tag, attrs):
-        tag = tag.lower()
-        if tag in self._SKIP:
-            self._depth_skip += 1
-        elif tag in self._BLOCK:
-            self._parts.append("\n")
-
-    def handle_endtag(self, tag):
-        if tag.lower() in self._SKIP:
-            self._depth_skip = max(0, self._depth_skip - 1)
-
-    def handle_data(self, data):
-        if not self._depth_skip:
-            self._parts.append(data)
-
-    def get_text(self) -> str:
-        text = "".join(self._parts)
-        lines = [ln.strip() for ln in text.splitlines()]
-        return "\n".join(ln for ln in lines if ln)
-
-
-def _strip_html(html_str: str) -> str:
-    """Convert HTML email body to plain text. Pure stdlib, no dependencies."""
-    try:
-        extractor = _TextExtractor()
-        extractor.feed(html_str)
-        return extractor.get_text()
-    except Exception:
-        return re.sub(r"<[^>]+>", " ", html_str).strip()
-
-
-# ── Wide IMAP search terms (cast a net across all 10 categories) ────────────
-_WIDE_TERMS = [
-    # interview_scheduled
-    "interview", "phone screen", "video call", "zoom link", "schedule a call",
-    # offer_received
-    "offer letter", "job offer", "offer of employment", "pleased to offer",
-    # rejected
-    "unfortunately", "not moving forward", "other candidates", "regret to inform",
-    "no longer", "decided not to", "decided to go with",
-    # positive_response
-    "opportunity", "interested in your background", "reached out", "great fit",
-    "exciting role", "love to connect",
-    # survey_received
-    "assessment", "questionnaire", "culture fit", "culture-fit", "online assessment",
-    # neutral / ATS confirms
-    "application received", "thank you for applying", "application confirmation",
-    "you applied", "your application for",
-    # event_rescheduled
-    "reschedule", "rescheduled", "new time", "moved to", "postponed", "new date",
-    # digest
-    "job digest", "jobs you may like", "recommended jobs", "jobs for you",
-    "new jobs", "job alert",
-    # new_lead
-    "came across your profile", "reaching out about", "great fit for a role",
-    "exciting opportunity", "love to connect",
-    # hired / onboarding
-    "welcome to the team", "start date", "onboarding", "first day", "we're excited to have you",
-    # general recruitment
-    "application", "recruiter", "recruiting", "hiring", "candidate",
-]
-
-
-# ── IMAP helpers ────────────────────────────────────────────────────────────
-
-def _decode_str(value: str | None) -> str:
-    if not value:
-        return ""
-    parts = _raw_decode(value)
-    out = []
-    for part, enc in parts:
-        if isinstance(part, bytes):
-            out.append(part.decode(enc or "utf-8", errors="replace"))
-        else:
-            out.append(str(part))
-    return " ".join(out).strip()
-
-
-def _extract_body(msg: Any) -> str:
-    """Return plain-text body. Strips HTML when no text/plain part exists."""
-    if msg.is_multipart():
-        html_fallback: str | None = None
-        for part in msg.walk():
-            ct = part.get_content_type()
-            if ct == "text/plain":
-                try:
-                    charset = part.get_content_charset() or "utf-8"
-                    return part.get_payload(decode=True).decode(charset, errors="replace")
-                except Exception:
-                    pass
-            elif ct == "text/html" and html_fallback is None:
-                try:
-                    charset = part.get_content_charset() or "utf-8"
-                    raw = part.get_payload(decode=True).decode(charset, errors="replace")
-                    html_fallback = _strip_html(raw)
-                except Exception:
-                    pass
-        return html_fallback or ""
-    else:
-        try:
-            charset = msg.get_content_charset() or "utf-8"
-            raw = msg.get_payload(decode=True).decode(charset, errors="replace")
-            if msg.get_content_type() == "text/html":
-                return _strip_html(raw)
-            return raw
-        except Exception:
-            pass
-    return ""
-
-
-def _test_imap_connection(acc: dict) -> tuple[bool, str]:
-    """Try connect → login → select folder. Returns (ok, human message)."""
-    host     = acc.get("host", "")
-    port     = int(acc.get("port", 993))
-    use_ssl  = acc.get("use_ssl", True)
-    username = acc.get("username", "")
-    password = acc.get("password", "")
-    folder   = acc.get("folder", "INBOX")
-    if not host or not username or not password:
-        return False, "Host, username, and password are all required."
-    try:
-        conn = (imaplib.IMAP4_SSL if use_ssl else imaplib.IMAP4)(host, port)
-        conn.login(username, password)
-        typ, data = conn.select(folder, readonly=True)
-        count = data[0].decode() if data and data[0] else "?"
-        conn.logout()
-        return True, f"Connected — {count} message(s) in {folder}."
-    except Exception as exc:
-        return False, str(exc)
-
-
-def _fetch_account(cfg: dict, days: int, limit: int, known_keys: set[str],
-                   progress_cb=None) -> list[dict]:
-    """Fetch emails from one IMAP account using wide recruitment search terms."""
-    since = (datetime.now() - timedelta(days=days)).strftime("%d-%b-%Y")
-    host     = cfg.get("host", "imap.gmail.com")
-    port     = int(cfg.get("port", 993))
-    use_ssl  = cfg.get("use_ssl", True)
-    username = cfg["username"]
-    password = cfg["password"]
-    name     = cfg.get("name", username)
-
-    conn = (imaplib.IMAP4_SSL if use_ssl else imaplib.IMAP4)(host, port)
-    conn.login(username, password)
-
-    seen_uids: dict[bytes, None] = {}
-    conn.select("INBOX", readonly=True)
-    for term in _WIDE_TERMS:
-        try:
-            _, data = conn.search(None, f'(SUBJECT "{term}" SINCE "{since}")')
-            for uid in (data[0] or b"").split():
-                seen_uids[uid] = None
-        except Exception:
-            pass
-
-    emails: list[dict] = []
-    uids = list(seen_uids.keys())[:limit * 3]  # overfetch; filter after dedup
-    for i, uid in enumerate(uids):
-        if len(emails) >= limit:
-            break
-        if progress_cb:
-            progress_cb(i / len(uids), f"{name}: {len(emails)} fetched…")
-        try:
-            _, raw_data = conn.fetch(uid, "(RFC822)")
-            if not raw_data or not raw_data[0]:
-                continue
-            msg  = _email_lib.message_from_bytes(raw_data[0][1])
-            subj = _decode_str(msg.get("Subject", ""))
-            from_addr = _decode_str(msg.get("From", ""))
-            date  = _decode_str(msg.get("Date", ""))
-            body  = _extract_body(msg)[:800]
-            entry = {
-                "subject":   subj,
-                "body":      body,
-                "from_addr": from_addr,
-                "date":      date,
-                "account":   name,
-            }
-            key = _entry_key(entry)
-            if key not in known_keys:
-                known_keys.add(key)
-                emails.append(entry)
-        except Exception:
-            pass
-
-    try:
-        conn.logout()
-    except Exception:
-        pass
-    return emails
-
-
-def _fetch_targeted(
-    cfg: dict,
-    since_dt: datetime, before_dt: datetime,
-    term: str, field: str,
-    limit: int,
-    known_keys: set[str],
-    progress_cb=None,
-) -> list[dict]:
-    """Fetch emails within a date range, optionally filtered by sender/subject.
-
-    field: "from" | "subject" | "either" | "none"
-    """
-    since  = since_dt.strftime("%d-%b-%Y")
-    before = before_dt.strftime("%d-%b-%Y")
-    host    = cfg.get("host", "imap.gmail.com")
-    port    = int(cfg.get("port", 993))
-    use_ssl = cfg.get("use_ssl", True)
-    username = cfg["username"]
-    password = cfg["password"]
-    name    = cfg.get("name", username)
-
-    conn = (imaplib.IMAP4_SSL if use_ssl else imaplib.IMAP4)(host, port)
-    conn.login(username, password)
-    conn.select("INBOX", readonly=True)
-
-    date_part = f'SINCE "{since}" BEFORE "{before}"'
-    if term and field == "from":
-        search_str = f'(FROM "{term}") {date_part}'
-    elif term and field == "subject":
-        search_str = f'(SUBJECT "{term}") {date_part}'
-    elif term and field == "either":
-        search_str = f'(OR (FROM "{term}") (SUBJECT "{term}")) {date_part}'
-    else:
-        search_str = date_part
-
-    try:
-        _, data = conn.search(None, search_str)
-        uids = (data[0] or b"").split()
-    except Exception:
-        uids = []
-
-    emails: list[dict] = []
-    for i, uid in enumerate(uids):
-        if len(emails) >= limit:
-            break
-        if progress_cb:
-            progress_cb(i / max(len(uids), 1), f"{name}: {len(emails)} fetched…")
-        try:
-            _, raw_data = conn.fetch(uid, "(RFC822)")
-            if not raw_data or not raw_data[0]:
-                continue
-            msg = _email_lib.message_from_bytes(raw_data[0][1])
-            subj     = _decode_str(msg.get("Subject", ""))
-            from_addr = _decode_str(msg.get("From", ""))
-            date      = _decode_str(msg.get("Date", ""))
-            body      = _extract_body(msg)[:800]
-            entry = {
-                "subject": subj, "body": body,
-                "from_addr": from_addr, "date": date,
-                "account": name,
-            }
-            key = _entry_key(entry)
-            if key not in known_keys:
-                known_keys.add(key)
-                emails.append(entry)
-        except Exception:
-            pass
-
-    try:
-        conn.logout()
-    except Exception:
-        pass
-    return emails
-
-
-# ── Queue / score file helpers ───────────────────────────────────────────────
-
-def _entry_key(e: dict) -> str:
-    return hashlib.md5(
-        (e.get("subject", "") + (e.get("body") or "")[:100]).encode()
-    ).hexdigest()
-
-
-def _load_jsonl(path: Path) -> list[dict]:
-    if not path.exists():
-        return []
-    rows = []
-    with path.open() as f:
-        for line in f:
-            line = line.strip()
-            if line:
-                try:
-                    rows.append(json.loads(line))
-                except Exception:
-                    pass
-    return rows
-
-
-def _save_jsonl(path: Path, rows: list[dict]) -> None:
-    path.parent.mkdir(parents=True, exist_ok=True)
-    with path.open("w") as f:
-        for row in rows:
-            f.write(json.dumps(row, ensure_ascii=False) + "\n")
-
-
-def _append_jsonl(path: Path, row: dict) -> None:
-    path.parent.mkdir(parents=True, exist_ok=True)
-    with path.open("a") as f:
-        f.write(json.dumps(row, ensure_ascii=False) + "\n")
-
-
-# ── Config ──────────────────────────────────────────────────────────────────
-
-def _load_config() -> list[dict]:
-    if not _CFG_FILE.exists():
-        return []
-    cfg = yaml.safe_load(_CFG_FILE.read_text()) or {}
-    return cfg.get("accounts", [])
-
-
-# ── Page setup ──────────────────────────────────────────────────────────────
-
-st.set_page_config(
-    page_title="Avocet — Email Labeler",
-    page_icon="📬",
-    layout="wide",
-)
-
-st.markdown("""
-<style>
-/* Card stack */
-.email-card {
-    border: 1px solid rgba(128,128,128,0.25);
-    border-radius: 14px;
-    padding: 28px 32px;
-    box-shadow: 0 6px 24px rgba(0,0,0,0.18);
-    margin-bottom: 4px;
-    position: relative;
-}
-.card-stack-hint {
-    height: 10px;
-    border-radius: 0 0 12px 12px;
-    border: 1px solid rgba(128,128,128,0.15);
-    margin: 0 16px;
-    box-shadow: 0 4px 12px rgba(0,0,0,0.10);
-}
-.card-stack-hint2 {
-    height: 8px;
-    border-radius: 0 0 10px 10px;
-    border: 1px solid rgba(128,128,128,0.08);
-    margin: 0 32px;
-}
-/* Subject line */
-.card-subject { font-size: 1.3rem; font-weight: 700; margin-bottom: 6px; }
-.card-meta { font-size: 0.82rem; opacity: 0.6; margin-bottom: 16px; }
-.card-body { font-size: 0.92rem; opacity: 0.85; white-space: pre-wrap; line-height: 1.5; }
-/* Bucket buttons */
-div[data-testid="stButton"] > button.bucket-btn {
-    height: 70px;
-    font-size: 1.05rem;
-    font-weight: 600;
-    border-radius: 12px;
-}
-</style>
-""", unsafe_allow_html=True)
-
-st.title("📬 Avocet — Email Label Tool")
-st.caption("Scrape → Store → Process  |  card-stack edition")
-
-# ── Session state init ───────────────────────────────────────────────────────
-
-if "queue" not in st.session_state:
-    st.session_state.queue: list[dict] = _load_jsonl(_QUEUE_FILE)
-
-if "labeled" not in st.session_state:
-    st.session_state.labeled: list[dict] = _load_jsonl(_SCORE_FILE)
-    st.session_state.labeled_keys: set[str] = {
-        _entry_key(r) for r in st.session_state.labeled
-    }
-
-if "idx" not in st.session_state:
-    # Start past already-labeled entries in the queue
-    labeled_keys = st.session_state.labeled_keys
-    for i, entry in enumerate(st.session_state.queue):
-        if _entry_key(entry) not in labeled_keys:
-            st.session_state.idx = i
-            break
-    else:
-        st.session_state.idx = len(st.session_state.queue)
-
-if "history" not in st.session_state:
-    st.session_state.history: list[tuple[int, str]] = []  # (queue_idx, label)
-
-
-# ── Sidebar stats ────────────────────────────────────────────────────────────
-
-with st.sidebar:
-    labeled = st.session_state.labeled
-    queue   = st.session_state.queue
-    unlabeled = [e for e in queue if _entry_key(e) not in st.session_state.labeled_keys]
-
-    st.metric("✅ Labeled", len(labeled))
-    st.metric("📥 Queue", len(unlabeled))
-
-    if labeled:
-        st.caption("**Label distribution**")
-        counts = {lbl: 0 for lbl in LABELS}
-        for r in labeled:
-            counts[r.get("label", "")] = counts.get(r.get("label", ""), 0) + 1
-        for lbl in LABELS:
-            m = _LABEL_META[lbl]
-            st.caption(f"{m['emoji']} {lbl}: **{counts[lbl]}**")
-
-
-# ── Tabs ─────────────────────────────────────────────────────────────────────
-
-tab_label, tab_fetch, tab_stats, tab_settings, tab_benchmark = st.tabs(
-    ["🃏 Label", "📥 Fetch", "📊 Stats", "⚙️ Settings", "🔬 Benchmark"]
-)
-
-
-# ══════════════════════════════════════════════════════════════════════════════
-# FETCH TAB
-# ══════════════════════════════════════════════════════════════════════════════
-
-with tab_fetch:
-    accounts = _load_config()
-
-    if not accounts:
-        st.warning(
-            f"No accounts configured. Copy `config/label_tool.yaml.example` → "
-            f"`config/label_tool.yaml` and add your IMAP accounts.",
-            icon="⚠️",
-        )
-    else:
-        st.markdown(f"**{len(accounts)} account(s) configured:**")
-        for acc in accounts:
-            st.caption(f"• {acc.get('name', acc.get('username'))} ({acc.get('host')})")
-
-    col_days, col_limit = st.columns(2)
-    days  = col_days.number_input("Days back", min_value=7, max_value=730, value=180)
-    limit = col_limit.number_input("Max emails per account", min_value=10, max_value=1000, value=150)
-
-    all_accs = [a.get("name", a.get("username")) for a in accounts]
-    selected = st.multiselect("Accounts to fetch", all_accs, default=all_accs)
-
-    if st.button("📥 Fetch from IMAP", disabled=not accounts or not selected, type="primary"):
-        existing_keys = {_entry_key(e) for e in st.session_state.queue}
-        existing_keys.update(st.session_state.labeled_keys)
-
-        fetched_all: list[dict] = []
-        status = st.status("Fetching…", expanded=True)
-        # Single updatable slot for per-email progress — overwrites instead of appending
-        _live = status.empty()
-
-        for acc in accounts:
-            name = acc.get("name", acc.get("username"))
-            if name not in selected:
-                continue
-            status.write(f"Connecting to **{name}**…")
-            try:
-                emails = _fetch_account(
-                    acc, days=int(days), limit=int(limit),
-                    known_keys=existing_keys,
-                    progress_cb=lambda p, msg: _live.markdown(f"⏳ {msg}"),
-                )
-                _live.empty()  # clear progress line once account is done
-                fetched_all.extend(emails)
-                status.write(f"✓ {name}: {len(emails)} new emails")
-            except Exception as e:
-                _live.empty()
-                status.write(f"✗ {name}: {e}")
-
-        if fetched_all:
-            _save_jsonl(_QUEUE_FILE, st.session_state.queue + fetched_all)
-            st.session_state.queue = _load_jsonl(_QUEUE_FILE)
-            # Reset idx to first unlabeled
-            labeled_keys = st.session_state.labeled_keys
-            for i, entry in enumerate(st.session_state.queue):
-                if _entry_key(entry) not in labeled_keys:
-                    st.session_state.idx = i
-                    break
-            status.update(label=f"Done — {len(fetched_all)} new emails added to queue", state="complete")
-        else:
-            status.update(label="No new emails found (all already in queue or score file)", state="complete")
-
-    # ── Targeted fetch ───────────────────────────────────────────────────────
-    st.divider()
-    with st.expander("🎯 Targeted Fetch — date range + keyword"):
-        st.caption(
-            "Pull emails within a specific date window, optionally filtered by "
-            "sender or subject. Use this to retrieve historical hiring threads."
-        )
-
-        _t1, _t2 = st.columns(2)
-        _one_year_ago = (datetime.now() - timedelta(days=365)).date()
-        t_since  = _t1.date_input("From date", value=_one_year_ago, key="t_since")
-        t_before = _t2.date_input("To date",   value=datetime.now().date(), key="t_before")
-
-        t_term = st.text_input(
-            "Filter by keyword (optional)",
-            placeholder="e.g. Stateside",
-            key="t_term",
-        )
-        _tf1, _tf2 = st.columns(2)
-        t_field_label = _tf1.selectbox(
-            "Search in",
-            ["Either (from or subject)", "Sender/from", "Subject line"],
-            key="t_field",
-        )
-        t_limit = _tf2.number_input("Max emails", min_value=10, max_value=1000, value=300, key="t_limit")
-
-        t_accs = st.multiselect("Accounts", all_accs, default=all_accs, key="t_accs")
-
-        _field_map = {
-            "Either (from or subject)": "either",
-            "Sender/from": "from",
-            "Subject line": "subject",
-        }
-
-        _t_invalid = not accounts or not t_accs or t_since >= t_before
-        if st.button("🎯 Targeted Fetch", disabled=_t_invalid, type="primary", key="btn_targeted"):
-            _t_since_dt  = datetime(t_since.year,  t_since.month,  t_since.day)
-            _t_before_dt = datetime(t_before.year, t_before.month, t_before.day)
-            _t_field     = _field_map[t_field_label]
-
-            existing_keys = {_entry_key(e) for e in st.session_state.queue}
-            existing_keys.update(st.session_state.labeled_keys)
-
-            fetched_all: list[dict] = []
-            status = st.status("Fetching…", expanded=True)
-            _live = status.empty()
-
-            for acc in accounts:
-                name = acc.get("name", acc.get("username"))
-                if name not in t_accs:
-                    continue
-                status.write(f"Connecting to **{name}**…")
-                try:
-                    emails = _fetch_targeted(
-                        acc,
-                        since_dt=_t_since_dt, before_dt=_t_before_dt,
-                        term=t_term.strip(), field=_t_field,
-                        limit=int(t_limit),
-                        known_keys=existing_keys,
-                        progress_cb=lambda p, msg: _live.markdown(f"⏳ {msg}"),
-                    )
-                    _live.empty()
-                    fetched_all.extend(emails)
-                    status.write(f"✓ {name}: {len(emails)} new emails")
-                except Exception as e:
-                    _live.empty()
-                    status.write(f"✗ {name}: {e}")
-
-            if fetched_all:
-                _save_jsonl(_QUEUE_FILE, st.session_state.queue + fetched_all)
-                st.session_state.queue = _load_jsonl(_QUEUE_FILE)
-                labeled_keys = st.session_state.labeled_keys
-                for i, entry in enumerate(st.session_state.queue):
-                    if _entry_key(entry) not in labeled_keys:
-                        st.session_state.idx = i
-                        break
-                status.update(
-                    label=f"Done — {len(fetched_all)} new emails added to queue",
-                    state="complete",
-                )
-            else:
-                status.update(
-                    label="No new emails found in that date range",
-                    state="complete",
-                )
-
-
-# ══════════════════════════════════════════════════════════════════════════════
-# LABEL TAB
-# ══════════════════════════════════════════════════════════════════════════════
-
-with tab_label:
-    queue   = st.session_state.queue
-    labeled_keys = st.session_state.labeled_keys
-    idx     = st.session_state.idx
-
-    # Advance idx past already-labeled entries
-    while idx < len(queue) and _entry_key(queue[idx]) in labeled_keys:
-        idx += 1
-    st.session_state.idx = idx
-
-    unlabeled = [e for e in queue if _entry_key(e) not in labeled_keys]
-    total_in_queue = len(queue)
-    n_labeled = len(st.session_state.labeled)
-
-    if not queue:
-        st.info("Queue is empty — go to **Fetch** to pull emails from IMAP.", icon="📥")
-    elif not unlabeled:
-        st.success(
-            f"🎉 All {n_labeled} emails labeled! Go to **Stats** to review and export.",
-            icon="✅",
-        )
-    else:
-        # Progress
-        labeled_in_queue = total_in_queue - len(unlabeled)
-        progress_pct = labeled_in_queue / total_in_queue if total_in_queue else 0
-        st.progress(progress_pct, text=f"{labeled_in_queue} / {total_in_queue} labeled in queue")
-
-        # Current email
-        entry = queue[idx]
-
-        # Card HTML
-        subj  = entry.get("subject", "(no subject)") or "(no subject)"
-        from_ = entry.get("from_addr", "") or ""
-        date_ = entry.get("date", "") or ""
-        acct  = entry.get("account", "") or ""
-        body  = (entry.get("body") or "").strip()
-
-        st.markdown(
-            f"""<div class="email-card">
-<div class="card-meta">{_to_html(from_)} &nbsp;·&nbsp; {_to_html(date_[:16])} &nbsp;·&nbsp; <em>{_to_html(acct)}</em></div>
-<div class="card-subject">{_to_html(subj)}</div>
-<div class="card-body">{_to_html(body[:500], newlines_to_br=True)}</div>
-</div>""",
-            unsafe_allow_html=True,
-        )
-        if len(body) > 500:
-            with st.expander("Show full body"):
-                st.text(body)
-
-        # Stack hint (visual depth)
-        st.markdown('<div class="card-stack-hint"></div>', unsafe_allow_html=True)
-        st.markdown('<div class="card-stack-hint2"></div>', unsafe_allow_html=True)
-
-        st.markdown("")  # spacer
-
-        # ── Bucket buttons ────────────────────────────────────────────────
-        def _do_label(label: str) -> None:
-            row = {"subject": entry.get("subject", ""), "body": body[:600], "label": label}
-            st.session_state.labeled.append(row)
-            st.session_state.labeled_keys.add(_entry_key(entry))
-            _append_jsonl(_SCORE_FILE, row)
-            st.session_state.history.append((idx, label))
-            # Advance
-            next_idx = idx + 1
-            while next_idx < len(queue) and _entry_key(queue[next_idx]) in labeled_keys:
-                next_idx += 1
-            st.session_state.idx = next_idx
-
-        # Pre-compute per-label counts once
-        _counts: dict[str, int] = {}
-        for _r in st.session_state.labeled:
-            _lbl_r = _r.get("label", "")
-            _counts[_lbl_r] = _counts.get(_lbl_r, 0) + 1
-
-        row1_cols = st.columns(5)
-        row2_cols = st.columns(5)
-        bucket_pairs = [
-            (row1_cols[0], "interview_scheduled"),
-            (row1_cols[1], "offer_received"),
-            (row1_cols[2], "rejected"),
-            (row1_cols[3], "positive_response"),
-            (row1_cols[4], "survey_received"),
-            (row2_cols[0], "neutral"),
-            (row2_cols[1], "event_rescheduled"),
-            (row2_cols[2], "digest"),
-            (row2_cols[3], "new_lead"),
-            (row2_cols[4], "hired"),
-        ]
-        for col, lbl in bucket_pairs:
-            m = _LABEL_META[lbl]
-            cnt = _counts.get(lbl, 0)
-            label_display = f"{m['emoji']} **{lbl}** [{cnt}]\n`{m['key']}`"
-            if col.button(label_display, key=f"lbl_{lbl}", use_container_width=True):
-                _do_label(lbl)
-                st.rerun()
-
-        # ── Wildcard label ─────────────────────────────────────────────────
-        if "show_custom" not in st.session_state:
-            st.session_state.show_custom = False
-
-        other_col, _ = st.columns([1, 2])
-        if other_col.button("🏷️ Other… `0`", key="lbl_other_toggle", use_container_width=True):
-            st.session_state.show_custom = not st.session_state.show_custom
-            st.rerun()
-
-        if st.session_state.get("show_custom"):
-            custom_cols = st.columns([3, 1])
-            custom_val = custom_cols[0].text_input(
-                "Custom label:", key="custom_label_text",
-                placeholder="e.g. linkedin_outreach",
-                label_visibility="collapsed",
-            )
-            if custom_cols[1].button(
-                "✓ Apply", key="apply_custom", type="primary",
-                disabled=not (custom_val or "").strip(),
-            ):
-                _do_label(custom_val.strip().lower().replace(" ", "_"))
-                st.session_state.show_custom = False
-                st.rerun()
-
-        # ── Navigation ────────────────────────────────────────────────────
-        st.markdown("")
-        nav_cols = st.columns([2, 1, 1, 1])
-
-        remaining = len(unlabeled) - 1
-        nav_cols[0].caption(f"**{remaining}** remaining  ·  Keys: 1–9, H = label, 0 = other, S = skip, U = undo")
-
-        if nav_cols[1].button("↩ Undo", disabled=not st.session_state.history, use_container_width=True):
-            prev_idx, prev_label = st.session_state.history.pop()
-            # Remove the last labeled entry
-            if st.session_state.labeled:
-                removed = st.session_state.labeled.pop()
-                st.session_state.labeled_keys.discard(_entry_key(removed))
-                _save_jsonl(_SCORE_FILE, st.session_state.labeled)
-            st.session_state.idx = prev_idx
-            st.rerun()
-
-        if nav_cols[2].button("→ Skip", use_container_width=True):
-            next_idx = idx + 1
-            while next_idx < len(queue) and _entry_key(queue[next_idx]) in labeled_keys:
-                next_idx += 1
-            st.session_state.idx = next_idx
-            st.rerun()
-
-        if nav_cols[3].button("🗑️ Discard", use_container_width=True):
-            # Remove from queue entirely — not written to score file
-            st.session_state.queue = [e for e in queue if _entry_key(e) != _entry_key(entry)]
-            _save_jsonl(_QUEUE_FILE, st.session_state.queue)
-            next_idx = min(idx, len(st.session_state.queue) - 1)
-            while next_idx < len(st.session_state.queue) and _entry_key(st.session_state.queue[next_idx]) in labeled_keys:
-                next_idx += 1
-            st.session_state.idx = max(next_idx, 0)
-            st.rerun()
-
-        # Keyboard shortcut capture (JS → hidden button click)
-        st.components.v1.html(
-            """<script>
-document.addEventListener('keydown', function(e) {
-    if (e.target.tagName === 'INPUT' || e.target.tagName === 'TEXTAREA') return;
-    const keyToLabel = {
-        '1':'interview_scheduled','2':'offer_received','3':'rejected',
-        '4':'positive_response','5':'survey_received','6':'neutral',
-        '7':'event_rescheduled','8':'digest','9':'new_lead'
-    };
-    const label = keyToLabel[e.key];
-    if (label) {
-        const btns = window.parent.document.querySelectorAll('button');
-        for (const btn of btns) {
-            if (btn.innerText.toLowerCase().includes(label.replace('_',' '))) {
-                btn.click(); break;
-            }
-        }
-    } else if (e.key === '0') {
-        const btns = window.parent.document.querySelectorAll('button');
-        for (const btn of btns) {
-            if (btn.innerText.includes('Other')) { btn.click(); break; }
-        }
-    } else if (e.key.toLowerCase() === 'h') {
-        const btns = window.parent.document.querySelectorAll('button');
-        for (const btn of btns) {
-            if (btn.innerText.toLowerCase().includes('hired')) { btn.click(); break; }
-        }
-    } else if (e.key.toLowerCase() === 's') {
-        const btns = window.parent.document.querySelectorAll('button');
-        for (const btn of btns) {
-            if (btn.innerText.includes('Skip')) { btn.click(); break; }
-        }
-    } else if (e.key.toLowerCase() === 'u') {
-        const btns = window.parent.document.querySelectorAll('button');
-        for (const btn of btns) {
-            if (btn.innerText.includes('Undo')) { btn.click(); break; }
-        }
-    }
-});
-</script>""",
-            height=0,
-        )
-
-
-# ══════════════════════════════════════════════════════════════════════════════
-# STATS TAB
-# ══════════════════════════════════════════════════════════════════════════════
-
-with tab_stats:
-    labeled = st.session_state.labeled
-
-    if not labeled:
-        st.info("No labeled emails yet.")
-    else:
-        counts: dict[str, int] = {}
-        for r in labeled:
-            lbl = r.get("label", "")
-            if lbl:
-                counts[lbl] = counts.get(lbl, 0) + 1
-
-        st.markdown(f"**{len(labeled)} labeled emails total**")
-
-        # Show known labels first, then any custom labels
-        all_display_labels = list(LABELS) + [l for l in counts if l not in LABELS]
-        max_count = max(counts.values()) if counts else 1
-        for lbl in all_display_labels:
-            if lbl not in counts:
-                continue
-            m = _LABEL_META.get(lbl)
-            emoji = m["emoji"] if m else "🏷️"
-            col_name, col_bar, col_n = st.columns([3, 5, 1])
-            col_name.markdown(f"{emoji} {lbl}")
-            col_bar.progress(counts[lbl] / max_count)
-            col_n.markdown(f"**{counts[lbl]}**")
-
-        st.divider()
-
-        st.caption(
-            f"Score file: `{_SCORE_FILE.relative_to(_ROOT)}`  "
-            f"({_SCORE_FILE.stat().st_size if _SCORE_FILE.exists() else 0:,} bytes)"
-        )
-        if st.button("🔄 Re-sync from disk"):
-            st.session_state.labeled = _load_jsonl(_SCORE_FILE)
-            st.session_state.labeled_keys = {_entry_key(r) for r in st.session_state.labeled}
-            st.rerun()
-
-        if _SCORE_FILE.exists():
-            st.download_button(
-                "⬇️ Download email_score.jsonl",
-                data=_SCORE_FILE.read_bytes(),
-                file_name="email_score.jsonl",
-                mime="application/jsonlines",
-            )
-
-
-# ══════════════════════════════════════════════════════════════════════════════
-# SETTINGS TAB
-# ══════════════════════════════════════════════════════════════════════════════
-
-def _sync_settings_to_state() -> None:
-    """Collect current widget values back into settings_accounts, then clear
-    widget keys so the next render picks up freshly from the updated list."""
-    accounts = st.session_state.get("settings_accounts", [])
-    synced = []
-    for i in range(len(accounts)):
-        synced.append({
-            "name":      st.session_state.get(f"s_name_{i}",   accounts[i].get("name", "")),
-            "host":      st.session_state.get(f"s_host_{i}",   accounts[i].get("host", "imap.gmail.com")),
-            "port":      int(st.session_state.get(f"s_port_{i}", accounts[i].get("port", 993))),
-            "use_ssl":   bool(st.session_state.get(f"s_ssl_{i}",  accounts[i].get("use_ssl", True))),
-            "username":  st.session_state.get(f"s_user_{i}",   accounts[i].get("username", "")),
-            "password":  st.session_state.get(f"s_pass_{i}",   accounts[i].get("password", "")),
-            "folder":    st.session_state.get(f"s_folder_{i}", accounts[i].get("folder", "INBOX")),
-            "days_back": int(st.session_state.get(f"s_days_{i}", accounts[i].get("days_back", 90))),
-        })
-    st.session_state.settings_accounts = synced
-    for key in list(st.session_state.keys()):
-        if key.startswith("s_"):
-            del st.session_state[key]
-
-
-with tab_settings:
-    # ── Init from disk on first load ─────────────────────────────────────────
-    if "settings_accounts" not in st.session_state:
-        _cfg_raw = yaml.safe_load(_CFG_FILE.read_text()) or {} if _CFG_FILE.exists() else {}
-        st.session_state.settings_accounts = [dict(a) for a in _cfg_raw.get("accounts", [])]
-        st.session_state.settings_max = _cfg_raw.get("max_per_account", 500)
-
-    _accs = st.session_state.settings_accounts
-
-    st.subheader("📧 IMAP Accounts")
-    st.caption(
-        "Credentials are saved to `config/label_tool.yaml` (gitignored). "
-        "Use an **App Password** for Gmail/Outlook — not your login password."
-    )
-
-    if not _accs:
-        st.info("No accounts configured yet. Click **➕ Add account** to get started.", icon="📭")
-
-    _to_remove = None
-    for _i, _acc in enumerate(_accs):
-        _label = f"**{_acc.get('name', 'Unnamed')}** — {_acc.get('username', '(no username)')}"
-        with st.expander(_label, expanded=not _acc.get("username")):
-            _c1, _c2 = st.columns(2)
-            _c1.text_input("Display name",  key=f"s_name_{_i}", value=_acc.get("name", ""))
-            _c2.text_input("IMAP host",     key=f"s_host_{_i}", value=_acc.get("host", "imap.gmail.com"))
-
-            _c3, _c4, _c5 = st.columns([3, 2, 1])
-            _c3.text_input("Username / email", key=f"s_user_{_i}", value=_acc.get("username", ""))
-            _c4.number_input("Port", key=f"s_port_{_i}", value=int(_acc.get("port", 993)),
-                             min_value=1, max_value=65535, step=1)
-            _c5.checkbox("SSL", key=f"s_ssl_{_i}", value=bool(_acc.get("use_ssl", True)))
-
-            st.text_input("Password / app password", key=f"s_pass_{_i}",
-                          value=_acc.get("password", ""), type="password")
-
-            _c6, _c7 = st.columns(2)
-            _c6.text_input("Folder",     key=f"s_folder_{_i}", value=_acc.get("folder", "INBOX"))
-            _c7.number_input("Default days back", key=f"s_days_{_i}",
-                             value=int(_acc.get("days_back", 90)), min_value=1, max_value=730)
-
-            _btn_l, _btn_r = st.columns([1, 3])
-            if _btn_l.button("🗑️ Remove", key=f"s_remove_{_i}"):
-                _to_remove = _i
-            if _btn_r.button("🔌 Test connection", key=f"s_test_{_i}"):
-                _test_acc = {
-                    "host":     st.session_state.get(f"s_host_{_i}",   _acc.get("host", "")),
-                    "port":     st.session_state.get(f"s_port_{_i}",   _acc.get("port", 993)),
-                    "use_ssl":  st.session_state.get(f"s_ssl_{_i}",    _acc.get("use_ssl", True)),
-                    "username": st.session_state.get(f"s_user_{_i}",   _acc.get("username", "")),
-                    "password": st.session_state.get(f"s_pass_{_i}",   _acc.get("password", "")),
-                    "folder":   st.session_state.get(f"s_folder_{_i}", _acc.get("folder", "INBOX")),
-                }
-                with st.spinner("Connecting…"):
-                    _ok, _msg = _test_imap_connection(_test_acc)
-                if _ok:
-                    st.success(_msg)
-                else:
-                    st.error(f"Connection failed: {_msg}")
-
-    if _to_remove is not None:
-        _sync_settings_to_state()
-        st.session_state.settings_accounts.pop(_to_remove)
-        st.rerun()
-
-    if st.button("➕ Add account"):
-        _sync_settings_to_state()
-        st.session_state.settings_accounts.append({
-            "name": f"Account {len(_accs) + 1}",
-            "host": "imap.gmail.com", "port": 993, "use_ssl": True,
-            "username": "", "password": "", "folder": "INBOX", "days_back": 90,
-        })
-        st.rerun()
-
-    st.divider()
-    st.subheader("⚙️ Global Settings")
-    st.number_input(
-        "Max emails per account per fetch (0 = unlimited)",
-        key="s_max_per_account",
-        value=st.session_state.settings_max,
-        min_value=0, max_value=5000, step=50,
-    )
-
-    st.divider()
-    _save_col, _reload_col = st.columns([3, 1])
-    if _save_col.button("💾 Save settings", type="primary", use_container_width=True):
-        _saved_accounts = []
-        for _i in range(len(st.session_state.settings_accounts)):
-            _a = st.session_state.settings_accounts[_i]
-            _saved_accounts.append({
-                "name":      st.session_state.get(f"s_name_{_i}",   _a.get("name", "")),
-                "host":      st.session_state.get(f"s_host_{_i}",   _a.get("host", "imap.gmail.com")),
-                "port":      int(st.session_state.get(f"s_port_{_i}", _a.get("port", 993))),
-                "use_ssl":   bool(st.session_state.get(f"s_ssl_{_i}",  _a.get("use_ssl", True))),
-                "username":  st.session_state.get(f"s_user_{_i}",   _a.get("username", "")),
-                "password":  st.session_state.get(f"s_pass_{_i}",   _a.get("password", "")),
-                "folder":    st.session_state.get(f"s_folder_{_i}", _a.get("folder", "INBOX")),
-                "days_back": int(st.session_state.get(f"s_days_{_i}", _a.get("days_back", 90))),
-            })
-        _cfg_out = {
-            "accounts": _saved_accounts,
-            "max_per_account": int(st.session_state.get("s_max_per_account", 500)),
-        }
-        _CFG_FILE.parent.mkdir(parents=True, exist_ok=True)
-        _CFG_FILE.write_text(yaml.dump(_cfg_out, default_flow_style=False, allow_unicode=True))
-        st.session_state.settings_accounts = _saved_accounts
-        st.session_state.settings_max = _cfg_out["max_per_account"]
-        st.success(f"Saved {len(_saved_accounts)} account(s) to `config/label_tool.yaml`.")
-
-    if _reload_col.button("↩ Reload", use_container_width=True, help="Discard unsaved changes and reload from disk"):
-        for _k in list(st.session_state.keys()):
-            if _k in ("settings_accounts", "settings_max") or _k.startswith("s_"):
-                del st.session_state[_k]
-        st.rerun()
-
-
-# ══════════════════════════════════════════════════════════════════════════════
-# BENCHMARK TAB
-# ══════════════════════════════════════════════════════════════════════════════
-
-with tab_benchmark:
-    # ── Model selection ───────────────────────────────────────────────────────
-    _DEFAULT_MODELS = [
-        "deberta-zeroshot", "deberta-small", "gliclass-large",
-        "bart-mnli", "bge-m3-zeroshot", "deberta-small-2pass", "deberta-base-anli",
-    ]
-    _SLOW_MODELS = [
-        "deberta-large-ling", "mdeberta-xnli-2m", "bge-reranker",
-        "deberta-xlarge", "mdeberta-mnli", "xlm-roberta-anli",
-    ]
-
-    st.subheader("🔬 Benchmark Classifier Models")
-
-    _b_include_slow = st.checkbox("Include slow / large models", value=False, key="b_include_slow")
-    _b_all_models = _DEFAULT_MODELS + (_SLOW_MODELS if _b_include_slow else [])
-    _b_selected = st.multiselect(
-        "Models to run",
-        options=_b_all_models,
-        default=_b_all_models,
-        help="Uncheck models to skip them. Slow models require --include-slow.",
-    )
-
-    _n_examples = len(st.session_state.labeled)
-    st.caption(
-        f"Scoring against `{_SCORE_FILE.name}` · **{_n_examples} labeled examples**"
-        f"  ·  Est. time: ~{max(1, len(_b_selected))} – {max(2, len(_b_selected) * 2)} min"
-    )
-
-    # Direct binary avoids conda's output interception; -u = unbuffered stdout
-    _CLASSIFIER_PYTHON = "/devl/miniconda3/envs/job-seeker-classifiers/bin/python"
-
-    if st.button("▶ Run Benchmark", type="primary", disabled=not _b_selected, key="b_run"):
-        _b_cmd = [
-            _CLASSIFIER_PYTHON, "-u",
-            str(_ROOT / "scripts" / "benchmark_classifier.py"),
-            "--score", "--score-file", str(_SCORE_FILE),
-            "--models", *_b_selected,
-        ]
-        with st.status("Running benchmark…", expanded=True) as _b_status:
-            _b_proc = subprocess.Popen(
-                _b_cmd, stdout=subprocess.PIPE, stderr=subprocess.STDOUT,
-                text=True, cwd=str(_ROOT),
-                env={**os.environ, "PYTHONUNBUFFERED": "1"},
-            )
-            _b_lines: list[str] = []
-            _b_area = st.empty()
-            for _b_line in _b_proc.stdout:
-                _b_lines.append(_b_line)
-                _b_area.code("".join(_b_lines[-30:]), language="text")
-            _b_proc.wait()
-            _b_full = "".join(_b_lines)
-            st.session_state["bench_output"] = _b_full
-            if _b_proc.returncode == 0:
-                _b_status.update(label="Benchmark complete ✓", state="complete", expanded=False)
-            else:
-                _b_status.update(label="Benchmark failed", state="error")
-
-    # ── Results display ───────────────────────────────────────────────────────
-    if "bench_output" in st.session_state:
-        _b_out = st.session_state["bench_output"]
-
-        # Parse summary table rows: name  f1  accuracy  ms
-        _b_rows = []
-        for _b_l in _b_out.splitlines():
-            _b_m = re.match(r"^([\w-]+)\s+([\d.]+)\s+([\d.]+)\s+([\d.]+)\s*$", _b_l.strip())
-            if _b_m:
-                _b_rows.append({
-                    "Model": _b_m.group(1),
-                    "macro-F1": float(_b_m.group(2)),
-                    "Accuracy": float(_b_m.group(3)),
-                    "ms/email": float(_b_m.group(4)),
-                })
-
-        if _b_rows:
-            import pandas as _pd
-            _b_df = _pd.DataFrame(_b_rows).sort_values("macro-F1", ascending=False).reset_index(drop=True)
-            st.dataframe(
-                _b_df,
-                column_config={
-                    "macro-F1": st.column_config.ProgressColumn(
-                        "macro-F1", min_value=0, max_value=1, format="%.3f",
-                    ),
-                    "Accuracy": st.column_config.ProgressColumn(
-                        "Accuracy", min_value=0, max_value=1, format="%.3f",
-                    ),
-                    "ms/email": st.column_config.NumberColumn("ms/email", format="%.1f"),
-                },
-                use_container_width=True, hide_index=True,
-            )
-
-        with st.expander("Full benchmark output"):
-            st.code(_b_out, language="text")
-
-    st.divider()
-
-    # ── Tests ─────────────────────────────────────────────────────────────────
-    st.subheader("🧪 Run Tests")
-    st.caption("Runs `pytest tests/ -v` in the job-seeker env (no model downloads required).")
-
-    if st.button("▶ Run Tests", key="b_run_tests"):
-        _t_cmd = [
-            "/devl/miniconda3/envs/job-seeker/bin/pytest", "tests/", "-v", "--tb=short",
-        ]
-        with st.status("Running tests…", expanded=True) as _t_status:
-            _t_proc = subprocess.Popen(
-                _t_cmd, stdout=subprocess.PIPE, stderr=subprocess.STDOUT,
-                text=True, cwd=str(_ROOT),
-            )
-            _t_lines: list[str] = []
-            _t_area = st.empty()
-            for _t_line in _t_proc.stdout:
-                _t_lines.append(_t_line)
-                _t_area.code("".join(_t_lines[-30:]), language="text")
-            _t_proc.wait()
-            _t_full = "".join(_t_lines)
-            st.session_state["test_output"] = _t_full
-            _t_summary = [l for l in _t_lines if "passed" in l or "failed" in l or "error" in l.lower()]
-            _t_label = _t_summary[-1].strip() if _t_summary else "Done"
-            _t_state = "error" if _t_proc.returncode != 0 else "complete"
-            _t_status.update(label=_t_label, state=_t_state, expanded=False)
-
-    if "test_output" in st.session_state:
-        with st.expander("Full test output", expanded=True):
-            st.code(st.session_state["test_output"], language="text")
diff --git a/app/utils.py b/app/utils.py
new file mode 100644
index 0000000..3a250ea
--- /dev/null
+++ b/app/utils.py
@@ -0,0 +1,85 @@
+"""Shared email utility functions for Avocet.
+
+Pure-stdlib helpers extracted from the retired label_tool.py Streamlit app.
+These are reused by the FastAPI backend and the test suite.
+"""
+from __future__ import annotations
+
+import re
+from html.parser import HTMLParser
+from typing import Any
+
+
+# ── HTML → plain-text extractor ──────────────────────────────────────────────
+
+class _TextExtractor(HTMLParser):
+    """Extract visible text from an HTML email body, preserving line breaks."""
+    _BLOCK = {"p", "div", "br", "li", "tr", "h1", "h2", "h3", "h4", "h5", "h6", "blockquote"}
+    _SKIP  = {"script", "style", "head", "noscript"}
+
+    def __init__(self):
+        super().__init__(convert_charrefs=True)
+        self._parts: list[str] = []
+        self._depth_skip = 0
+
+    def handle_starttag(self, tag, attrs):
+        tag = tag.lower()
+        if tag in self._SKIP:
+            self._depth_skip += 1
+        elif tag in self._BLOCK:
+            self._parts.append("\n")
+
+    def handle_endtag(self, tag):
+        if tag.lower() in self._SKIP:
+            self._depth_skip = max(0, self._depth_skip - 1)
+
+    def handle_data(self, data):
+        if not self._depth_skip:
+            self._parts.append(data)
+
+    def get_text(self) -> str:
+        text = "".join(self._parts)
+        lines = [ln.strip() for ln in text.splitlines()]
+        return "\n".join(ln for ln in lines if ln)
+
+
+def _strip_html(html_str: str) -> str:
+    """Convert HTML email body to plain text. Pure stdlib, no dependencies."""
+    try:
+        extractor = _TextExtractor()
+        extractor.feed(html_str)
+        return extractor.get_text()
+    except Exception:
+        return re.sub(r"<[^>]+>", " ", html_str).strip()
+
+
+def _extract_body(msg: Any) -> str:
+    """Return plain-text body. Strips HTML when no text/plain part exists."""
+    if msg.is_multipart():
+        html_fallback: str | None = None
+        for part in msg.walk():
+            ct = part.get_content_type()
+            if ct == "text/plain":
+                try:
+                    charset = part.get_content_charset() or "utf-8"
+                    return part.get_payload(decode=True).decode(charset, errors="replace")
+                except Exception:
+                    pass
+            elif ct == "text/html" and html_fallback is None:
+                try:
+                    charset = part.get_content_charset() or "utf-8"
+                    raw = part.get_payload(decode=True).decode(charset, errors="replace")
+                    html_fallback = _strip_html(raw)
+                except Exception:
+                    pass
+        return html_fallback or ""
+    else:
+        try:
+            charset = msg.get_content_charset() or "utf-8"
+            raw = msg.get_payload(decode=True).decode(charset, errors="replace")
+            if msg.get_content_type() == "text/html":
+                return _strip_html(raw)
+            return raw
+        except Exception:
+            pass
+    return ""
diff --git a/config/label_tool.yaml.example b/config/label_tool.yaml.example
index 8f80b18..9310d21 100644
--- a/config/label_tool.yaml.example
+++ b/config/label_tool.yaml.example
@@ -21,3 +21,8 @@ accounts:
 
 # Optional: limit emails fetched per account per run (0 = unlimited)
 max_per_account: 500
+
+# cf-orch SFT candidate import — path to the bench_results/ directory
+# produced by circuitforge-orch's benchmark harness.
+sft:
+  bench_results_dir: /path/to/circuitforge-orch/scripts/bench_results
diff --git a/manage.sh b/manage.sh
index fbd0ed4..734a188 100755
--- a/manage.sh
+++ b/manage.sh
@@ -21,7 +21,6 @@ DEFAULT_PORT=8503
 CONDA_BASE="${CONDA_BASE:-/devl/miniconda3}"
 ENV_UI="job-seeker"
 ENV_BM="job-seeker-classifiers"
-STREAMLIT="${CONDA_BASE}/envs/${ENV_UI}/bin/streamlit"
 PYTHON_BM="${CONDA_BASE}/envs/${ENV_BM}/bin/python"
 PYTHON_UI="${CONDA_BASE}/envs/${ENV_UI}/bin/python"
 
@@ -79,13 +78,11 @@ usage() {
     echo ""
     echo "  Usage: ./manage.sh <command> [args]"
     echo ""
-    echo "  Label tool:"
-    echo -e "    ${GREEN}start${NC}                    Start label tool UI (port collision-safe)"
-    echo -e "    ${GREEN}stop${NC}                     Stop label tool UI"
-    echo -e "    ${GREEN}restart${NC}                  Restart label tool UI"
-    echo -e "    ${GREEN}status${NC}                   Show running state and port"
-    echo -e "    ${GREEN}logs${NC}                     Tail label tool log output"
-    echo -e "    ${GREEN}open${NC}                     Open label tool in browser"
+    echo "  Vue UI + FastAPI:"
+    echo -e "    ${GREEN}start${NC}                    Build Vue SPA + start FastAPI on port 8503"
+    echo -e "    ${GREEN}stop${NC}                     Stop FastAPI server"
+    echo -e "    ${GREEN}restart${NC}                  Stop + rebuild + restart FastAPI server"
+    echo -e "    ${GREEN}open${NC}                     Open Vue UI in browser (http://localhost:8503)"
     echo ""
     echo "  Benchmark:"
     echo -e "    ${GREEN}benchmark [args]${NC}         Run benchmark_classifier.py (args passed through)"
@@ -93,12 +90,6 @@ usage() {
     echo -e "    ${GREEN}score [args]${NC}             Shortcut: --score [args]"
     echo -e "    ${GREEN}compare [args]${NC}           Shortcut: --compare [args]"
     echo ""
-    echo "  Vue API:"
-    echo -e "    ${GREEN}start-api${NC}                Build Vue SPA + start FastAPI on port 8503"
-    echo -e "    ${GREEN}stop-api${NC}                 Stop FastAPI server"
-    echo -e "    ${GREEN}restart-api${NC}              Stop + rebuild + restart FastAPI server"
-    echo -e "    ${GREEN}open-api${NC}                 Open Vue UI in browser (http://localhost:8503)"
-    echo ""
     echo "  Dev:"
     echo -e "    ${GREEN}test${NC}                     Run pytest suite"
     echo ""
@@ -121,102 +112,61 @@ shift || true
 case "$CMD" in
 
     start)
-        pid=$(_running_pid)
-        if [[ -n "$pid" ]]; then
-            port=$(_running_port)
-            warn "Already running (PID ${pid}) on port ${port} → http://localhost:${port}"
+        API_PID_FILE=".avocet-api.pid"
+        API_PORT=8503
+        if [[ -f "$API_PID_FILE" ]] && kill -0 "$(<"$API_PID_FILE")" 2>/dev/null; then
+            warn "API already running (PID $(<"$API_PID_FILE")) → http://localhost:${API_PORT}"
             exit 0
         fi
-
-        if [[ ! -x "$STREAMLIT" ]]; then
-            error "Streamlit not found at ${STREAMLIT}\nActivate env: conda run -n ${ENV_UI} ..."
-        fi
-
-        port=$(_find_free_port "$DEFAULT_PORT")
         mkdir -p "$LOG_DIR"
-
-        info "Starting label tool on port ${port}…"
-        nohup "$STREAMLIT" run app/label_tool.py \
-            --server.port "$port" \
-            --server.headless true \
-            --server.fileWatcherType none \
-            >"$LOG_FILE" 2>&1 &
-
-        pid=$!
-        echo "$pid"  > "$PID_FILE"
-        echo "$port" > "$PORT_FILE"
-
-        # Wait briefly and confirm the process survived
-        sleep 1
-        if kill -0 "$pid" 2>/dev/null; then
-            success "Avocet label tool started → http://localhost:${port}  (PID ${pid})"
-            success "Logs: ${LOG_FILE}"
-        else
-            rm -f "$PID_FILE" "$PORT_FILE"
-            error "Process died immediately. Check ${LOG_FILE} for details."
+        API_LOG="${LOG_DIR}/api.log"
+        info "Building Vue SPA…"
+        (cd web && npm run build) >> "$API_LOG" 2>&1
+        info "Starting FastAPI on port ${API_PORT}…"
+        nohup "$PYTHON_UI" -m uvicorn app.api:app \
+            --host 0.0.0.0 --port "$API_PORT" \
+            >> "$API_LOG" 2>&1 &
+        echo $! > "$API_PID_FILE"
+        # Poll until port is actually bound (up to 10 s), not just process alive
+        for _i in $(seq 1 20); do
+            sleep 0.5
+            if (echo "" >/dev/tcp/127.0.0.1/"$API_PORT") 2>/dev/null; then
+                success "Avocet started → http://localhost:${API_PORT}  (PID $(<"$API_PID_FILE"))"
+                break
+            fi
+            if ! kill -0 "$(<"$API_PID_FILE")" 2>/dev/null; then
+                rm -f "$API_PID_FILE"
+                error "Server died during startup. Check ${API_LOG}"
+            fi
+        done
+        if ! (echo "" >/dev/tcp/127.0.0.1/"$API_PORT") 2>/dev/null; then
+            error "Server did not bind to port ${API_PORT} within 10 s. Check ${API_LOG}"
         fi
         ;;
 
     stop)
-        pid=$(_running_pid)
-        if [[ -z "$pid" ]]; then
+        API_PID_FILE=".avocet-api.pid"
+        if [[ ! -f "$API_PID_FILE" ]]; then
             warn "Not running."
             exit 0
         fi
-        info "Stopping label tool (PID ${pid})…"
-        kill "$pid"
-        # Wait up to 5 s for clean exit
-        for _ in $(seq 1 10); do
-            kill -0 "$pid" 2>/dev/null || break
-            sleep 0.5
-        done
-        if kill -0 "$pid" 2>/dev/null; then
-            warn "Process did not exit cleanly; sending SIGKILL…"
-            kill -9 "$pid" 2>/dev/null || true
+        PID="$(<"$API_PID_FILE")"
+        if kill -0 "$PID" 2>/dev/null; then
+            kill "$PID" && rm -f "$API_PID_FILE"
+            success "Stopped (PID ${PID})."
+        else
+            warn "Stale PID file (process ${PID} not running). Cleaning up."
+            rm -f "$API_PID_FILE"
         fi
-        rm -f "$PID_FILE" "$PORT_FILE"
-        success "Stopped."
         ;;
 
     restart)
-        pid=$(_running_pid)
-        if [[ -n "$pid" ]]; then
-            info "Stopping existing process (PID ${pid})…"
-            kill "$pid"
-            for _ in $(seq 1 10); do
-                kill -0 "$pid" 2>/dev/null || break
-                sleep 0.5
-            done
-            kill -0 "$pid" 2>/dev/null && kill -9 "$pid" 2>/dev/null || true
-            rm -f "$PID_FILE" "$PORT_FILE"
-        fi
+        bash "$0" stop
         exec bash "$0" start
         ;;
 
-    status)
-        pid=$(_running_pid)
-        if [[ -n "$pid" ]]; then
-            port=$(_running_port)
-            success "Running  — PID ${pid}  port ${port}  → http://localhost:${port}"
-        else
-            warn "Not running."
-        fi
-        ;;
-
-    logs)
-        if [[ ! -f "$LOG_FILE" ]]; then
-            warn "No log file found at ${LOG_FILE}. Has the tool been started?"
-            exit 0
-        fi
-        info "Tailing ${LOG_FILE} (Ctrl-C to stop)"
-        tail -f "$LOG_FILE"
-        ;;
-
     open)
-        port=$(_running_port)
-        pid=$(_running_pid)
-        [[ -z "$pid" ]] && warn "Label tool does not appear to be running. Start with: ./manage.sh start"
-        URL="http://localhost:${port}"
+        URL="http://localhost:8503"
         info "Opening ${URL}"
         if command -v xdg-open &>/dev/null; then
             xdg-open "$URL"
@@ -257,72 +207,6 @@ case "$CMD" in
         exec "$0" benchmark --compare "$@"
         ;;
 
-    start-api)
-        API_PID_FILE=".avocet-api.pid"
-        API_PORT=8503
-        if [[ -f "$API_PID_FILE" ]] && kill -0 "$(<"$API_PID_FILE")" 2>/dev/null; then
-            warn "API already running (PID $(<"$API_PID_FILE")) → http://localhost:${API_PORT}"
-            exit 0
-        fi
-        mkdir -p "$LOG_DIR"
-        API_LOG="${LOG_DIR}/api.log"
-        info "Building Vue SPA…"
-        (cd web && npm run build) >> "$API_LOG" 2>&1
-        info "Starting FastAPI on port ${API_PORT}…"
-        nohup "$PYTHON_UI" -m uvicorn app.api:app \
-            --host 0.0.0.0 --port "$API_PORT" \
-            >> "$API_LOG" 2>&1 &
-        echo $! > "$API_PID_FILE"
-        # Poll until port is actually bound (up to 10 s), not just process alive
-        for _i in $(seq 1 20); do
-            sleep 0.5
-            if (echo "" >/dev/tcp/127.0.0.1/"$API_PORT") 2>/dev/null; then
-                success "Avocet API started → http://localhost:${API_PORT}  (PID $(<"$API_PID_FILE"))"
-                break
-            fi
-            if ! kill -0 "$(<"$API_PID_FILE")" 2>/dev/null; then
-                rm -f "$API_PID_FILE"
-                error "API died during startup. Check ${API_LOG}"
-            fi
-        done
-        if ! (echo "" >/dev/tcp/127.0.0.1/"$API_PORT") 2>/dev/null; then
-            error "API did not bind to port ${API_PORT} within 10 s. Check ${API_LOG}"
-        fi
-        ;;
-
-    stop-api)
-        API_PID_FILE=".avocet-api.pid"
-        if [[ ! -f "$API_PID_FILE" ]]; then
-            warn "API not running."
-            exit 0
-        fi
-        PID="$(<"$API_PID_FILE")"
-        if kill -0 "$PID" 2>/dev/null; then
-            kill "$PID" && rm -f "$API_PID_FILE"
-            success "API stopped (PID ${PID})."
-        else
-            warn "Stale PID file (process ${PID} not running). Cleaning up."
-            rm -f "$API_PID_FILE"
-        fi
-        ;;
-
-    restart-api)
-        bash "$0" stop-api
-        exec bash "$0" start-api
-        ;;
-
-    open-api)
-        URL="http://localhost:8503"
-        info "Opening ${URL}"
-        if command -v xdg-open &>/dev/null; then
-            xdg-open "$URL"
-        elif command -v open &>/dev/null; then
-            open "$URL"
-        else
-            echo "$URL"
-        fi
-        ;;
-
     help|--help|-h)
         usage
         ;;
diff --git a/tests/test_label_tool.py b/tests/test_label_tool.py
index 7e5d257..d5d05ec 100644
--- a/tests/test_label_tool.py
+++ b/tests/test_label_tool.py
@@ -5,7 +5,7 @@ These functions are stdlib-only and safe to test without an IMAP connection.
 from email.mime.multipart import MIMEMultipart
 from email.mime.text import MIMEText
 
-from app.label_tool import _extract_body, _strip_html
+from app.utils import _extract_body, _strip_html
 
 
 # ── _strip_html ──────────────────────────────────────────────────────────────