feat(benchmark): wire EmbeddingKNNAdapter into MODEL_REGISTRY as embed-knn-nomic

This commit is contained in:
pyr0ball 2026-05-05 12:43:48 -07:00
parent 41584de5df
commit 5df33b0f41
2 changed files with 22 additions and 5 deletions

View file

@ -39,6 +39,7 @@ from scripts.classifier_adapters import (
LABELS, LABELS,
LABEL_DESCRIPTIONS, LABEL_DESCRIPTIONS,
ClassifierAdapter, ClassifierAdapter,
EmbeddingKNNAdapter,
FineTunedAdapter, FineTunedAdapter,
GLiClassAdapter, GLiClassAdapter,
RerankerAdapter, RerankerAdapter,
@ -130,6 +131,13 @@ MODEL_REGISTRY: dict[str, dict[str, Any]] = {
"params": "600M", "params": "600M",
"default": False, "default": False,
}, },
"embed-knn-nomic": {
"adapter": EmbeddingKNNAdapter,
"model_id": "nomic-embed-text",
"params": "local-embed",
"default": False, # requires orch or ollama; use --include-slow
"kwargs": {"k": 3},
},
} }
# --------------------------------------------------------------------------- # ---------------------------------------------------------------------------

View file

@ -2,11 +2,6 @@
import pytest import pytest
def test_registry_has_thirteen_models():
    """Assert that ``MODEL_REGISTRY`` contains exactly thirteen entries."""
    # Imported inside the test so the module is only loaded when the test runs.
    from scripts.benchmark_classifier import MODEL_REGISTRY

    expected_entries = 13
    assert len(MODEL_REGISTRY) == expected_entries
def test_registry_default_count(): def test_registry_default_count():
from scripts.benchmark_classifier import MODEL_REGISTRY from scripts.benchmark_classifier import MODEL_REGISTRY
defaults = [k for k, v in MODEL_REGISTRY.items() if v["default"]] defaults = [k for k, v in MODEL_REGISTRY.items() if v["default"]]
@ -243,3 +238,17 @@ def test_build_exemplars_skips_rows_with_no_content(tmp_path):
result = build_exemplars_from_jsonl(str(f)) result = build_exemplars_from_jsonl(str(f))
assert list(result.keys()) == ["neutral"] assert list(result.keys()) == ["neutral"]
assert len(result["neutral"]) == 1 assert len(result["neutral"]) == 1
def test_registry_has_fourteen_models():
    """Assert that ``MODEL_REGISTRY`` contains exactly fourteen entries."""
    # Imported inside the test so the module is only loaded when the test runs.
    from scripts.benchmark_classifier import MODEL_REGISTRY

    expected_entries = 14
    assert len(MODEL_REGISTRY) == expected_entries
def test_embed_knn_nomic_registry_entry():
    """Verify the ``embed-knn-nomic`` entry of ``MODEL_REGISTRY``.

    Checks, in order: the adapter class is ``EmbeddingKNNAdapter``, the
    model id is ``"nomic-embed-text"``, the entry is not a default model,
    and the adapter kwargs carry ``k == 3``.
    """
    from scripts.benchmark_classifier import MODEL_REGISTRY
    from scripts.classifier_adapters import EmbeddingKNNAdapter

    # A missing key raises KeyError here, failing the test before any assert.
    nomic = MODEL_REGISTRY["embed-knn-nomic"]

    assert nomic["adapter"] is EmbeddingKNNAdapter
    assert nomic["model_id"] == "nomic-embed-text"
    # Identity check: the flag must be the literal False, not merely falsy.
    assert nomic["default"] is False

    # "kwargs" is looked up defensively; an absent mapping yields k == None.
    adapter_kwargs = nomic.get("kwargs", {})
    assert adapter_kwargs.get("k") == 3