feat(benchmark): wire EmbeddingKNNAdapter into MODEL_REGISTRY as embed-knn-nomic
This commit is contained in:
parent
41584de5df
commit
5df33b0f41
2 changed files with 22 additions and 5 deletions
|
|
@ -39,6 +39,7 @@ from scripts.classifier_adapters import (
|
||||||
LABELS,
|
LABELS,
|
||||||
LABEL_DESCRIPTIONS,
|
LABEL_DESCRIPTIONS,
|
||||||
ClassifierAdapter,
|
ClassifierAdapter,
|
||||||
|
EmbeddingKNNAdapter,
|
||||||
FineTunedAdapter,
|
FineTunedAdapter,
|
||||||
GLiClassAdapter,
|
GLiClassAdapter,
|
||||||
RerankerAdapter,
|
RerankerAdapter,
|
||||||
|
|
@ -130,6 +131,13 @@ MODEL_REGISTRY: dict[str, dict[str, Any]] = {
|
||||||
"params": "600M",
|
"params": "600M",
|
||||||
"default": False,
|
"default": False,
|
||||||
},
|
},
|
||||||
|
"embed-knn-nomic": {
|
||||||
|
"adapter": EmbeddingKNNAdapter,
|
||||||
|
"model_id": "nomic-embed-text",
|
||||||
|
"params": "local-embed",
|
||||||
|
"default": False, # requires orch or ollama; use --include-slow
|
||||||
|
"kwargs": {"k": 3},
|
||||||
|
},
|
||||||
}
|
}
|
||||||
|
|
||||||
# ---------------------------------------------------------------------------
|
# ---------------------------------------------------------------------------
|
||||||
|
|
|
||||||
|
|
@ -2,11 +2,6 @@
|
||||||
import pytest
|
import pytest
|
||||||
|
|
||||||
|
|
||||||
def test_registry_has_thirteen_models():
|
|
||||||
from scripts.benchmark_classifier import MODEL_REGISTRY
|
|
||||||
assert len(MODEL_REGISTRY) == 13
|
|
||||||
|
|
||||||
|
|
||||||
def test_registry_default_count():
|
def test_registry_default_count():
|
||||||
from scripts.benchmark_classifier import MODEL_REGISTRY
|
from scripts.benchmark_classifier import MODEL_REGISTRY
|
||||||
defaults = [k for k, v in MODEL_REGISTRY.items() if v["default"]]
|
defaults = [k for k, v in MODEL_REGISTRY.items() if v["default"]]
|
||||||
|
|
@ -243,3 +238,17 @@ def test_build_exemplars_skips_rows_with_no_content(tmp_path):
|
||||||
result = build_exemplars_from_jsonl(str(f))
|
result = build_exemplars_from_jsonl(str(f))
|
||||||
assert list(result.keys()) == ["neutral"]
|
assert list(result.keys()) == ["neutral"]
|
||||||
assert len(result["neutral"]) == 1
|
assert len(result["neutral"]) == 1
|
||||||
|
|
||||||
|
def test_registry_has_fourteen_models():
|
||||||
|
from scripts.benchmark_classifier import MODEL_REGISTRY
|
||||||
|
assert len(MODEL_REGISTRY) == 14
|
||||||
|
|
||||||
|
|
||||||
|
def test_embed_knn_nomic_registry_entry():
|
||||||
|
from scripts.benchmark_classifier import MODEL_REGISTRY
|
||||||
|
from scripts.classifier_adapters import EmbeddingKNNAdapter
|
||||||
|
entry = MODEL_REGISTRY["embed-knn-nomic"]
|
||||||
|
assert entry["adapter"] is EmbeddingKNNAdapter
|
||||||
|
assert entry["model_id"] == "nomic-embed-text"
|
||||||
|
assert entry["default"] is False
|
||||||
|
assert entry.get("kwargs", {}).get("k") == 3
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue