Coverage for src / lilbee / data / store / ranking.py: 100%
39 statements
« prev ^ index » next coverage.py v7.13.4, created at 2026-06-28 01:01 +0000
« prev ^ index » next coverage.py v7.13.4, created at 2026-06-28 01:01 +0000
1"""Vector ranking primitives: cosine similarity and Maximal Marginal Relevance reranking."""
3from __future__ import annotations
5import numpy as np
7from lilbee.core.config import cfg
9from .types import SearchChunk
12def cosine_sim(a: list[float], b: list[float]) -> float:
13 """Cosine similarity between two vectors."""
14 arr_a = np.asarray(a, dtype=np.float64)
15 arr_b = np.asarray(b, dtype=np.float64)
16 norm_a = float(np.linalg.norm(arr_a))
17 norm_b = float(np.linalg.norm(arr_b))
18 if norm_a == 0.0 or norm_b == 0.0:
19 return 0.0
20 return float(np.dot(arr_a, arr_b) / (norm_a * norm_b))
23def mmr_rerank(
24 query_vector: list[float],
25 results: list[SearchChunk],
26 top_k: int,
27 mmr_lambda: float | None = None,
28) -> list[SearchChunk]:
29 """Maximal Marginal Relevance: select diverse results.
30 Algorithm: Carbonell & Goldstein 1998,
31 "The Use of MMR, Diversity-Based Reranking for Reordering Documents
32 and Producing Summaries."
34 ``mmr_lambda`` controls the relevance/diversity tradeoff:
35 0.0 = maximum diversity, 1.0 = pure relevance.
36 Defaults to ``cfg.mmr_lambda`` (0.5).
38 Complexity: O(top_k · N · D) time, O(N · D) space for N candidates
39 of dimension D. Each outer iteration updates a running max-redundancy
40 vector via one matmul rather than recomputing pairs pairwise.
41 Candidate vectors run through numpy in ``float32``, which can pick a
42 different candidate than the pure-Python ``float64`` loop on
43 ties within ~1e-7; distinct in principle, unobservable in practice
44 since sub-float32 differences are below retrieval signal.
45 """
46 if mmr_lambda is None:
47 mmr_lambda = cfg.mmr_lambda
48 if len(results) <= top_k:
49 return results
51 candidate_vecs = np.asarray([r.vector for r in results], dtype=np.float32)
52 query = np.asarray(query_vector, dtype=np.float32)
53 # L2-normalize once so cosine becomes a plain dot product.
54 cand_norms = np.linalg.norm(candidate_vecs, axis=1, keepdims=True)
55 cand_norms[cand_norms == 0] = 1.0
56 cand_unit = candidate_vecs / cand_norms
57 query_norm = float(np.linalg.norm(query)) or 1.0
58 query_unit = query / query_norm
60 relevance = cand_unit @ query_unit # shape (N,)
62 n = len(results)
63 max_redundancy = np.zeros(n, dtype=np.float32)
64 available = np.ones(n, dtype=bool)
65 selected: list[SearchChunk] = []
67 for picks in range(top_k):
68 redundancy_term = max_redundancy if picks > 0 else np.zeros(n, dtype=np.float32)
69 score = mmr_lambda * relevance - (1.0 - mmr_lambda) * redundancy_term
70 # Mask already-picked candidates so argmax skips them.
71 score = np.where(available, score, -np.inf)
72 best = int(np.argmax(score))
73 selected.append(results[best])
74 available[best] = False
75 # Update running max redundancy against the newly-selected vector.
76 similarity = cand_unit @ cand_unit[best]
77 max_redundancy = np.maximum(max_redundancy, similarity)
79 return selected