Skip to content

Commit 9e5acab

Browse files
committed
init
1 parent fb8f5fc commit 9e5acab

File tree

2 files changed

2 additions and 28 deletions

2 files changed

2 additions and 28 deletions

src/api/routers/rerank.py

Lines changed: 2 additions & 22 deletions
Original file line numberDiff line numberDiff line change
@@ -62,11 +62,8 @@ async def rerank_documents(
6262
)
6363

6464
try:
65-
# Extract kwargs but exclude rerank-specific fields
6665
kwargs = extract_embedding_kwargs(request)
6766

68-
# Remove fields that are already passed as positional arguments
69-
# to avoid "got multiple values for argument" error
7067
kwargs.pop("query", None)
7168
kwargs.pop("documents", None)
7269
kwargs.pop("top_k", None)
@@ -80,19 +77,10 @@ async def rerank_documents(
8077
detail=f"Model '{request.model_id}' is not a rerank model. Type: {config.type}",
8178
)
8279

83-
# Debug logs BEFORE calling rank_document
84-
logger.debug(f"Rerank request - Query: '{request.query}'")
85-
logger.debug(f"Documents to rank: {len(valid_docs)}")
86-
if valid_docs:
87-
logger.debug(f"First document: {valid_docs[0][1][:100]}...")
88-
logger.debug(f"Top K: {request.top_k}")
89-
9080
start = time.time()
9181

92-
# Extract documents for ranking
9382
documents_list = [doc for _, doc in valid_docs]
94-
95-
# Call rank_document - returns only top_k results
83+
9684
ranking_results = model.rank_document(
9785
query=request.query,
9886
documents=documents_list,
@@ -102,18 +90,10 @@ async def rerank_documents(
10290

10391
processing_time = time.time() - start
10492

105-
# Debug logs AFTER rank_document
106-
logger.debug(f"Ranking returned {len(ranking_results)} results")
107-
if ranking_results:
108-
logger.debug(f"Top result score: {ranking_results[0]}")
109-
110-
# Build results from ranking_results
111-
# ranking_results already contains top_k items with scores
11293
results = []
11394

11495
for rank_result in ranking_results:
115-
# Get original index from valid_docs
116-
doc_idx = rank_result.get('corpus_id', 0) # Index in filtered list
96+
doc_idx = rank_result.get('corpus_id', 0)
11797
if doc_idx < len(valid_docs):
11898
original_idx = valid_docs[doc_idx][0] # Original index
11999
doc_text = documents_list[doc_idx]

src/models/embeddings/rank.py

Lines changed: 0 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -115,8 +115,6 @@ def rank_document(
115115
self.load()
116116

117117
try:
118-
# model.rank returns List[Dict] with 'corpus_id' and 'score'
119-
# Already sorted by score (highest first) and limited to top_k
120118
ranking_results = self.model.rank(
121119
query,
122120
documents,
@@ -157,14 +155,11 @@ def _normalize_rerank_scores(
157155
if not rankings:
158156
return []
159157

160-
# Extract raw scores
161158
raw_scores = [ranking["score"] for ranking in rankings]
162159

163-
# Min-Max normalization
164160
min_score = min(raw_scores)
165161
max_score = max(raw_scores)
166162

167-
# If all scores are the same, return max target value
168163
if max_score == min_score:
169164
return [
170165
{
@@ -174,7 +169,6 @@ def _normalize_rerank_scores(
174169
for r in rankings
175170
]
176171

177-
# Normalize to target range
178172
target_min, target_max = target_range
179173
normalized_rankings = []
180174

0 commit comments

Comments (0)