From b3fe444ae9e1b52e213040a95b42a3713eb43d55 Mon Sep 17 00:00:00 2001 From: James Briggs <35938317+jamescalam@users.noreply.github.com> Date: Fri, 1 Dec 2023 23:34:23 -0800 Subject: [PATCH] fixed bm25 encoder --- semantic_router/encoders/bm25.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/semantic_router/encoders/bm25.py b/semantic_router/encoders/bm25.py index c419ac8f..0f3985be 100644 --- a/semantic_router/encoders/bm25.py +++ b/semantic_router/encoders/bm25.py @@ -23,14 +23,14 @@ class BM25Encoder(BaseEncoder): else: raise ValueError("No documents to encode.") # convert sparse dict to sparse vector - embeds = [0.0] * len(self.idx_mapping) - for output in sparse_dicts: + embeds = [[0.0] * len(self.idx_mapping)] * len(docs) + for i, output in enumerate(sparse_dicts): indices = output["indices"] values = output["values"] for idx, val in zip(indices, values): if idx in self.idx_mapping: position = self.idx_mapping[idx] - embeds[position] = val + embeds[i][position] = val else: print(idx, "not in encoder.idx_mapping") return embeds -- GitLab