
Commit c35a20d

Set indexing error when embedding model returns incorrect number of embeddings (#321)
* Raise error when embeddings and text chunks don't match
* Elaborate on error message
1 parent 464d8d7 · commit c35a20d

File tree: 1 file changed (+8 −2 lines)


llm-service/app/ai/indexing/embedding_indexer.py

Lines changed: 8 additions & 2 deletions
@@ -130,6 +130,12 @@ def _compute_embeddings(
         logger.debug(f"Waiting for {len(futures)} futures")
         for future in as_completed(futures):
             i, batch_embeddings = future.result()
-            for chunk, embedding in zip(batched_chunks[i], batch_embeddings):
+            batch_chunks = batched_chunks[i]
+            if len(batch_chunks) != len(batch_embeddings):
+                raise ValueError(
+                    f"Expected {len(batch_chunks)} embedding vectors for this batch of chunks,"
+                    + f" but got {len(batch_embeddings)} from {self.embedding_model.model_name}"
+                )
+            for chunk, embedding in zip(batch_chunks, batch_embeddings):
                 chunk.embedding = embedding
-            yield batched_chunks[i]
+            yield batch_chunks
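
A minimal, self-contained sketch of the behavior this guard introduces. Chunk, FakeEmbeddingModel, and embed_batches below are hypothetical stand-ins, not the repository's classes; the real check runs inside _compute_embeddings against the configured embedding model and a thread pool.

    # Sketch only: demonstrates the mismatch check, not the actual indexer code.
    from dataclasses import dataclass
    from typing import Iterator, List, Optional


    @dataclass
    class Chunk:
        text: str
        embedding: Optional[List[float]] = None


    class FakeEmbeddingModel:
        """Stand-in model that drops one vector to simulate a misbehaving backend."""

        model_name = "fake-embedder"

        def embed(self, texts: List[str]) -> List[List[float]]:
            # Returns one embedding too few on purpose.
            return [[0.0, 1.0] for _ in texts[:-1]]


    def embed_batches(
        batched_chunks: List[List[Chunk]], model: FakeEmbeddingModel
    ) -> Iterator[List[Chunk]]:
        for batch_chunks in batched_chunks:
            batch_embeddings = model.embed([c.text for c in batch_chunks])
            # The guard added by this commit: fail loudly on a count mismatch.
            if len(batch_chunks) != len(batch_embeddings):
                raise ValueError(
                    f"Expected {len(batch_chunks)} embedding vectors for this batch of chunks,"
                    f" but got {len(batch_embeddings)} from {model.model_name}"
                )
            for chunk, embedding in zip(batch_chunks, batch_embeddings):
                chunk.embedding = embedding
            yield batch_chunks


    if __name__ == "__main__":
        batches = [[Chunk("a"), Chunk("b"), Chunk("c")]]
        try:
            list(embed_batches(batches, FakeEmbeddingModel()))
        except ValueError as err:
            print(err)  # Expected 3 embedding vectors ... but got 2 from fake-embedder

Without the check, zip() silently truncates to the shorter sequence, so a short embedding response could leave some chunks indexed with no embedding and the problem would only surface later, if at all.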
