Skip to content

Commit fef86b7

Browse files
committed
better chunks
1 parent 548fe29 commit fef86b7

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

src/doc_builder/build_embeddings.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -30,7 +30,7 @@
30 30
from .convert_md_to_mdx import process_md
31 31
from .convert_rst_to_mdx import find_indent, is_empty_line
32 32
from .meilisearch_helper import add_embeddings_to_db, create_embedding_db, delete_embedding_db, swap_indexes
33-
from .utils import read_doc_config
33+
from .utils import chunk_list, read_doc_config
34 34

35 35

36 36
Chunk = namedtuple("Chunk", "text source package_name")
@@ -462,7 +462,8 @@ def build_embeddings(
462 462

463 463
# Step 3: push embeddings to vector database (meilisearch)
464 464
client = meilisearch.Client("https://edge.meilisearch.com", meilisearch_key)
465-
add_embeddings_to_db(client, MEILI_INDEX_TEMP, embeddings)
465+
for chunk_embeddings in tqdm(chunk_list(embeddings), desc="Uploading data to meilisearch"):
466+
add_embeddings_to_db(client, MEILI_INDEX_TEMP, chunk_embeddings)
466 467

467 468

468 469
def clean_meilisearch(meilisearch_key: str):

0 commit comments

Comments
 (0)