From 51a7581860400a9248556b76edc9b5b38865bb76 Mon Sep 17 00:00:00 2001 From: shamoon <4887959+shamoon@users.noreply.github.com> Date: Tue, 29 Apr 2025 19:25:39 -0700 Subject: [PATCH] Create LLM index if it doesn't exist on update run --- src/paperless_ai/indexing.py | 11 ++++++++--- 1 file changed, 8 insertions(+), 3 deletions(-) diff --git a/src/paperless_ai/indexing.py b/src/paperless_ai/indexing.py index 3eb554c75..afc0abb46 100644 --- a/src/paperless_ai/indexing.py +++ b/src/paperless_ai/indexing.py @@ -1,5 +1,6 @@ import logging import shutil +from pathlib import Path import faiss import llama_index.core.settings as llama_settings @@ -125,11 +126,15 @@ def update_llm_index(*, progress_bar_disable=False, rebuild=False): logger.warning("No documents found to index.") return - if rebuild: + if ( + rebuild + or not Path(settings.LLM_INDEX_DIR / "default__vector_store.json").exists() + ): + # Rebuild index from scratch + logger.info("Rebuilding LLM index.") embed_model = get_embedding_model() llama_settings.Settings.embed_model = embed_model - storage_context = get_or_create_storage_context(rebuild=rebuild) - # Rebuild index from scratch + storage_context = get_or_create_storage_context(rebuild=True) for document in tqdm.tqdm(documents, disable=progress_bar_disable): document_nodes = build_document_node(document) nodes.extend(document_nodes)