git.ipfire.org Git - thirdparty/paperless-ngx.git/commitdiff
Create llmindex if it doesn't exist on update run
author shamoon <4887959+shamoon@users.noreply.github.com>
Wed, 30 Apr 2025 02:25:39 +0000 (19:25 -0700)
committer shamoon <4887959+shamoon@users.noreply.github.com>
Wed, 2 Jul 2025 18:04:03 +0000 (11:04 -0700)
src/paperless_ai/indexing.py

index 3eb554c75a21b55b854ab3309692b3de52c36b05..afc0abb460b39d9056c6d65889d6f84511fb0c80 100644 (file)
@@ -1,5 +1,6 @@
 import logging
 import shutil
+from pathlib import Path
 
 import faiss
 import llama_index.core.settings as llama_settings
@@ -125,11 +126,15 @@ def update_llm_index(*, progress_bar_disable=False, rebuild=False):
         logger.warning("No documents found to index.")
         return
 
-    if rebuild:
+    if (
+        rebuild
+        or not Path(settings.LLM_INDEX_DIR / "default__vector_store.json").exists()
+    ):
+        # Rebuild index from scratch
+        logger.info("Rebuilding LLM index.")
         embed_model = get_embedding_model()
         llama_settings.Settings.embed_model = embed_model
-        storage_context = get_or_create_storage_context(rebuild=rebuild)
-        # Rebuild index from scratch
+        storage_context = get_or_create_storage_context(rebuild=True)
         for document in tqdm.tqdm(documents, disable=progress_bar_disable):
             document_nodes = build_document_node(document)
             nodes.extend(document_nodes)