From: shamoon <4887959+shamoon@users.noreply.github.com> Date: Wed, 30 Apr 2025 02:25:39 +0000 (-0700) Subject: Create llmindex if doesn't exist on update run X-Git-Url: http://git.ipfire.org/cgi-bin/gitweb.cgi?a=commitdiff_plain;h=84e17535fce78124259c940080e0a6a8829c9f3b;p=thirdparty%2Fpaperless-ngx.git Create llmindex if doesn't exist on update run --- diff --git a/src/paperless_ai/indexing.py b/src/paperless_ai/indexing.py index 3eb554c75..afc0abb46 100644 --- a/src/paperless_ai/indexing.py +++ b/src/paperless_ai/indexing.py @@ -1,5 +1,6 @@ import logging import shutil +from pathlib import Path import faiss import llama_index.core.settings as llama_settings @@ -125,11 +126,15 @@ def update_llm_index(*, progress_bar_disable=False, rebuild=False): logger.warning("No documents found to index.") return - if rebuild: + if ( + rebuild + or not Path(settings.LLM_INDEX_DIR / "default__vector_store.json").exists() + ): + # Rebuild index from scratch + logger.info("Rebuilding LLM index.") embed_model = get_embedding_model() llama_settings.Settings.embed_model = embed_model - storage_context = get_or_create_storage_context(rebuild=rebuild) - # Rebuild index from scratch + storage_context = get_or_create_storage_context(rebuild=True) for document in tqdm.tqdm(documents, disable=progress_bar_disable): document_nodes = build_document_node(document) nodes.extend(document_nodes)