Compare commits


2 Commits

Author   SHA1        Message                                          Date
shamoon  94a5af66eb  Fix default llama3.1                             2026-01-14 15:36:01 -08:00
shamoon  948c664dcf  Correct get_tool_calls_from_response signature   2026-01-14 14:55:03 -08:00
5 changed files with 317 additions and 455 deletions

docs/configuration.md

@@ -1873,7 +1873,7 @@ using the OpenAI API. This setting is required to be set to use the AI features.
 #### [`PAPERLESS_AI_LLM_MODEL=<str>`](#PAPERLESS_AI_LLM_MODEL) {#PAPERLESS_AI_LLM_MODEL}
 : The model to use for the AI backend, i.e. "gpt-3.5-turbo", "gpt-4" or any of the models supported by the
-  current backend. If not supplied, defaults to "gpt-3.5-turbo" for OpenAI and "llama3" for Ollama.
+  current backend. If not supplied, defaults to "gpt-3.5-turbo" for OpenAI and "llama3.1" for Ollama.
   Defaults to None.
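The one-word change above updates the documented Ollama default from "llama3" to "llama3.1", matching the code change to AIClient.get_llm further down. The documented fallback is simple to state in code; a minimal sketch of that behavior (the helper name and signature are hypothetical, not actual paperless-ngx settings code):

```python
def resolve_llm_model(backend: str, configured: str | None) -> str:
    # Hypothetical helper mirroring the documented fallback: an explicit
    # PAPERLESS_AI_LLM_MODEL value wins; otherwise use a per-backend default.
    if configured:
        return configured
    return "gpt-3.5-turbo" if backend == "openai" else "llama3.1"

assert resolve_llm_model("ollama", None) == "llama3.1"
assert resolve_llm_model("openai", None) == "gpt-3.5-turbo"
assert resolve_llm_model("openai", "gpt-4") == "gpt-4"
```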

pyproject.toml

@@ -28,7 +28,7 @@ dependencies = [
   # Only patch versions are guaranteed to not introduce breaking changes.
   "django~=5.2.5",
   "django-allauth[mfa,socialaccount]~=65.12.1",
-  "django-auditlog~=3.4.1",
+  "django-auditlog~=3.3.0",
   "django-cachalot~=2.8.0",
   "django-celery-results~=2.6.0",
   "django-compression-middleware~=0.5.0",
@@ -47,7 +47,7 @@ dependencies = [
   "faiss-cpu>=1.10",
   "filelock~=3.20.0",
   "flower~=2.0.1",
-  "gotenberg-client~=0.13.1",
+  "gotenberg-client~=0.12.0",
   "httpx-oauth~=0.16",
   "imap-tools~=1.11.0",
   "inotifyrecursive~=0.3",
@@ -60,7 +60,7 @@ dependencies = [
   "llama-index-llms-openai>=0.3.38",
   "llama-index-vector-stores-faiss>=0.3",
   "nltk~=3.9.1",
-  "ocrmypdf~=16.13.0",
+  "ocrmypdf~=16.12.0",
   "openai>=1.76",
   "pathvalidate~=3.3.1",
   "pdf2image~=1.17.0",
@@ -91,7 +91,7 @@ optional-dependencies.postgres = [
   "psycopg[c,pool]==3.2.12",
   # Direct dependency for proper resolution of the pre-built wheels
   "psycopg-c==3.2.12",
-  "psycopg-pool==3.3",
+  "psycopg-pool==3.2.7",
 ]
 optional-dependencies.webserver = [
   "granian[uvloop]~=2.5.1",
@@ -126,7 +126,7 @@ testing = [
 ]
 lint = [
-  "pre-commit~=4.5.1",
+  "pre-commit~=4.4.0",
   "pre-commit-uv~=4.2.0",
   "ruff~=0.14.0",
 ]
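Most of the pins above use PEP 440's compatible-release operator: `~=3.3.0` means `>=3.3.0, <3.4.0`, i.e. only patch releases are accepted, which is exactly what the "Only patch versions are guaranteed to not introduce breaking changes" comment in the file refers to. A quick way to check what a given specifier admits, using the `packaging` library (the reference implementation of PEP 440, used here for illustration):

```python
from packaging.specifiers import SpecifierSet

compatible = SpecifierSet("~=3.3.0")  # equivalent to >=3.3.0, <3.4.0
assert "3.3.5" in compatible          # patch releases are allowed
assert "3.4.0" not in compatible      # minor bumps are excluded

exact = SpecifierSet("==3.2.12")      # the psycopg pins admit one version only
assert "3.2.12" in exact
```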

src/paperless_ai/client.py

@@ -23,7 +23,7 @@ class AIClient:
     def get_llm(self) -> Ollama | OpenAI:
         if self.settings.llm_backend == "ollama":
             return Ollama(
-                model=self.settings.llm_model or "llama3",
+                model=self.settings.llm_model or "llama3.1",
                 base_url=self.settings.llm_endpoint or "http://localhost:11434",
                 request_timeout=120,
             )
@@ -52,7 +52,7 @@ class AIClient:
         )
         tool_calls = self.llm.get_tool_calls_from_response(
             result,
-            error_on_no_tool_calls=True,
+            error_on_no_tool_call=True,
         )
         logger.debug("LLM query result: %s", tool_calls)
         parsed = DocumentClassifierSchema(**tool_calls[0].tool_kwargs)
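The second hunk is the actual bug fix: llama-index's `FunctionCallingLLM.get_tool_calls_from_response` takes `error_on_no_tool_call` (singular), so the plural keyword is rejected with a `TypeError` before any classification happens. A minimal sketch of the corrected call pattern, assuming a running Ollama server and llama-index's function-calling API (the `classify` tool is a hypothetical stand-in, not paperless code):

```python
from llama_index.core.tools import FunctionTool
from llama_index.llms.ollama import Ollama

def classify(title: str, tags: list[str]) -> dict:
    """Hypothetical stand-in for the document classifier tool."""
    return {"title": title, "tags": tags}

tool = FunctionTool.from_defaults(fn=classify)
llm = Ollama(model="llama3.1", base_url="http://localhost:11434", request_timeout=120)

# Ask the model to call the tool, then extract the structured tool call.
response = llm.chat_with_tools([tool], user_msg="Classify this scanned invoice.")
tool_calls = llm.get_tool_calls_from_response(
    response,
    error_on_no_tool_call=True,  # singular keyword; raises if the model made no tool call
)
print(tool_calls[0].tool_kwargs)  # e.g. {"title": ..., "tags": [...]}
```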

paperless_ai chat tests

@@ -11,12 +11,14 @@ from paperless_ai.chat import stream_chat_with_documents
 @pytest.fixture(autouse=True)
 def patch_embed_model():
     from llama_index.core import settings as llama_settings
-    from llama_index.core.embeddings.utils import MockEmbedding

-    mock_embed_model = MockEmbedding(embed_dim=8)
-    llama_settings.Settings.embed_model = mock_embed_model
+    mock_embed_model = MagicMock()
+    mock_embed_model._get_text_embedding_batch.return_value = [
+        [0.1] * 1536,
+    ]  # 1 vector per input
+    llama_settings.Settings._embed_model = mock_embed_model
     yield
-    llama_settings.Settings.embed_model = None
+    llama_settings.Settings._embed_model = None

 @pytest.fixture(autouse=True)
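Note that the replacement fixture stubs llama-index at a private seam: `_get_text_embedding_batch` and `Settings._embed_model` are internal attributes observed in the diff, not documented API, so the mock can break across llama-index upgrades. Also, a fixed `return_value` of one vector only suits a single-text batch; a `side_effect` generalizes it. A standalone sketch of that variant (same assumptions about the private attributes as the diff):

```python
from unittest.mock import MagicMock

from llama_index.core import settings as llama_settings

def install_fake_embed_model(dim: int = 1536) -> MagicMock:
    # Relies on llama-index internals seen in the diff; may break on upgrades.
    fake = MagicMock()
    fake._get_text_embedding_batch.side_effect = lambda texts, **kwargs: [
        [0.1] * dim for _ in texts  # one constant vector per input text
    ]
    llama_settings.Settings._embed_model = fake
    return fake
```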

uv.lock (generated) — 746 changed lines; file diff suppressed because it is too large.